fix data generation

This commit is contained in:
Torben Haack 2024-11-11 07:01:32 +01:00
parent 2b92bbf9f5
commit 6b5be5696d
No known key found for this signature in database
2 changed files with 358 additions and 732 deletions

View File

@ -1,257 +1,231 @@
"use strict"; const sqlite3 = require("sqlite3");
var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, generator) { const faker = require("@faker-js/faker").faker;
function adopt(value) { return value instanceof P ? value : new P(function (resolve) { resolve(value); }); } const { random, sample, sampleSize, sum } = require("lodash");
return new (P || (P = Promise))(function (resolve, reject) { const { DateTime } = require("luxon");
function fulfilled(value) { try { step(generator.next(value)); } catch (e) { reject(e); } } const { open } = require("sqlite");
function rejected(value) { try { step(generator["throw"](value)); } catch (e) { reject(e); } } const { v4: uuidv4 } = require("uuid");
function step(result) { result.done ? resolve(result.value) : adopt(result.value).then(fulfilled, rejected); }
step((generator = generator.apply(thisArg, _arguments || [])).next()); const dbPath = "./db/sqlite.db";
});
}; // Configuration for test data generation
var __generator = (this && this.__generator) || function (thisArg, body) { let startDate = DateTime.fromISO("2024-10-08");
var _ = { label: 0, sent: function() { if (t[0] & 1) throw t[1]; return t[1]; }, trys: [], ops: [] }, f, y, t, g = Object.create((typeof Iterator === "function" ? Iterator : Object).prototype); let endDate = DateTime.fromISO("2024-11-08");
return g.next = verb(0), g["throw"] = verb(1), g["return"] = verb(2), typeof Symbol === "function" && (g[Symbol.iterator] = function() { return this; }), g; let numberOfPrinters = 5;
function verb(n) { return function (v) { return step([n, v]); }; }
function step(op) { // Use weekday names for better readability and ease of setting trends
if (f) throw new TypeError("Generator is already executing."); let avgPrintTimesPerDay = {
while (g && (g = 0, op[0] && (_ = 0)), _) try { Monday: 4,
if (f = 1, y && (t = op[0] & 2 ? y["return"] : op[0] ? y["throw"] || ((t = y["return"]) && t.call(y), 0) : y.next) && !(t = t.call(y, op[1])).done) return t; Tuesday: 2,
if (y = 0, t) op = [op[0] & 2, t.value]; Wednesday: 5,
switch (op[0]) { Thursday: 2,
case 0: case 1: t = op; break; Friday: 3,
case 4: _.label++; return { value: op[1], done: false }; Saturday: 0,
case 5: _.label++; y = op[1]; op = [0]; continue; Sunday: 0,
case 7: op = _.ops.pop(); _.trys.pop(); continue; }; // Average number of prints for each weekday
default:
if (!(t = _.trys, t = t.length > 0 && t[t.length - 1]) && (op[0] === 6 || op[0] === 2)) { _ = 0; continue; } let avgPrintDurationPerDay = {
if (op[0] === 3 && (!t || (op[1] > t[0] && op[1] < t[3]))) { _.label = op[1]; break; } Monday: 240, // Total average duration in minutes for Monday
if (op[0] === 6 && _.label < t[1]) { _.label = t[1]; t = op; break; } Tuesday: 30,
if (t && _.label < t[2]) { _.label = t[2]; _.ops.push(op); break; } Wednesday: 45,
if (t[2]) _.ops.pop(); Thursday: 40,
_.trys.pop(); continue; Friday: 120,
} Saturday: 0,
op = body.call(thisArg, _); Sunday: 0,
} catch (e) { op = [6, e]; y = 0; } finally { f = t = 0; } }; // Average total duration of prints for each weekday
if (op[0] & 5) throw op[1]; return { value: op[0] ? op[1] : void 0, done: true };
} let printerUsage = {
}; "Drucker 1": 0.5,
var __spreadArray = (this && this.__spreadArray) || function (to, from, pack) { "Drucker 2": 0.7,
if (pack || arguments.length === 2) for (var i = 0, l = from.length, ar; i < l; i++) { "Drucker 3": 0.6,
if (ar || !(i in from)) { "Drucker 4": 0.3,
if (!ar) ar = Array.prototype.slice.call(from, 0, i); "Drucker 5": 0.4,
ar[i] = from[i]; }; // Usage percentages for each printer
}
} // **New Configurations for Error Rates**
return to.concat(ar || Array.prototype.slice.call(from)); let generalErrorRate = 0.05; // 5% chance any print job may fail
}; let printerErrorRates = {
Object.defineProperty(exports, "__esModule", { value: true }); "Drucker 1": 0.02, // 2% error rate for Printer 1
var sqlite3 = require("sqlite3"); "Drucker 2": 0.03,
var faker_1 = require("@faker-js/faker"); "Drucker 3": 0.01,
var lodash_1 = require("lodash"); "Drucker 4": 0.05,
var luxon_1 = require("luxon"); "Drucker 5": 0.04,
var sqlite_1 = require("sqlite"); }; // Error rates for each printer
var uuid_1 = require("uuid");
var dbPath = "./db/sqlite.db"; const holidays = []; // Example holidays
// Configurations for test data generation const existingJobs = [];
var startDate = luxon_1.DateTime.fromISO("2024-11-01");
var endDate = luxon_1.DateTime.fromISO("2024-11-30"); const initDB = async () => {
var holidays = []; // Example holidays
var existingJobs = [];
// Calendar week usage configs
var weekUsage = {
44: { minJobs: 4, maxJobs: 6 },
45: { minJobs: 10, maxJobs: 15 },
46: { minJobs: 10, maxJobs: 15 },
47: { minJobs: 3, maxJobs: 5 },
48: { minJobs: 10, maxJobs: 15 },
};
var printerUsageBias = {
fastPrints: ["Printer A", "Printer B"],
largePrints: ["Printer C", "Printer D", "Printer E"],
};
var initDB = function () { return __awaiter(void 0, void 0, void 0, function () {
return __generator(this, function (_a) {
console.log("Initializing database connection..."); console.log("Initializing database connection...");
return [2 /*return*/, (0, sqlite_1.open)({ return open({
filename: dbPath, filename: dbPath,
driver: sqlite3.Database, driver: sqlite3.Database,
})];
}); });
}); }; };
var createUser = function (isPowerUser) {
if (isPowerUser === void 0) { isPowerUser = false; } const createUser = (isPowerUser = false) => {
var name = [faker_1.faker.person.firstName(), faker_1.faker.person.lastName()]; const name = [faker.person.firstName(), faker.person.lastName()];
var user = {
id: (0, uuid_1.v4)(), const user = {
github_id: faker_1.faker.number.int(), id: uuidv4(),
username: "".concat(name[0].slice(0, 2)).concat(name[1].slice(0, 6)).toUpperCase(), github_id: faker.number.int(),
displayName: "".concat(name[0], " ").concat(name[1]).toUpperCase(), username: `${name[0].slice(0, 2)}${name[1].slice(0, 6)}`.toUpperCase(),
email: "".concat(name[0], ".").concat(name[1], "@mercedes-benz.com"), displayName: `${name[0]} ${name[1]}`.toUpperCase(),
role: (0, lodash_1.sample)(["user", "admin"]), email: `${name[0]}.${name[1]}@example.com`,
isPowerUser: isPowerUser, role: sample(["user", "admin"]),
isPowerUser,
}; };
console.log("Created user:", user); console.log("Created user:", user);
return user; return user;
}; };
var createPrinter = function () {
var printer = { const createPrinter = (index) => {
id: (0, uuid_1.v4)(), const printer = {
name: "Printer ".concat(faker_1.faker.number.int({ max: 9 })), id: uuidv4(),
description: faker_1.faker.lorem.sentence(), name: `Drucker ${index}`,
status: (0, lodash_1.random)(0, 2), description: faker.lorem.sentence(),
status: random(0, 2),
}; };
console.log("Created printer:", printer); console.log("Created printer:", printer);
return printer; return printer;
}; };
var isPrinterAvailable = function (printer, startAt, duration) {
var endAt = startAt + duration * 60 * 1000; // Convert minutes to milliseconds const isPrinterAvailable = (printer, startAt, duration) => {
return !existingJobs.some(function (job) { const endAt = startAt + duration * 60 * 1000; // Convert minutes to milliseconds
var jobStart = job.startAt; return !existingJobs.some((job) => {
var jobEnd = job.startAt + job.durationInMinutes * 60 * 1000; const jobStart = job.startAt;
return (printer.id === job.printerId && const jobEnd = job.startAt + job.durationInMinutes * 60 * 1000;
return (
printer.id === job.printerId &&
((startAt >= jobStart && startAt < jobEnd) || ((startAt >= jobStart && startAt < jobEnd) ||
(endAt > jobStart && endAt <= jobEnd) || (endAt > jobStart && endAt <= jobEnd) ||
(startAt <= jobStart && endAt >= jobEnd))); (startAt <= jobStart && endAt >= jobEnd))
);
}); });
}; };
var weightedSampleUser = function (users) {
var weights = users.map(function (user) { return (user.isPowerUser ? 3 : 1); }); const createPrintJob = (users, printers, startAt, duration) => {
var weightedUsers = users.flatMap(function (user, index) { return Array(weights[index]).fill(user); }); const user = sample(users);
return (0, lodash_1.sample)(weightedUsers); let printer;
};
var normalRandom = function (mean, stdDev) { // Weighted selection based on printer usage
var u = 0; const printerNames = Object.keys(printerUsage);
var v = 0; const weightedPrinters = printers.filter((p) => printerNames.includes(p.name));
while (u === 0)
u = Math.random(); // Create a weighted array of printers based on usage percentages
while (v === 0) const printerWeights = weightedPrinters.map((p) => ({
v = Math.random(); printer: p,
return mean + stdDev * Math.sqrt(-2 * Math.log(u)) * Math.cos(2 * Math.PI * v); weight: printerUsage[p.name],
}; }));
var createPrintJob = function (users, printers, startAt) {
var user = weightedSampleUser(users); const totalWeight = sum(printerWeights.map((pw) => pw.weight));
var printer; const randomWeight = Math.random() * totalWeight;
// Probabilistic determination for large prints let accumulatedWeight = 0;
var isLargePrint = (0, lodash_1.random)(0, 100) < 30; // 30% chance for a large print for (const pw of printerWeights) {
if (isLargePrint) { accumulatedWeight += pw.weight;
printer = (0, lodash_1.sample)(printers.filter(function (p) { return printerUsageBias.largePrints.includes(p.name); })); if (randomWeight <= accumulatedWeight) {
printer = pw.printer;
break;
} }
else {
printer = (0, lodash_1.sample)(printers.filter(function (p) { return printerUsageBias.fastPrints.includes(p.name); }));
} }
if (!printer) { if (!printer) {
printer = (0, lodash_1.sample)(printers); printer = sample(printers);
} }
// Variable duration for print jobs with realistic limits
var duration = Math.round(normalRandom(isLargePrint ? 240 : 75, 30));
var minDuration = 15;
var maxDuration = isLargePrint ? 5760 : 3540; // Maximum duration of 96 hours or 59 minutes in minutes
if (isLargePrint) {
duration = Math.min(duration, maxDuration);
}
duration = Math.max(duration, minDuration);
duration = Math.min(duration, maxDuration);
// Ensure printer availability
if (!isPrinterAvailable(printer, startAt, duration)) { if (!isPrinterAvailable(printer, startAt, duration)) {
console.log("Printer not available, skipping job creation."); console.log("Printer not available, skipping job creation.");
return null; return null;
} }
// Dynamic error probability based on printer status, duration, and other factors
var aborted = false; // **Determine if the job should be aborted based on error rates**
var abortReason = null; let aborted = false;
var baseErrorRate = Math.max(0, Math.min(5, 100)); // Ensure error rate is between 0% and 100% let abortReason = null;
var userErrorModifier = user.isPowerUser ? -2 : 2; // Power users make fewer errors
var timeErrorModifier = startAt >= luxon_1.DateTime.fromObject({ hour: 14 }).toMillis() && startAt <= luxon_1.DateTime.fromObject({ hour: 17 }).toMillis() // Calculate the combined error rate
? 1 const printerErrorRate = printerErrorRates[printer.name] || 0;
: 0; // More errors in the afternoon const combinedErrorRate = 1 - (1 - generalErrorRate) * (1 - printerErrorRate);
var errorRate = baseErrorRate + userErrorModifier + timeErrorModifier;
if ((0, lodash_1.random)(0, 100) < Math.max(0, Math.min(errorRate, 100))) { if (Math.random() < combinedErrorRate) {
aborted = true; aborted = true;
abortReason = generateDynamicAbortReason(); const errorMessages = [
"Unbekannt",
"Keine Ahnung",
"Falsch gebucht",
"Filament gelöst",
"Druckabbruch",
"Düsenverstopfung",
"Schichthaftung fehlgeschlagen",
"Materialmangel",
"Dateifehler",
"Temperaturproblem",
"Mechanischer Fehler",
"Softwarefehler",
"Kalibrierungsfehler",
"Überhitzung",
];
abortReason = sample(errorMessages); // Generate a random abort reason
} }
var printJob = {
id: (0, uuid_1.v4)(), const printJob = {
id: uuidv4(),
printerId: printer.id, printerId: printer.id,
userId: user.id, userId: user.id,
startAt: startAt, startAt,
durationInMinutes: duration, durationInMinutes: duration,
comments: faker_1.faker.lorem.sentence(), comments: faker.lorem.sentence(),
aborted: aborted, aborted,
abortReason: abortReason, abortReason,
}; };
console.log("Created print job:", printJob); console.log("Created print job:", printJob);
return printJob; return printJob;
}; };
var generateDynamicAbortReason = function () {
var reasons = [ const generatePrintJobsForDay = async (users, printers, dayDate, totalJobsForDay, totalDurationForDay, db, dryRun) => {
"Filament gerissen", console.log(`Generating print jobs for ${dayDate.toISODate()}...`);
"Drucker überhitzt",
"Schichtversatz festgestellt", // Generate random durations that sum up approximately to totalDurationForDay
"Düse verstopft", const durations = [];
"Kalibrierung fehlgeschlagen", let remainingDuration = totalDurationForDay;
"E".concat((0, lodash_1.random)(500, 599)), for (let i = 0; i < totalJobsForDay; i++) {
]; const avgJobDuration = remainingDuration / (totalJobsForDay - i);
var reason = (0, lodash_1.sample)(reasons); const jobDuration = Math.max(
// Add typos to simulate human variability Math.round(random(avgJobDuration * 0.8, avgJobDuration * 1.2)),
if ((0, lodash_1.random)(0, 1)) { 5, // Minimum duration of 5 minutes
reason = reason.replace("e", (0, lodash_1.random)(0, 1) ? "é" : "e"); );
durations.push(jobDuration);
remainingDuration -= jobDuration;
} }
return reason;
}; // Shuffle durations to randomize job lengths
var generatePrintJobsForWeek = function (users, printers, weekNumber, const shuffledDurations = sampleSize(durations, durations.length);
// biome-ignore lint/suspicious/noExplicitAny: <explanation>
db, dryRun) { return __awaiter(void 0, void 0, void 0, function () { for (let i = 0; i < totalJobsForDay; i++) {
var weekConfig, totalJobs, startOfWeek, jobsRemaining, day, dayDate, _i, printers_1, printer, jobsForDay, i, timeSlots, selectedSlot, startAt, printJob; const duration = shuffledDurations[i];
return __generator(this, function (_a) {
switch (_a.label) { // Random start time between 8 AM and 6 PM, adjusted to avoid overlapping durations
case 0: const possibleStartHours = Array.from({ length: 10 }, (_, idx) => idx + 8); // 8 AM to 6 PM
console.log("Generating print jobs for week ".concat(weekNumber, "...")); let startAt;
weekConfig = weekUsage[weekNumber]; let attempts = 0;
totalJobs = (0, lodash_1.random)(weekConfig.minJobs, weekConfig.maxJobs); do {
startOfWeek = startDate.plus({ weeks: weekNumber - 44 }); const hour = sample(possibleStartHours);
jobsRemaining = totalJobs; const minute = random(0, 59);
day = 0; startAt = dayDate.set({ hour, minute, second: 0, millisecond: 0 }).toMillis();
_a.label = 1; attempts++;
case 1: if (attempts > 10) {
if (!(day < 7)) return [3 /*break*/, 7]; console.log("Unable to find available time slot, skipping job.");
dayDate = startOfWeek.plus({ days: day }); break;
if (dayDate > endDate || jobsRemaining <= 0)
return [3 /*break*/, 7];
if (holidays.includes(dayDate.toISODate()) || dayDate.weekday === 6 || dayDate.weekday === 7) {
console.log("Skipping holiday or weekend: ".concat(dayDate.toISODate()));
return [3 /*break*/, 6];
} }
// Update printer status to simulate maintenance or breakdowns } while (!isPrinterAvailable(sample(printers), startAt, duration));
for (_i = 0, printers_1 = printers; _i < printers_1.length; _i++) {
printer = printers_1[_i]; if (attempts > 10) continue;
if ((0, lodash_1.random)(0, 100) < 5) {
// 5% chance per day that a printer goes out of service const printJob = createPrintJob(users, printers, startAt, duration);
printer.status = 2; // Status 2 means "out of service" if (printJob) {
console.log("Printer ".concat(printer.name, " is out of service on ").concat(dayDate.toISODate())); if (!dryRun) {
} await db.run(
else if (printer.status === 2) { `INSERT INTO printJob (id, printerId, userId, startAt, durationInMinutes, comments, aborted, abortReason)
printer.status = 0; // Printer becomes available again VALUES (?, ?, ?, ?, ?, ?, ?, ?)`,
} [
}
jobsForDay = Math.min(jobsRemaining, (0, lodash_1.random)(1, 3));
jobsRemaining -= jobsForDay;
console.log("Generating ".concat(jobsForDay, " print jobs for day ").concat(dayDate.toISODate(), "..."));
i = 0;
_a.label = 2;
case 2:
if (!(i < jobsForDay)) return [3 /*break*/, 6];
timeSlots = [
{ hour: 7, minute: 0 },
{ hour: 11, minute: 0 },
{ hour: 13, minute: 0 },
{ hour: 15, minute: 0 },
];
selectedSlot = (0, lodash_1.sample)(timeSlots);
startAt = luxon_1.DateTime.fromISO("".concat(dayDate.toISODate(), "T").concat(String(selectedSlot.hour).padStart(2, "0"), ":").concat(String(selectedSlot.minute + (0, lodash_1.random)(0, 30)).padStart(2, "0"), ":00"));
printJob = createPrintJob(users, printers, startAt.toMillis());
if (!printJob) return [3 /*break*/, 5];
if (!!dryRun) return [3 /*break*/, 4];
return [4 /*yield*/, db.run("INSERT INTO printJob (id, printerId, userId, startAt, durationInMinutes, comments, aborted, abortReason)\n VALUES (?, ?, ?, ?, ?, ?, ?, ?)", [
printJob.id, printJob.id,
printJob.printerId, printJob.printerId,
printJob.userId, printJob.userId,
@ -260,125 +234,134 @@ db, dryRun) { return __awaiter(void 0, void 0, void 0, function () {
printJob.comments, printJob.comments,
printJob.aborted ? 1 : 0, printJob.aborted ? 1 : 0,
printJob.abortReason, printJob.abortReason,
])]; ],
case 3: );
_a.sent(); }
_a.label = 4;
case 4:
existingJobs.push(printJob); existingJobs.push(printJob);
console.log("Inserted print job into database:", printJob.id); console.log("Inserted print job into database:", printJob.id);
console.log(JSON.stringify({
event: "PrintJobCreated",
jobId: printJob.id,
printerId: printJob.printerId,
userId: printJob.userId,
startAt: new Date(printJob.startAt).toISOString(),
duration: printJob.durationInMinutes,
aborted: printJob.aborted,
}));
_a.label = 5;
case 5:
i++;
return [3 /*break*/, 2];
case 6:
day++;
return [3 /*break*/, 1];
case 7: return [2 /*return*/];
} }
});
}); };
var generateTestData = function () {
var args_1 = [];
for (var _i = 0; _i < arguments.length; _i++) {
args_1[_i] = arguments[_i];
} }
return __awaiter(void 0, __spreadArray([], args_1, true), void 0, function (dryRun) {
var db, users, printers, _a, users_1, user, _b, printers_2, printer, validateData, _c, _d, weekNumber;
if (dryRun === void 0) { dryRun = false; }
return __generator(this, function (_e) {
switch (_e.label) {
case 0:
console.log("Starting test data generation...");
return [4 /*yield*/, initDB()];
case 1:
db = _e.sent();
users = __spreadArray(__spreadArray([], Array.from({ length: 7 }, function () { return createUser(false); }), true), Array.from({ length: 3 }, function () { return createUser(true); }), true);
printers = Array.from({ length: 5 }, createPrinter);
if (!!dryRun) return [3 /*break*/, 9];
_a = 0, users_1 = users;
_e.label = 2;
case 2:
if (!(_a < users_1.length)) return [3 /*break*/, 5];
user = users_1[_a];
return [4 /*yield*/, db.run("INSERT INTO user (id, github_id, name, displayName, email, role)\n VALUES (?, ?, ?, ?, ?, ?)", [user.id, user.github_id, user.username, user.displayName, user.email, user.role])];
case 3:
_e.sent();
console.log("Inserted user into database:", user.id);
_e.label = 4;
case 4:
_a++;
return [3 /*break*/, 2];
case 5:
_b = 0, printers_2 = printers;
_e.label = 6;
case 6:
if (!(_b < printers_2.length)) return [3 /*break*/, 9];
printer = printers_2[_b];
return [4 /*yield*/, db.run("INSERT INTO printer (id, name, description, status)\n VALUES (?, ?, ?, ?)", [printer.id, printer.name, printer.description, printer.status])];
case 7:
_e.sent();
console.log("Inserted printer into database:", printer.id);
_e.label = 8;
case 8:
_b++;
return [3 /*break*/, 6];
case 9:
validateData = function (printJobs, users, printers) {
var _loop_1 = function (job) {
var userExists = users.some(function (user) { return user.id === job.userId; });
var printerExists = printers.some(function (printer) { return printer.id === job.printerId; });
if (!userExists || !printerExists) {
console.error("Invalid job detected: ".concat(job.id));
}
};
for (var _i = 0, printJobs_1 = printJobs; _i < printJobs_1.length; _i++) {
var job = printJobs_1[_i];
_loop_1(job);
}
};
_c = 0, _d = Object.keys(weekUsage);
_e.label = 10;
case 10:
if (!(_c < _d.length)) return [3 /*break*/, 13];
weekNumber = _d[_c];
return [4 /*yield*/, generatePrintJobsForWeek(users, printers, Number.parseInt("".concat(weekNumber)), db, dryRun)];
case 11:
_e.sent();
console.log("======> \uD83D\uDCC5 Week ".concat(weekNumber));
validateData(existingJobs, users, printers);
_e.label = 12;
case 12:
_c++;
return [3 /*break*/, 10];
case 13:
if (!!dryRun) return [3 /*break*/, 15];
return [4 /*yield*/, db.close()];
case 14:
_e.sent();
console.log("Database connection closed. Test data generation complete.");
return [3 /*break*/, 16];
case 15:
console.log("Dry run complete. No data was written to the database.");
_e.label = 16;
case 16: return [2 /*return*/];
}
});
});
}; };
generateTestData(process.argv.includes("--dry-run"))
.then(function () { const generateTestData = async (dryRun = false) => {
console.log("Test data generation script finished."); console.log("Starting test data generation...");
}) const db = await initDB();
.catch(function (err) {
console.error("Error generating test data:", err); // Generate users and printers
const users = [
...Array.from({ length: 7 }, () => createUser(false)),
...Array.from({ length: 3 }, () => createUser(true)),
];
const printers = Array.from({ length: numberOfPrinters }, (_, index) => createPrinter(index + 1));
if (!dryRun) {
// Insert users into the database
for (const user of users) {
await db.run(
`INSERT INTO user (id, github_id, name, displayName, email, role)
VALUES (?, ?, ?, ?, ?, ?)`,
[user.id, user.github_id, user.username, user.displayName, user.email, user.role],
);
console.log("Inserted user into database:", user.id);
}
// Insert printers into the database
for (const printer of printers) {
await db.run(
`INSERT INTO printer (id, name, description, status)
VALUES (?, ?, ?, ?)`,
[printer.id, printer.name, printer.description, printer.status],
);
console.log("Inserted printer into database:", printer.id);
}
}
// Generate print jobs for each day within the specified date range
let currentDay = startDate;
while (currentDay <= endDate) {
const weekdayName = currentDay.toFormat("EEEE"); // Get weekday name (e.g., 'Monday')
if (holidays.includes(currentDay.toISODate()) || avgPrintTimesPerDay[weekdayName] === 0) {
console.log(`Skipping holiday or no jobs scheduled: ${currentDay.toISODate()}`);
currentDay = currentDay.plus({ days: 1 });
continue;
}
const totalJobsForDay = avgPrintTimesPerDay[weekdayName];
const totalDurationForDay = avgPrintDurationPerDay[weekdayName];
await generatePrintJobsForDay(users, printers, currentDay, totalJobsForDay, totalDurationForDay, db, dryRun);
currentDay = currentDay.plus({ days: 1 });
}
if (!dryRun) {
await db.close();
console.log("Database connection closed. Test data generation complete.");
} else {
console.log("Dry run complete. No data was written to the database.");
}
};
/**
 * Overrides the module-level generation settings with the values in `config`.
 *
 * Only keys that are present (truthy, or not `undefined` for
 * `generalErrorRate`) are applied; every other setting keeps its current
 * value. Map-valued settings replace the current map wholesale.
 *
 * @param {object} [config] - Partial set of overrides.
 * @param {string} [config.startDate] - ISO date of the first generated day.
 * @param {string} [config.endDate] - ISO date of the last generated day.
 * @param {number} [config.numberOfPrinters]
 * @param {Object<string, number>} [config.avgPrintTimesPerDay] - keyed by weekday name.
 * @param {Object<string, number>} [config.avgPrintDurationPerDay] - keyed by weekday name.
 * @param {Object<string, number>} [config.printerUsage] - keyed by printer name.
 * @param {number} [config.generalErrorRate]
 * @param {Object<string, number>} [config.printerErrorRates] - keyed by printer name.
 * @throws {Error} If `startDate` or `endDate` is not a parsable ISO date.
 */
const setConfigurations = (config = {}) => {
  // An unparsable date yields an invalid DateTime that compares as NaN, so the
  // day loop would silently generate nothing. Fail loudly instead.
  const parseIsoDate = (key) => {
    const parsed = DateTime.fromISO(config[key]);
    if (!parsed.isValid) {
      throw new Error(`Invalid ${key} "${config[key]}": ${parsed.invalidReason}`);
    }
    return parsed;
  };

  if (config.startDate) startDate = parseIsoDate("startDate");
  if (config.endDate) endDate = parseIsoDate("endDate");
  if (config.numberOfPrinters) numberOfPrinters = config.numberOfPrinters;
  if (config.avgPrintTimesPerDay) avgPrintTimesPerDay = config.avgPrintTimesPerDay;
  if (config.avgPrintDurationPerDay) avgPrintDurationPerDay = config.avgPrintDurationPerDay;
  if (config.printerUsage) printerUsage = config.printerUsage;
  // 0 is a meaningful error rate, so test against undefined rather than truthiness.
  if (config.generalErrorRate !== undefined) generalErrorRate = config.generalErrorRate;
  if (config.printerErrorRates) printerErrorRates = config.printerErrorRates;
};
// Example usage
setConfigurations({
startDate: "2024-10-08",
endDate: "2024-11-08",
numberOfPrinters: 6,
avgPrintTimesPerDay: {
Monday: 4, // High usage
Tuesday: 2, // Low usage
Wednesday: 3, // Low usage
Thursday: 2, // Low usage
Friday: 8, // High usage
Saturday: 0,
Sunday: 0,
},
avgPrintDurationPerDay: {
Monday: 300, // High total duration
Tuesday: 60, // Low total duration
Wednesday: 90,
Thursday: 60,
Friday: 240,
Saturday: 0,
Sunday: 0,
},
printerUsage: {
"Drucker 1": 2.3,
"Drucker 2": 1.7,
"Drucker 3": 0.1,
"Drucker 4": 1.5,
"Drucker 5": 2.4,
"Drucker 6": 0.3,
"Drucker 7": 0.9,
"Drucker 8": 0.1,
},
generalErrorRate: 0.05, // 5% general error rate
printerErrorRates: {
"Drucker 1": 0.02,
"Drucker 2": 0.03,
"Drucker 3": 0.1,
"Drucker 4": 0.05,
"Drucker 5": 0.04,
"Drucker 6": 0.02,
"Drucker 7": 0.01,
"PrinteDrucker 8": 0.03,
},
}); });
// Script entry point: run the generator, honouring the --dry-run flag.
generateTestData(process.argv.includes("--dry-run"))
  .then(() => {
    console.log("Test data generation script finished.");
  })
  .catch((err) => {
    console.error("Error generating test data:", err);
    // Report the failure to the calling shell / CI instead of exiting with 0.
    process.exitCode = 1;
  });

View File

@ -1,357 +0,0 @@
import * as sqlite3 from "sqlite3";
/** A generated test user, as produced by createUser. */
type User = {
// UUID (v4) generated for this user.
id: string;
// Random integer from faker standing in for a GitHub account id.
github_id: number;
// Upper-cased short handle: first 2 letters of the first name + first 6 of the last name.
// Written to the `name` column of the `user` table.
username: string;
// Upper-cased "FIRST LAST".
displayName: string;
email: string;
// Picked from ["user", "admin"] with lodash `sample`.
role: string | undefined;
// Not stored in the database; only used while generating jobs
// (selection weight and error-rate modifier).
isPowerUser: boolean;
};
/** A generated test printer, as produced by createPrinter. */
type Printer = {
// UUID (v4) generated for this printer.
id: string;
name: string;
// Random lorem sentence.
description: string;
// Integer in 0..2. The generator treats 2 as "out of service";
// the meaning of 0 and 1 is not defined in this file — TODO confirm against the app.
status: number;
};
/** A generated print job, one row of the `printJob` table. */
type PrintJob = {
// UUID (v4) generated for this job.
id: string;
// `id` of the Printer the job runs on.
printerId: string;
// `id` of the User who owns the job.
userId: string;
// Start time as epoch milliseconds.
startAt: number;
durationInMinutes: number;
// Random lorem sentence.
comments: string;
// Stored as 1/0 when inserted into the database.
aborted: boolean;
// Set only when `aborted` is true; null otherwise.
abortReason: string | null;
};
import { faker } from "@faker-js/faker";
import { random, sample } from "lodash";
import { DateTime } from "luxon";
import { open } from "sqlite";
import { v4 as uuidv4 } from "uuid";
// Path of the SQLite database file opened by initDB.
const dbPath = "./db/sqlite.db";
// Configuration for test data generation.
// First day of the generated range; week offsets are computed relative to this date.
const startDate = DateTime.fromISO("2024-11-01");
// Last day of the generated range; no jobs are generated for later days.
const endDate = DateTime.fromISO("2024-11-30");
// ISO dates ("yyyy-MM-dd") on which no jobs are generated. Empty by default.
const holidays: string[] = [];
// Every job generated so far in this run; consulted for printer overlap checks.
const existingJobs: PrintJob[] = [];
// Per-calendar-week load: the total number of jobs for a week is drawn
// uniformly between minJobs and maxJobs. Keys are week numbers.
const weekUsage = {
44: { minJobs: 4, maxJobs: 6 },
45: { minJobs: 10, maxJobs: 15 },
46: { minJobs: 10, maxJobs: 15 },
47: { minJobs: 3, maxJobs: 5 },
48: { minJobs: 10, maxJobs: 15 },
};
// Printer names preferred for regular jobs (fastPrints) and for large jobs (largePrints).
const printerUsageBias = {
fastPrints: ["Printer A", "Printer B"],
largePrints: ["Printer C", "Printer D", "Printer E"],
};
/**
 * Opens the SQLite database file at `dbPath` using the sqlite3 driver.
 *
 * @returns A promise for the opened database handle.
 */
const initDB = async () => {
  console.log("Initializing database connection...");
  const connectionOptions = {
    filename: dbPath,
    driver: sqlite3.Database,
  };
  return open(connectionOptions);
};
/**
 * Builds one fake user with a random name, id, GitHub id and role.
 *
 * @param isPowerUser - Marks the user as a power user (defaults to false).
 * @returns The new user; it is also logged to the console.
 */
const createUser = (isPowerUser = false): User => {
  const firstName = faker.person.firstName();
  const lastName = faker.person.lastName();

  // Short handle: two letters of the first name followed by six of the last name.
  const handle = `${firstName.slice(0, 2)}${lastName.slice(0, 6)}`;
  const fullName = `${firstName} ${lastName}`;

  const user = {
    id: uuidv4(),
    github_id: faker.number.int(),
    username: handle.toUpperCase(),
    displayName: fullName.toUpperCase(),
    email: `${firstName}.${lastName}@mercedes-benz.com`,
    role: sample(["user", "admin"]),
    isPowerUser,
  };

  console.log("Created user:", user);
  return user;
};
/**
 * Builds one fake printer.
 *
 * The signature matches an `Array.from` map callback, so
 * `Array.from({ length: n }, createPrinter)` yields distinct, predictable
 * names "Printer A", "Printer B", ... — the names listed in
 * `printerUsageBias`. Previously the name was "Printer <random digit>", which
 * could repeat and never matched the bias lists.
 *
 * @param _value - Ignored (element slot of the `Array.from` callback).
 * @param index - Zero-based position of the printer; 0..25 map to A..Z.
 *   When omitted or out of that range, a random digit is used as before.
 * @returns The new printer; it is also logged to the console.
 */
const createPrinter = (_value?: unknown, index?: number): Printer => {
  const hasLetterIndex = typeof index === "number" && Number.isInteger(index) && index >= 0 && index < 26;
  const suffix = hasLetterIndex
    ? String.fromCharCode("A".charCodeAt(0) + (index as number))
    : String(faker.number.int({ max: 9 }));

  const printer = {
    id: uuidv4(),
    name: `Printer ${suffix}`,
    description: faker.lorem.sentence(),
    status: random(0, 2),
  };
  console.log("Created printer:", printer);
  return printer;
};
/**
 * Checks whether a printer is free for a proposed job window.
 *
 * @param printer - Printer to check; only jobs with the same printer id count.
 * @param startAt - Proposed start, epoch milliseconds.
 * @param duration - Proposed duration in minutes.
 * @returns false if any job in `existingJobs` on this printer overlaps the window, true otherwise.
 */
const isPrinterAvailable = (printer: Printer, startAt: number, duration: number): boolean => {
  const endAt = startAt + duration * 60 * 1000; // minutes -> milliseconds

  for (const booked of existingJobs) {
    if (booked.printerId !== printer.id) {
      continue;
    }
    const bookedStart = booked.startAt;
    const bookedEnd = booked.startAt + booked.durationInMinutes * 60 * 1000;

    const startsInside = startAt >= bookedStart && startAt < bookedEnd;
    const endsInside = endAt > bookedStart && endAt <= bookedEnd;
    const coversBooked = startAt <= bookedStart && endAt >= bookedEnd;
    if (startsInside || endsInside || coversBooked) {
      return false;
    }
  }
  return true;
};
/**
 * Picks a random user, with power users three times as likely as others.
 *
 * @param users - Candidate users.
 * @returns The chosen user, or undefined when `users` is empty.
 */
const weightedSampleUser = (users: User[]): User | undefined => {
  // Each user gets one entry per "ticket"; sampling the pool uniformly
  // then gives the weighted draw.
  const pool: User[] = [];
  for (const candidate of users) {
    const tickets = candidate.isPowerUser ? 3 : 1;
    for (let t = 0; t < tickets; t++) {
      pool.push(candidate);
    }
  }
  return sample(pool);
};
/**
 * Draws one normally distributed random number using the Box-Muller transform.
 *
 * @param mean - Mean of the distribution.
 * @param stdDev - Standard deviation of the distribution.
 * @returns A random sample.
 */
const normalRandom = (mean: number, stdDev: number): number => {
  // Math.random() may return exactly 0, which would make log(u) -Infinity; redraw until non-zero.
  const drawNonZero = (): number => {
    let value = Math.random();
    while (value === 0) {
      value = Math.random();
    }
    return value;
  };

  const u = drawNonZero();
  const v = drawNonZero();
  const radius = Math.sqrt(-2 * Math.log(u));
  const angle = 2 * Math.PI * v;
  return mean + stdDev * radius * Math.cos(angle);
};
/**
 * Builds one print job starting at `startAt`, or returns null when no job can be created.
 *
 * Steps: pick a user (power users weighted higher), decide whether this is a
 * large print (about 30%), pick a printer from the matching `printerUsageBias`
 * list (falling back to any printer), draw a normally distributed duration,
 * check the printer is free, then decide whether the job is aborted.
 *
 * @param users - Candidate job owners.
 * @param printers - Candidate printers.
 * @param startAt - Job start, epoch milliseconds.
 * @returns The new job, or null if there are no users/printers or the chosen
 *   printer is already busy in that window.
 */
const createPrintJob = (users: User[], printers: Printer[], startAt: number): PrintJob | null => {
  const user = weightedSampleUser(users);
  // Without a user or any printer there is nothing to build; previously this crashed.
  if (!user || printers.length === 0) {
    console.log("No users or printers available, skipping job creation.");
    return null;
  }

  // Probabilistic determination for large prints (30% chance).
  const isLargePrint = random(0, 100) < 30;
  const preferredNames = isLargePrint ? printerUsageBias.largePrints : printerUsageBias.fastPrints;
  const preferredPrinter = sample(printers.filter((p) => preferredNames.includes(p.name)));
  // Fall back to any printer when none of the preferred names exist.
  const printer = (preferredPrinter ?? sample(printers)) as Printer;

  // Normally distributed duration, clamped to realistic limits.
  const minDuration = 15;
  const maxDuration = isLargePrint ? 5760 : 3540; // 96 hours for large prints, 59 hours otherwise (in minutes)
  const rawDuration = Math.round(normalRandom(isLargePrint ? 240 : 75, 30));
  const duration = Math.min(Math.max(rawDuration, minDuration), maxDuration);

  // Ensure printer availability
  if (!isPrinterAvailable(printer, startAt, duration)) {
    console.log("Printer not available, skipping job creation.");
    return null;
  }

  // Error probability in percent: base rate, adjusted per user and time of day.
  const baseErrorRate = 5;
  const userErrorModifier = user.isPowerUser ? -2 : 2; // Power users make fewer errors
  // The afternoon window must be taken on the job's own day. Comparing against
  // DateTime.fromObject({ hour: 14 }) used the day the script runs instead.
  const jobStart = DateTime.fromMillis(startAt);
  const afternoonStart = jobStart.set({ hour: 14, minute: 0, second: 0, millisecond: 0 }).toMillis();
  const afternoonEnd = jobStart.set({ hour: 17, minute: 0, second: 0, millisecond: 0 }).toMillis();
  const timeErrorModifier = startAt >= afternoonStart && startAt <= afternoonEnd ? 1 : 0; // More errors in the afternoon
  const errorRate = Math.max(0, Math.min(baseErrorRate + userErrorModifier + timeErrorModifier, 100));

  const aborted = random(0, 100) < errorRate;
  const abortReason: string | null = aborted ? generateDynamicAbortReason() : null;

  const printJob = {
    id: uuidv4(),
    printerId: printer.id,
    userId: user.id,
    startAt,
    durationInMinutes: duration,
    comments: faker.lorem.sentence(),
    aborted,
    abortReason,
  };
  console.log("Created print job:", printJob);
  return printJob;
};
/**
 * Produces a random abort reason for a failed print job.
 *
 * The reason is one of five fixed German phrases or an error code "E500".."E599".
 * In roughly a quarter of calls the first "e" is replaced by "é" to imitate
 * inconsistent manual input.
 *
 * @returns The abort reason text.
 */
const generateDynamicAbortReason = (): string => {
  const errorCode = `E${random(500, 599)}`;
  const candidates = [
    "Filament gerissen",
    "Drucker überhitzt",
    "Schichtversatz festgestellt",
    "Düse verstopft",
    "Kalibrierung fehlgeschlagen",
    errorCode,
  ];
  const picked = sample(candidates) as string;

  // Coin flip: leave the text untouched half of the time.
  if (!random(0, 1)) {
    return picked;
  }
  // Second coin flip: swap in an accented "é" or keep the plain "e".
  const replacement = random(0, 1) ? "é" : "e";
  return picked.replace("e", replacement);
};
/**
 * Generates the print jobs for one configured week and, unless `dryRun` is set,
 * inserts them into the `printJob` table.
 *
 * The week's total job count is drawn between `minJobs` and `maxJobs` from
 * `weekUsage`, then spent at 1-3 jobs per working day. Week N begins
 * (N - week number of `startDate`) weeks after `startDate`, so a "week" here
 * starts on `startDate`'s weekday rather than on Monday. Holidays, Saturdays
 * and Sundays are skipped. Every created job is appended to `existingJobs`.
 *
 * @param users - Candidate job owners.
 * @param printers - Candidate printers; their in-memory `status` is mutated.
 * @param weekNumber - Key into `weekUsage`.
 * @param db - Database handle; only `db.run(sql, params)` is used.
 * @param dryRun - When true, nothing is written to the database.
 */
const generatePrintJobsForWeek = async (
  users: User[],
  printers: Printer[],
  weekNumber: number,
  // biome-ignore lint/suspicious/noExplicitAny: database handle, only used through run()
  db: any,
  dryRun: boolean,
) => {
  console.log(`Generating print jobs for week ${weekNumber}...`);

  const weekConfig = weekUsage[weekNumber as keyof typeof weekUsage];
  if (!weekConfig) {
    // Previously an unconfigured week crashed on `weekConfig.minJobs`.
    console.warn(`No usage configuration for week ${weekNumber}, skipping.`);
    return;
  }

  // Peak usage in the morning and after lunch; a random 0-30 minutes is added per job.
  const timeSlots = [
    { hour: 7, minute: 0 },
    { hour: 11, minute: 0 },
    { hour: 13, minute: 0 },
    { hour: 15, minute: 0 },
  ];

  const totalJobs = random(weekConfig.minJobs, weekConfig.maxJobs);
  // Offset from the week that contains startDate (44 for the default
  // 2024-11-01) instead of a hard-coded 44 that must be kept in sync.
  const startOfWeek = startDate.plus({ weeks: weekNumber - startDate.weekNumber });
  let jobsRemaining = totalJobs;

  for (let day = 0; day < 7; day++) {
    const dayDate = startOfWeek.plus({ days: day });
    if (dayDate > endDate || jobsRemaining <= 0) break;

    const isWeekend = dayDate.weekday === 6 || dayDate.weekday === 7;
    if (holidays.includes(dayDate.toISODate() as string) || isWeekend) {
      console.log(`Skipping holiday or weekend: ${dayDate.toISODate()}`);
      continue;
    }

    // Simulate maintenance or breakdowns. Only the in-memory objects are updated here.
    for (const printer of printers) {
      if (random(0, 100) < 5) {
        // 5% chance per day that a printer goes out of service
        printer.status = 2; // Status 2 means "out of service"
        console.log(`Printer ${printer.name} is out of service on ${dayDate.toISODate()}`);
      } else if (printer.status === 2) {
        printer.status = 0; // Printer becomes available again
      }
    }

    const jobsForDay = Math.min(jobsRemaining, random(1, 3));
    jobsRemaining -= jobsForDay;
    console.log(`Generating ${jobsForDay} print jobs for day ${dayDate.toISODate()}...`);

    for (let i = 0; i < jobsForDay; i++) {
      const selectedSlot = sample(timeSlots) as { hour: number; minute: number };
      const startAt = dayDate.set({
        hour: selectedSlot.hour,
        minute: selectedSlot.minute + random(0, 30),
        second: 0,
        millisecond: 0,
      });

      const printJob = createPrintJob(users, printers, startAt.toMillis());
      if (!printJob) continue; // printer busy in that window; the job is dropped

      if (!dryRun) {
        await db.run(
          `INSERT INTO printJob (id, printerId, userId, startAt, durationInMinutes, comments, aborted, abortReason)
VALUES (?, ?, ?, ?, ?, ?, ?, ?)`,
          [
            printJob.id,
            printJob.printerId,
            printJob.userId,
            printJob.startAt,
            printJob.durationInMinutes,
            printJob.comments,
            printJob.aborted ? 1 : 0,
            printJob.abortReason,
          ],
        );
      }
      existingJobs.push(printJob);
      // Do not claim an insert happened during a dry run.
      console.log(
        dryRun ? "Generated print job (dry run, not inserted):" : "Inserted print job into database:",
        printJob.id,
      );
      console.log(
        JSON.stringify({
          event: "PrintJobCreated",
          jobId: printJob.id,
          printerId: printJob.printerId,
          userId: printJob.userId,
          startAt: new Date(printJob.startAt).toISOString(),
          duration: printJob.durationInMinutes,
          aborted: printJob.aborted,
        }),
      );
    }
  }
};
/**
 * Entry point of the generator: creates 10 users (3 of them power users) and
 * 5 printers, then generates print jobs for every week in `weekUsage`.
 *
 * Unless `dryRun` is set, users, printers and jobs are inserted into the
 * database. The database handle is always closed, including on dry runs and
 * when an insert fails.
 *
 * @param dryRun - When true, data is generated and logged but nothing is written.
 */
const generateTestData = async (dryRun = false): Promise<void> => {
  console.log("Starting test data generation...");
  const db = await initDB();

  // Reports jobs that reference a user or printer that was not generated in this run.
  const validateData = (printJobs: PrintJob[], users: User[], printers: Printer[]): void => {
    const userIds = new Set(users.map((user) => user.id));
    const printerIds = new Set(printers.map((printer) => printer.id));
    for (const job of printJobs) {
      if (!userIds.has(job.userId) || !printerIds.has(job.printerId)) {
        console.error(`Invalid job detected: ${job.id}`);
      }
    }
  };

  try {
    // Generate users and printers
    const users = [
      ...Array.from({ length: 7 }, () => createUser(false)),
      ...Array.from({ length: 3 }, () => createUser(true)),
    ];
    const printers = Array.from({ length: 5 }, createPrinter);

    if (!dryRun) {
      // Insert users into the database
      for (const user of users) {
        await db.run(
          `INSERT INTO user (id, github_id, name, displayName, email, role)
VALUES (?, ?, ?, ?, ?, ?)`,
          [user.id, user.github_id, user.username, user.displayName, user.email, user.role],
        );
        console.log("Inserted user into database:", user.id);
      }
      // Insert printers into the database
      for (const printer of printers) {
        await db.run(
          `INSERT INTO printer (id, name, description, status)
VALUES (?, ?, ?, ?)`,
          [printer.id, printer.name, printer.description, printer.status],
        );
        console.log("Inserted printer into database:", printer.id);
      }
    }

    // Generate print jobs for each configured week
    for (const weekKey of Object.keys(weekUsage)) {
      const weekNumber = Number.parseInt(weekKey, 10);
      await generatePrintJobsForWeek(users, printers, weekNumber, db, dryRun);
      console.log(`======> 📅 Week ${weekNumber}`);
      validateData(existingJobs, users, printers);
    }
  } finally {
    // Release the handle on every path; it used to leak on dry runs and on errors.
    await db.close();
  }

  if (dryRun) {
    console.log("Dry run complete. No data was written to the database.");
  } else {
    console.log("Database connection closed. Test data generation complete.");
  }
};
// Script entry point: run the generator, honouring the --dry-run flag.
generateTestData(process.argv.includes("--dry-run"))
  .then(() => {
    console.log("Test data generation script finished.");
  })
  .catch((err) => {
    console.error("Error generating test data:", err);
    // Report the failure to the calling shell / CI instead of exiting with 0.
    process.exitCode = 1;
  });