Add the ability to launch the scraper from the package.json "scripts" section

This commit is contained in:
albert
2025-07-29 12:43:48 +02:00
parent e0cb439234
commit 36f6de4edd
2 changed files with 63 additions and 0 deletions

View File

@ -18,6 +18,8 @@
"build": "tsc",
"start": "node dist/server.js",
"dev": "tsx watch src/server.ts",
"scraper": "node dist/scraper.js",
"scraper:dev": "tsx watch src/scraper.ts",
"test": "jest",
"test:watch": "jest --watch",
"lint": "eslint src/**/*.ts",

61
src/scraper.ts Normal file
View File

@@ -0,0 +1,61 @@
import { ScrapingScheduler } from './services/ScrapingScheduler.js';
import { FeedRepository } from './repositories/FeedRepository.js';
import { DatabaseConnection } from './config/database.js';
import { Logger } from './utils/logger.js';
// Module-level handle so the signal-driven shutdown hook can stop the
// scheduler started by initializeScraper(). Unassigned until init succeeds.
let scheduler: ScrapingScheduler;
async function initializeScraper() {
try {
// Connect to database
await DatabaseConnection.getInstance().connect();
Logger.database.connected();
// Initialize repository and scheduler
const feedRepository = new FeedRepository();
scheduler = new ScrapingScheduler(feedRepository, {
intervalMinutes: 30, // Run every 30 minutes
maxRetries: 2,
retryDelayMinutes: 5,
enabled: true
});
// Start the scheduler
scheduler.start();
Logger.info('Scraping scheduler started successfully');
// Log initial stats
const stats = scheduler.getStats();
Logger.info('Initial scheduler stats', stats);
} catch (error) {
Logger.error('Failed to start scraper', { error });
process.exit(1);
}
}
// Guard so the shutdown sequence runs at most once: the handler is
// registered for both SIGINT and SIGTERM, and without this flag a second
// signal (e.g. Ctrl+C pressed twice, or both signals delivered) would run
// the teardown concurrently and double-disconnect the database.
let isShuttingDown = false;

/**
 * Gracefully stop the scraper: shut down the scheduler (if it was started),
 * disconnect from the database, then exit 0. Exits 1 if teardown fails.
 * Idempotent — repeated invocations after the first are no-ops.
 */
const shutdown = async () => {
  if (isShuttingDown) {
    return;
  }
  isShuttingDown = true;
  try {
    if (scheduler) {
      await scheduler.shutdown();
      Logger.info('Scraping scheduler stopped');
    }
    await DatabaseConnection.getInstance().disconnect();
    Logger.database.disconnected();
    process.exit(0);
  } catch (error) {
    Logger.error('Error during scraper shutdown', { error });
    process.exit(1);
  }
};
// Register the graceful-shutdown hook for both termination signals.
for (const signal of ['SIGINT', 'SIGTERM'] as const) {
  process.on(signal, shutdown);
}

// Launch the scraper; a bootstrap failure is fatal for this process.
void initializeScraper().catch(error => {
  Logger.error('Failed to initialize scraper', { error });
  process.exit(1);
});