Skip to content

Commit 3126603

Browse files
small changes
1 parent f531670 commit 3126603

5 files changed

Lines changed: 15 additions & 17 deletions

File tree

.env.example

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
# Scraper
22
CORNELL_DINING_API_URL=
3+
WORKERS=
34

45
# Server Configuration
56
PORT=8000

prisma/scraper.ts

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ import { readFileSync } from 'fs';
44
import { join } from 'path';
55
import type { RawScrapedData, RawEatery, RawStaticEatery } from './scraperTypes.js';
66
import { mapCampusArea, mapEateryType, mapPaymentMethod, mapEventType, mapImageUrl, createWeeklyDate } from './mappers.js';
7-
import { CampusArea, PaymentMethod, EateryType, EventType } from '@prisma/client';
7+
import type { CampusArea, PaymentMethod, EateryType } from '@prisma/client';
88

99
dotenv.config();
1010

@@ -376,11 +376,11 @@ async function testProcessEateries(numEateries: number) {
376376

377377
export async function main() {
378378
const startTime = Date.now();
379-
console.log('Starting scraper...\n');
379+
console.log('Starting scraper at', new Date(startTime).toString(), '\n');
380380

381381
// Load static eateries
382382
const staticStartTime = Date.now();
383-
console.log('Loading static eateries...');
383+
console.log('Loading static eateries at', new Date(staticStartTime).toString());
384384
const staticEateries = loadStaticEateries();
385385
const transformedStaticEateries: ReturnType<typeof transformStaticEatery>[] = [];
386386
const skippedStaticEateries: Array<{ name: string; error: string }> = [];
@@ -411,8 +411,8 @@ export async function main() {
411411
console.log(`Found ${diningData.data.eateries.length} eateries from API (${apiFetchDuration}s)`);
412412

413413
const transformStartTime = Date.now();
414-
console.log('Transforming API eatery data with 5 concurrent workers...');
415-
const transformResults = await transformEateriesConcurrently(diningData.data.eateries, 5);
414+
// Log the worker count that is actually used: WORKERS may be unset or empty (falls back to 4), so the raw env value would print "undefined" or nothing.
console.log(`Transforming API eatery data with ${parseInt(process.env.WORKERS || '4', 10)} concurrent workers...`);
415+
const transformResults = await transformEateriesConcurrently(diningData.data.eateries, parseInt(process.env.WORKERS || '4', 10));
416416
const transformedApiEateries = transformResults.map((r) => r.result);
417417
const transformDuration = ((Date.now() - transformStartTime) / 1000).toFixed(2);
418418
console.log(`✓ Successfully transformed ${transformedApiEateries.length} API eateries (${transformDuration}s)\n`);

prisma/scraperTypes.ts

Lines changed: 2 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -117,14 +117,8 @@ export type RawStaticEatery = {
117117
latitude: number;
118118
longitude: number;
119119
location: string;
120-
campusArea: {
121-
descr: string;
122-
descrshort: string;
123-
};
124-
eateryTypes: Array<{
125-
descr: string;
126-
descrshort: string;
127-
}>;
120+
campusArea: RawCampusArea;
121+
eateryTypes: RawEateryType[];
128122
onlineOrdering?: boolean;
129123
onlineOrderUrl?: string | null;
130124
operatingHours: Array<{

prisma/staticEateries.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -990,4 +990,4 @@
990990
]
991991
}
992992
]
993-
}
993+
}

src/scheduler/scraperScheduler.ts

Lines changed: 6 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,13 +6,17 @@ let isRunning = false;
66

77
export async function runScraperSafely() {
88
if (isRunning) {
9-
console.log('[Scheduler] Scraper is already running, skipping this execution');
9+
console.log(
10+
'[Scheduler] Scraper is already running, skipping this execution',
11+
);
1012
return;
1113
}
1214

1315
isRunning = true;
1416
const startTime = Date.now();
15-
console.log(`[Scheduler] Starting scheduled scraper run at ${new Date().toISOString()}`);
17+
console.log(
18+
`[Scheduler] Starting scheduled scraper run at ${new Date().toISOString()}`,
19+
);
1620

1721
try {
1822
await runScraper();
@@ -45,4 +49,3 @@ export function startScraperScheduler() {
4549

4650
return task;
4751
}
48-

0 commit comments

Comments
 (0)