Nick: llm extract in batch scrape

This commit is contained in:
Nicolas 2024-10-28 16:51:49 -03:00
parent 298a343a90
commit 726430c2e6

View File

@@ -4,6 +4,7 @@ import {
BatchScrapeRequest, BatchScrapeRequest,
batchScrapeRequestSchema, batchScrapeRequestSchema,
CrawlResponse, CrawlResponse,
legacyExtractorOptions,
legacyScrapeOptions, legacyScrapeOptions,
RequestWithAuth, RequestWithAuth,
} from "./types"; } from "./types";
@@ -34,6 +35,8 @@ export async function batchScrapeController(
} }
const pageOptions = legacyScrapeOptions(req.body); const pageOptions = legacyScrapeOptions(req.body);
const extractorOptions = req.body.extract ? legacyExtractorOptions(req.body.extract) : undefined;
const sc: StoredCrawl = { const sc: StoredCrawl = {
crawlerOptions: null, crawlerOptions: null,
@@ -65,6 +68,7 @@ export async function batchScrapeController(
plan: req.auth.plan, plan: req.auth.plan,
crawlerOptions: null, crawlerOptions: null,
pageOptions, pageOptions,
extractorOptions,
origin: "api", origin: "api",
crawl_id: id, crawl_id: id,
sitemapped: true, sitemapped: true,