소스 검색

Merge pull request #50 from Umar-Azam/main

modified config.ts to fix containerized execution
Steve Sewell 1년 전
부모
커밋
27b65d36d4
1개의 변경된 파일, 3개의 추가 그리고 26개의 삭제
  1. 3 26
      containerapp/data/config.ts

+ 3 - 26
containerapp/data/config.ts

@@ -1,31 +1,8 @@
-import { Page } from "playwright";
+import { Config } from "./src/config";
 
-type Config = {
-  /** URL to start the crawl */
-  url: string;
-  /** Pattern to match against for links on a page to subsequently crawl */
-  match: string;
-  /** Selector to grab the inner text from */
-  selector: string;
-  /** Don't crawl more than this many pages */
-  maxPagesToCrawl: number;
-  /** File name for the finished data */
-  outputFileName: string;
-  /** Optional cookie to be set. E.g. for Cookie Consent */
-  cookie?: { name: string; value: string };
-  /** Optional function to run for each page found */
-  onVisitPage?: (options: {
-    page: Page;
-    pushData: (data: any) => Promise<void>;
-  }) => Promise<void>;
-  /** Optional timeout for waiting for a selector to appear */
-  waitForSelectorTimeout?: number;
-};
-
-export const config: Config = {
+export const defaultConfig: Config = {
   url: "https://www.builder.io/c/docs/developers",
   match: "https://www.builder.io/c/docs/**",
-  selector: `.docs-builder-container`,
   maxPagesToCrawl: 50,
   outputFileName: "../data/output.json",
-};
+};