// firecrawl/apps/test-suite/tests/scrape.test.ts

import request from "supertest";
import dotenv from "dotenv";
import { numTokensFromString } from "../utils/tokens";
import OpenAI from "openai";
import { WebsiteScrapeError } from "../utils/types";
import { logErrors } from "../utils/log";

import websitesData from "../data/scrape.json";
import "dotenv/config";

import fs from 'fs';
dotenv.config();

/** One entry of the scrape dataset: a page to scrape plus a question to ask about its content. */
interface WebsiteData {
  /** URL sent as `url` in the body of the `/v0/scrape` request. */
  website: string;
  /** Question interpolated into the prompt sent to the chat model, which is told to answer 'yes' or 'no'. */
  prompt: string;
  /** Expected answer; it is lower-cased and must appear as a substring of the lower-cased model reply. */
  expected_output: string;
}

// Base URL every scrape request in this file is sent to (loopback address, port 3002).
const TEST_URL = "http://127.0.0.1:3002";

/**
 * End-to-end check of the scrape endpoint against the website dataset.
 *
 * Every dataset entry is scraped through `POST /v0/scrape`; the returned markdown is sent to an
 * OpenAI chat model together with the entry's question, and the lower-cased reply must contain
 * the entry's expected output. The run passes when at least 70% of the entries match.
 */
describe("Scraping Checkup (E2E)", () => {
  // Fail fast when the credentials used further down are missing.
  beforeAll(() => {
    if (!process.env.TEST_API_KEY) {
      throw new Error("TEST_API_KEY is not set");
    }
    if (!process.env.OPENAI_API_KEY) {
      throw new Error("OPENAI_API_KEY is not set");
    }
  });

  describe("Scraping website tests with a dataset", () => {
    it("Should scrape the website and prompt it against OpenAI", async () => {
      let passedTests = 0;
      let totalTokens = 0;
      const batchSize = 15; // Adjusted to comply with the rate limit of 15 per minute
      const batchPromises: Promise<void[]>[] = [];

      const startTime = new Date().getTime();
      const date = new Date();
      const logsDir = `logs/${date.getMonth() + 1}-${date.getDate()}-${date.getFullYear()}`;

      const errorLogFileName = `${logsDir}/run.log_${new Date().toTimeString().split(' ')[0]}`;
      const errorLog: WebsiteScrapeError[] = [];

      // One client is enough for the whole run; it holds no per-website state here.
      const openai = new OpenAI({
        apiKey: process.env.OPENAI_API_KEY,
      });

      /** Appends one failure entry for `websiteData` to the run's error log. */
      const recordError = (
        websiteData: WebsiteData,
        error: string,
        actualOutput = ""
      ): void => {
        errorLog.push({
          website: websiteData.website,
          prompt: websiteData.prompt,
          expected_output: websiteData.expected_output,
          actual_output: actualOutput,
          error,
        });
      };

      /**
       * Scrapes a single website, asks the model the entry's question and updates the counters.
       * Never rejects: every failure is logged and recorded in `errorLog` instead.
       */
      const checkWebsite = async (websiteData: WebsiteData): Promise<void> => {
        try {
          const scrapedContent = await request(TEST_URL)
            .post("/v0/scrape")
            .set("Content-Type", "application/json")
            .set("Authorization", `Bearer ${process.env.TEST_API_KEY}`)
            .send({ url: websiteData.website, pageOptions: { onlyMainContent: true } });

          if (scrapedContent.statusCode !== 200) {
            console.error(`Failed to scrape ${websiteData.website} ${scrapedContent.statusCode}`);
            recordError(
              websiteData,
              `Failed to scrape website. ${scrapedContent.statusCode} ${scrapedContent.body.error}`
            );
            return;
          }

          const prompt = `Based on this markdown extracted from a website html page, ${websiteData.prompt} Just say 'yes' or 'no' to the question.\nWebsite markdown: ${scrapedContent.body.data.markdown}\n`;

          // Ask the model, retrying up to `maxRetries` times with a 2 second pause between attempts.
          let msg = null;
          const maxRetries = 3;
          let attempts = 0;
          while (!msg && attempts < maxRetries) {
            try {
              msg = await openai.chat.completions.create({
                model: "gpt-4-turbo",
                max_tokens: 100,
                temperature: 0,
                messages: [
                  {
                    role: "user",
                    content: prompt
                  },
                ],
              });
            } catch (error) {
              console.error(`Attempt ${attempts + 1}: Failed to prompt for ${websiteData.website}, error: ${error}`);
              attempts++;
              if (attempts < maxRetries) {
                console.log(`Retrying... Attempt ${attempts + 1}`);
                await new Promise(resolve => setTimeout(resolve, 2000)); // Wait for 2 seconds before retrying
              }
            }
          }

          if (!msg) {
            console.error(`Failed to prompt for ${websiteData.website} after ${maxRetries} attempts`);
            recordError(websiteData, "Failed to prompt... model error.");
            return;
          }

          const actualOutput = (msg.choices[0].message.content ?? "").toLowerCase();
          const expectedOutput = websiteData.expected_output.toLowerCase();

          // Token usage is counted for the prompt and the (lower-cased) reply.
          totalTokens += numTokensFromString(prompt, "gpt-4") + numTokensFromString(actualOutput, "gpt-4");

          // A substring match is enough: the model may wrap its yes/no in extra words.
          if (actualOutput.includes(expectedOutput)) {
            passedTests++;
            return;
          }

          console.error(
            `This website failed the test: ${websiteData.website}`
          );
          console.error(`Actual output: ${actualOutput}`);
          recordError(websiteData, "Output mismatch", actualOutput);
        } catch (error) {
          console.error(
            `Error processing ${websiteData.website}: ${error}`
          );
          recordError(websiteData, `Error processing ${websiteData.website}: ${error}`);
        }
      };

      for (let i = 0; i < websitesData.length; i += batchSize) {
        // Introducing delay to respect the rate limit of 15 requests per minute
        // NOTE(review): batches are started 10 seconds apart and are not awaited before the next
        // one starts, so more than 15 requests can be issued within a minute — confirm against
        // the real rate limit.
        await new Promise(resolve => setTimeout(resolve, 10000));

        const batch = websitesData.slice(i, i + batchSize);
        batchPromises.push(
          Promise.all(batch.map((websiteData: WebsiteData) => checkWebsite(websiteData)))
        );
      }

      // Wait for every in-flight website check before computing the score.
      await Promise.all(batchPromises);

      const score = (passedTests / websitesData.length) * 100;
      const endTime = new Date().getTime();
      const timeTaken = (endTime - startTime) / 1000;
      console.log(`Score: ${score}%`);
      console.log(`Total tokens: ${totalTokens}`);

      await logErrors(errorLog, timeTaken, totalTokens, score, websitesData.length);

      // On local runs, also dump the failures to a per-day log directory.
      if (process.env.ENV === "local" && errorLog.length > 0) {
        if (!fs.existsSync(logsDir)) {
          fs.mkdirSync(logsDir, { recursive: true });
        }
        fs.writeFileSync(errorLogFileName, JSON.stringify(errorLog, null, 2));
      }

      expect(score).toBeGreaterThanOrEqual(70);
    }, 350000); // 350 seconds timeout
  });
});
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00			`import request from "supertest";`
			`import dotenv from "dotenv";`
added crawl test suite 2024-05-16 02:50:50 +08:00			`import { numTokensFromString } from "../utils/tokens";`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`import OpenAI from "openai";`
added crawl test suite 2024-05-16 02:50:50 +08:00			`import { WebsiteScrapeError } from "../utils/types";`
			`import { logErrors } from "../utils/log";`
Nick: test suite 2024-05-09 03:36:54 +08:00
added crawl test suite 2024-05-16 02:50:50 +08:00			`import websitesData from "../data/scrape.json";`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`import "dotenv/config";`

added crawl test suite 2024-05-16 02:50:50 +08:00			`import fs from 'fs';`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00			`dotenv.config();`

Nick: test suite init 2024-05-09 02:38:46 +08:00			`interface WebsiteData {`
			`website: string;`
			`prompt: string;`
			`expected_output: string;`
			`}`

Nick: test suite 2024-05-09 03:36:54 +08:00			`const TEST_URL = "http://127.0.0.1:3002";`

added crawl test suite 2024-05-16 02:50:50 +08:00			`describe("Scraping Checkup (E2E)", () => {`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00			`beforeAll(() => {`
			`if (!process.env.TEST_API_KEY) {`
			`throw new Error("TEST_API_KEY is not set");`
			`}`
			`if (!process.env.OPENAI_API_KEY) {`
			`throw new Error("OPENAI_API_KEY is not set");`
			`}`
			`});`

Ni 2024-05-09 03:18:53 +08:00			`describe("Scraping website tests with a dataset", () => {`
			`it("Should scrape the website and prompt it against OpenAI", async () => {`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`let passedTests = 0;`
Ni 2024-05-09 03:18:53 +08:00			`const batchSize = 15; // Adjusted to comply with the rate limit of 15 per minute`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`const batchPromises = [];`
			`let totalTokens = 0;`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00
Nick: test suite init 2024-05-09 02:38:46 +08:00			`const startTime = new Date().getTime();`
			`const date = new Date();`
			const logsDir = `logs/${date.getMonth() + 1}-${date.getDate()}-${date.getFullYear()}`;

			let errorLogFileName = `${logsDir}/run.log_${new Date().toTimeString().split(' ')[0]}`;
			`const errorLog: WebsiteScrapeError[] = [];`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00
Nick: test suite init 2024-05-09 02:38:46 +08:00			`for (let i = 0; i < websitesData.length; i += batchSize) {`
Ni 2024-05-09 03:18:53 +08:00			`// Introducing delay to respect the rate limit of 15 requests per minute`
			`await new Promise(resolve => setTimeout(resolve, 10000));`

Nick: test suite init 2024-05-09 02:38:46 +08:00			`const batch = websitesData.slice(i, i + batchSize);`
			`const batchPromise = Promise.all(`
			`batch.map(async (websiteData: WebsiteData) => {`
			`try {`
Nick: test suite 2024-05-09 03:36:54 +08:00			`const scrapedContent = await request(TEST_URL \|\| "")`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`.post("/v0/scrape")`
			`.set("Content-Type", "application/json")`
			.set("Authorization", `Bearer ${process.env.TEST_API_KEY}`)
Update index.test.ts 2024-05-09 03:26:04 +08:00			`.send({ url: websiteData.website, pageOptions: { onlyMainContent: true } });`
Nick: test suite init 2024-05-09 02:38:46 +08:00
			`if (scrapedContent.statusCode !== 200) {`
Update index.test.ts 2024-05-09 04:23:53 +08:00			console.error(`Failed to scrape ${websiteData.website} ${scrapedContent.statusCode}`);
Update index.test.ts 2024-05-09 04:00:20 +08:00			`errorLog.push({`
			`website: websiteData.website,`
			`prompt: websiteData.prompt,`
			`expected_output: websiteData.expected_output,`
			`actual_output: "",`
Update index.test.ts 2024-05-09 04:23:53 +08:00			error: `Failed to scrape website. ${scrapedContent.statusCode} ${scrapedContent.body.error}`
Update index.test.ts 2024-05-09 04:00:20 +08:00			`});`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`return null;`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00			`}`

Nick: test suite init 2024-05-09 02:38:46 +08:00			`const openai = new OpenAI({`
			`apiKey: process.env.OPENAI_API_KEY,`
			`});`

			const prompt = `Based on this markdown extracted from a website html page, ${websiteData.prompt} Just say 'yes' or 'no' to the question.\nWebsite markdown: ${scrapedContent.body.data.markdown}\n`;

Update index.test.ts 2024-05-09 04:13:38 +08:00			`let msg = null;`
			`const maxRetries = 3;`
			`let attempts = 0;`
			`while (!msg && attempts < maxRetries) {`
			`try {`
			`msg = await openai.chat.completions.create({`
			`model: "gpt-4-turbo",`
			`max_tokens: 100,`
			`temperature: 0,`
			`messages: [`
			`{`
			`role: "user",`
			`content: prompt`
			`},`
			`],`
			`});`
			`} catch (error) {`
			console.error(`Attempt ${attempts + 1}: Failed to prompt for ${websiteData.website}, error: ${error}`);
			`attempts++;`
			`if (attempts < maxRetries) {`
			console.log(`Retrying... Attempt ${attempts + 1}`);
			`await new Promise(resolve => setTimeout(resolve, 2000)); // Wait for 2 seconds before retrying`
			`}`
			`}`
			`}`
Nick: test suite init 2024-05-09 02:38:46 +08:00
			`if (!msg) {`
Update index.test.ts 2024-05-09 04:13:38 +08:00			console.error(`Failed to prompt for ${websiteData.website} after ${maxRetries} attempts`);
Nick: test suite init 2024-05-09 02:38:46 +08:00			`errorLog.push({`
			`website: websiteData.website,`
			`prompt: websiteData.prompt,`
			`expected_output: websiteData.expected_output,`
			`actual_output: "",`
			`error: "Failed to prompt... model error."`
			`});`
			`return null;`
			`}`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00
Nick: test suite init 2024-05-09 02:38:46 +08:00			`const actualOutput = (msg.choices[0].message.content ?? "").toLowerCase()`
			`const expectedOutput = websiteData.expected_output.toLowerCase();`

			`const numTokens = numTokensFromString(prompt,"gpt-4") + numTokensFromString(actualOutput,"gpt-4");`

			`totalTokens += numTokens;`
			`if (actualOutput.includes(expectedOutput)) {`
			`passedTests++;`
			`} else {`
			`console.error(`
			`This website failed the test: ${websiteData.website}`
			`);`
			console.error(`Actual output: ${actualOutput}`);
			`errorLog.push({`
			`website: websiteData.website,`
			`prompt: websiteData.prompt,`
			`expected_output: websiteData.expected_output,`
			`actual_output: actualOutput,`
			`error: "Output mismatch"`
			`});`
			`}`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00
Nick: test suite init 2024-05-09 02:38:46 +08:00			`return {`
			`website: websiteData.website,`
			`prompt: websiteData.prompt,`
			`expectedOutput,`
			`actualOutput,`
			`};`
			`} catch (error) {`
			`console.error(`
			`Error processing ${websiteData.website}: ${error}`
			`);`
Update index.test.ts 2024-05-09 04:00:20 +08:00			`errorLog.push({`
			`website: websiteData.website,`
			`prompt: websiteData.prompt,`
			`expected_output: websiteData.expected_output,`
			`actual_output: "",`
Update index.test.ts 2024-05-09 04:23:53 +08:00			error: `Error processing ${websiteData.website}: ${error}`
Update index.test.ts 2024-05-09 04:00:20 +08:00			`});`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`return null;`
			`}`
			`})`
			`);`
			`batchPromises.push(batchPromise);`
			`}`
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00
Update index.test.ts 2024-05-09 03:26:04 +08:00			`(await Promise.all(batchPromises)).flat();`
			`const score = (passedTests / websitesData.length) * 100;`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`const endTime = new Date().getTime();`
			`const timeTaken = (endTime - startTime) / 1000;`
			console.log(`Score: ${score}%`);
			console.log(`Total tokens: ${totalTokens}`);

Update index.test.ts 2024-05-09 03:26:04 +08:00			`await logErrors(errorLog, timeTaken, totalTokens, score, websitesData.length);`
Ni 2024-05-09 03:18:53 +08:00
			`if (process.env.ENV === "local" && errorLog.length > 0) {`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`if (!fs.existsSync(logsDir)){`
			`fs.mkdirSync(logsDir, { recursive: true });`
			`}`
			`fs.writeFileSync(errorLogFileName, JSON.stringify(errorLog, null, 2));`
			`}`
Ni 2024-05-09 03:18:53 +08:00
[Test] Added integration tests suite solves #15 2024-05-04 04:23:25 +08:00
Nick: 2024-05-16 03:11:16 +08:00			`expect(score).toBeGreaterThanOrEqual(70);`
Ni 2024-05-09 03:18:53 +08:00			`}, 350000); // 150 seconds timeout`
Nick: test suite init 2024-05-09 02:38:46 +08:00			`});`
			`});`