mirror of
https://github.com/mendableai/firecrawl.git
synced 2024-11-16 03:32:22 +08:00
Removed .env.example, improved docs and docker compose envs
This commit is contained in:
parent
b32057ec89
commit
18480b2005
15
.env.example
15
.env.example
|
@ -1,15 +0,0 @@
|
||||||
NUM_WORKERS_PER_QUEUE=8
|
|
||||||
OPENAI_API_KEY=
|
|
||||||
SLACK_WEBHOOK_URL=
|
|
||||||
SERPER_API_KEY=
|
|
||||||
LLAMAPARSE_API_KEY=
|
|
||||||
LOGTAIL_KEY=
|
|
||||||
BULL_AUTH_KEY=
|
|
||||||
TEST_API_KEY=
|
|
||||||
POSTHOG_API_KEY=
|
|
||||||
POSTHOG_HOST=
|
|
||||||
SUPABASE_ANON_TOKEN=
|
|
||||||
SUPABASE_URL=
|
|
||||||
SUPABASE_SERVICE_TOKEN=
|
|
||||||
SCRAPING_BEE_API_KEY=
|
|
||||||
USE_DB_AUTHENTICATION=false
|
|
31
SELF_HOST.md
31
SELF_HOST.md
|
@ -1,36 +1,17 @@
|
||||||
# Self-hosting Firecrawl
|
# Self-hosting Firecrawl
|
||||||
|
|
||||||
First, clone this repository and copy `.env.example` to `.env`.
|
## Getting Started
|
||||||
|
|
||||||
|
First, clone this repository and copy the example env file from api folder `.env.example` to `.env`.
|
||||||
```bash
|
```bash
|
||||||
git clone https://github.com/mendableai/firecrawl.git
|
git clone https://github.com/mendableai/firecrawl.git
|
||||||
cd firecrawl
|
cd firecrawl
|
||||||
cp .env.example .env
|
cp ./apps/api/.env.example ./.env
|
||||||
```
|
```
|
||||||
|
|
||||||
Then, edit the .env.example to have the correct values for your environment.
|
For running the simplest version of FireCrawl, edit the `USE_DB_AUTHENTICATION` on `.env` to not use the database authentication.
|
||||||
```
|
```yml
|
||||||
## To turn on DB authentication, you need to set up supabase.
|
|
||||||
USE_DB_AUTHENTICATION=false
|
USE_DB_AUTHENTICATION=false
|
||||||
|
|
||||||
# ===== Optional ENVS ======
|
|
||||||
|
|
||||||
# Supabase Setup (used to support DB authentication, advanced logging, etc.)
|
|
||||||
SUPABASE_ANON_TOKEN=
|
|
||||||
SUPABASE_URL=
|
|
||||||
SUPABASE_SERVICE_TOKEN=
|
|
||||||
|
|
||||||
# Other Optionals
|
|
||||||
TEST_API_KEY= # use if you've set up authentication and want to test with a real API key
|
|
||||||
SCRAPING_BEE_API_KEY= #Set if you'd like to use scraping Be to handle JS blocking
|
|
||||||
OPENAI_API_KEY= # add for LLM dependednt features (image alt generation, etc.)
|
|
||||||
BULL_AUTH_KEY= #
|
|
||||||
LOGTAIL_KEY= # Use if you're configuring basic logging with logtail
|
|
||||||
PLAYWRIGHT_MICROSERVICE_URL= # set if you'd like to run a playwright fallback
|
|
||||||
LLAMAPARSE_API_KEY= #Set if you have a llamaparse key you'd like to use to parse pdfs
|
|
||||||
SERPER_API_KEY= #Set if you have a serper key you'd like to use as a search api
|
|
||||||
SLACK_WEBHOOK_URL= # set if you'd like to send slack server health status messages
|
|
||||||
POSTHOG_API_KEY= # set if you'd like to send posthog events like job logs
|
|
||||||
POSTHOG_HOST= # set if you'd like to send posthog events like job logs
|
|
||||||
```
|
```
|
||||||
|
|
||||||
Once that's complete, you can simply run the following commands to get started:
|
Once that's complete, you can simply run the following commands to get started:
|
||||||
|
|
|
@ -3,6 +3,7 @@ NUM_WORKERS_PER_QUEUE=8
|
||||||
PORT=3002
|
PORT=3002
|
||||||
HOST=0.0.0.0
|
HOST=0.0.0.0
|
||||||
REDIS_URL=redis://localhost:6379
|
REDIS_URL=redis://localhost:6379
|
||||||
|
PLAYWRIGHT_MICROSERVICE_URL=http://playwright-service:3000
|
||||||
|
|
||||||
## To turn on DB authentication, you need to set up supabase.
|
## To turn on DB authentication, you need to set up supabase.
|
||||||
USE_DB_AUTHENTICATION=true
|
USE_DB_AUTHENTICATION=true
|
||||||
|
@ -20,7 +21,6 @@ SCRAPING_BEE_API_KEY= #Set if you'd like to use scraping Be to handle JS blockin
|
||||||
OPENAI_API_KEY= # add for LLM dependednt features (image alt generation, etc.)
|
OPENAI_API_KEY= # add for LLM dependednt features (image alt generation, etc.)
|
||||||
BULL_AUTH_KEY= #
|
BULL_AUTH_KEY= #
|
||||||
LOGTAIL_KEY= # Use if you're configuring basic logging with logtail
|
LOGTAIL_KEY= # Use if you're configuring basic logging with logtail
|
||||||
PLAYWRIGHT_MICROSERVICE_URL= # set if you'd like to run a playwright fallback
|
|
||||||
LLAMAPARSE_API_KEY= #Set if you have a llamaparse key you'd like to use to parse pdfs
|
LLAMAPARSE_API_KEY= #Set if you have a llamaparse key you'd like to use to parse pdfs
|
||||||
SERPER_API_KEY= #Set if you have a serper key you'd like to use as a search api
|
SERPER_API_KEY= #Set if you have a serper key you'd like to use as a search api
|
||||||
SLACK_WEBHOOK_URL= # set if you'd like to send slack server health status messages
|
SLACK_WEBHOOK_URL= # set if you'd like to send slack server health status messages
|
||||||
|
|
|
@ -12,10 +12,10 @@ services:
|
||||||
api:
|
api:
|
||||||
build: apps/api
|
build: apps/api
|
||||||
environment:
|
environment:
|
||||||
- REDIS_URL=redis://redis:6379
|
- REDIS_URL=${REDIS_URL}
|
||||||
- PLAYWRIGHT_SERVICE_URL=http://playwright-service:3000
|
- PLAYWRIGHT_MICROSERVICE_URL=${PLAYWRIGHT_MICROSERVICE_URL}
|
||||||
- USE_DB_AUTHENTICATION=${USE_DB_AUTHENTICATION}
|
- USE_DB_AUTHENTICATION=${USE_DB_AUTHENTICATION}
|
||||||
- PORT=3002
|
- PORT=${PORT}
|
||||||
- NUM_WORKERS_PER_QUEUE=${NUM_WORKERS_PER_QUEUE}
|
- NUM_WORKERS_PER_QUEUE=${NUM_WORKERS_PER_QUEUE}
|
||||||
- OPENAI_API_KEY=${OPENAI_API_KEY}
|
- OPENAI_API_KEY=${OPENAI_API_KEY}
|
||||||
- SLACK_WEBHOOK_URL=${SLACK_WEBHOOK_URL}
|
- SLACK_WEBHOOK_URL=${SLACK_WEBHOOK_URL}
|
||||||
|
@ -30,7 +30,7 @@ services:
|
||||||
- SUPABASE_URL=${SUPABASE_URL}
|
- SUPABASE_URL=${SUPABASE_URL}
|
||||||
- SUPABASE_SERVICE_TOKEN=${SUPABASE_SERVICE_TOKEN}
|
- SUPABASE_SERVICE_TOKEN=${SUPABASE_SERVICE_TOKEN}
|
||||||
- SCRAPING_BEE_API_KEY=${SCRAPING_BEE_API_KEY}
|
- SCRAPING_BEE_API_KEY=${SCRAPING_BEE_API_KEY}
|
||||||
- HOST=0.0.0.0
|
- HOST=${HOST}
|
||||||
depends_on:
|
depends_on:
|
||||||
- redis
|
- redis
|
||||||
- playwright-service
|
- playwright-service
|
||||||
|
@ -41,10 +41,10 @@ services:
|
||||||
worker:
|
worker:
|
||||||
build: apps/api
|
build: apps/api
|
||||||
environment:
|
environment:
|
||||||
- REDIS_URL=redis://redis:6379
|
- REDIS_URL=${REDIS_URL}
|
||||||
- PLAYWRIGHT_SERVICE_URL=http://playwright-service:3000
|
- PLAYWRIGHT_MICROSERVICE_URL=${PLAYWRIGHT_MICROSERVICE_URL}
|
||||||
- USE_DB_AUTHENTICATION=${USE_DB_AUTHENTICATION}
|
- USE_DB_AUTHENTICATION=${USE_DB_AUTHENTICATION}
|
||||||
- PORT=3002
|
- PORT=${PORT}
|
||||||
- NUM_WORKERS_PER_QUEUE=${NUM_WORKERS_PER_QUEUE}
|
- NUM_WORKERS_PER_QUEUE=${NUM_WORKERS_PER_QUEUE}
|
||||||
- OPENAI_API_KEY=${OPENAI_API_KEY}
|
- OPENAI_API_KEY=${OPENAI_API_KEY}
|
||||||
- SLACK_WEBHOOK_URL=${SLACK_WEBHOOK_URL}
|
- SLACK_WEBHOOK_URL=${SLACK_WEBHOOK_URL}
|
||||||
|
@ -59,6 +59,8 @@ services:
|
||||||
- SUPABASE_URL=${SUPABASE_URL}
|
- SUPABASE_URL=${SUPABASE_URL}
|
||||||
- SUPABASE_SERVICE_TOKEN=${SUPABASE_SERVICE_TOKEN}
|
- SUPABASE_SERVICE_TOKEN=${SUPABASE_SERVICE_TOKEN}
|
||||||
- SCRAPING_BEE_API_KEY=${SCRAPING_BEE_API_KEY}
|
- SCRAPING_BEE_API_KEY=${SCRAPING_BEE_API_KEY}
|
||||||
|
- HOST=${HOST}
|
||||||
depends_on:
|
depends_on:
|
||||||
- redis
|
- redis
|
||||||
- playwright-service
|
- playwright-service
|
||||||
|
- api
|
||||||
|
|
Loading…
Reference in New Issue
Block a user