mirror of
https://github.com/Dvorinka/Devour.git
synced 2026-06-03 20:13:03 +00:00
52 lines
883 B
YAML
52 lines
883 B
YAML
# Devour Configuration
# Version marker for this configuration file.
version: 1

# Storage paths
# All three directories are relative paths under ./devour_data.
storage:
  docs_dir: ./devour_data/docs
  index_dir: ./devour_data/index
  metadata_dir: ./devour_data/metadata

# Embedding settings
embeddings:
  provider: openai
  model: text-embedding-3-small
  # NOTE(review): should match the output vector size of the model above;
  # confirm if the model is changed.
  dimensions: 1536
  # Placeholder, not a literal key. Presumably substituted from the
  # OPENAI_API_KEY environment variable when the config is loaded (confirm).
  # Quoted so the value is always read as a string.
  api_key: "${OPENAI_API_KEY}"
  batch_size: 100

# Vector database
vector_db:
  type: chromem
  persist: true
  similarity_metric: cosine

# Scraping settings
scraper:
  user_agent: "Devour/1.0"
  # Duration values here (30s, 500ms) are plain strings with a unit suffix.
  timeout: 30s
  retry_count: 3
  concurrency: 10
  rate_limit: 500ms
  max_depth: 3
  cache_dir: ./devour_data/cache

# Scheduler
scheduler:
  enabled: true
  # Duration string with a unit suffix (72h = 3 days).
  interval: 72h
  check_method: hash

# Server settings
server:
  mode: local
  port: 8080
  host: localhost

# Sources (add your own)
# The list is empty by default. To add a source, replace `[]` with entries
# shaped like the commented example below.
sources: []
#   - name: example-docs
#     type: url
#     url: https://docs.example.com
#     include: ["**/*.md", "**/*.html"]