-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path.env.example
More file actions
133 lines (112 loc) · 3.26 KB
/
.env.example
File metadata and controls
133 lines (112 loc) · 3.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
# System Configuration
# Development defaults. Copy this file to .env and override the values per environment.
ENVIRONMENT=development
LOG_LEVEL=INFO
# NOTE(review): DEBUG=true is a development setting; presumably it should be false outside development — confirm.
DEBUG=true
# API Configuration
# 0.0.0.0 listens on every network interface; use 127.0.0.1 to accept local connections only.
API_HOST=0.0.0.0
API_PORT=8000
# NOTE(review): if the server is uvicorn, auto-reload and multiple workers cannot be combined —
# confirm which of the two settings below takes effect when both are set.
API_WORKERS=4
API_RELOAD=true
# MongoDB Configuration
# macOS install via Homebrew: brew tap mongodb/brew && brew install mongodb-community
# The URI below has no credentials and points at a local instance.
MONGODB_URI=mongodb://localhost:27017
MONGODB_DATABASE=graphbuilder_rag
# Connection pool bounds; the minimum must not exceed the maximum.
MONGODB_MAX_POOL_SIZE=50
MONGODB_MIN_POOL_SIZE=10
# Neo4j Configuration
# macOS install via Homebrew: brew install neo4j
NEO4J_URI=bolt://localhost:7687
NEO4J_USER=neo4j
# Placeholder only: replace with the password of your Neo4j instance and never commit the real value.
NEO4J_PASSWORD=password
NEO4J_DATABASE=neo4j
# NOTE(review): presumably seconds (3600 = 1 hour) — confirm against the settings loader.
NEO4J_MAX_CONNECTION_LIFETIME=3600
NEO4J_MAX_CONNECTION_POOL_SIZE=50
# Redis Configuration
# macOS install via Homebrew: brew install redis
# The trailing /0 selects Redis logical database 0. CELERY_BROKER_URL in this file
# uses the same database, so application keys and broker keys share one keyspace.
REDIS_URI=redis://localhost:6379/0
REDIS_MAX_CONNECTIONS=50
# Groq Cloud API Configuration
# Create an API key at https://console.groq.com/keys and replace the placeholder below.
# Never commit the real key.
GROQ_API_KEY=your_groq_api_key_here
GROQ_MODEL=llama-3.3-70b-versatile
# NOTE(review): timeout is presumably in seconds — confirm against the settings loader.
GROQ_TIMEOUT=30
GROQ_MAX_RETRIES=3
GROQ_MAX_TOKENS=4096
GROQ_TEMPERATURE=0.2
# Embedding Configuration
EMBEDDING_MODEL=BAAI/bge-small-en-v1.5
# Must equal the output vector size of EMBEDDING_MODEL; update both together when changing the model.
EMBEDDING_DIMENSION=384
EMBEDDING_BATCH_SIZE=32
# NOTE(review): presumably a device string such as cpu or cuda — confirm the accepted values.
EMBEDDING_DEVICE=cpu
# FAISS Configuration
FAISS_INDEX_TYPE=IndexFlatIP
# NOTE(review): this path differs from STORAGE_FAISS_INDEX_PATH (./data/faiss/index.faiss)
# defined later in this file — confirm which variable the code actually reads.
FAISS_INDEX_PATH=./data/faiss_index
# NOTE(review): nprobe/nlist are IVF-style index parameters; presumably they are ignored
# while FAISS_INDEX_TYPE is a flat index — confirm.
FAISS_NPROBE=10
FAISS_NLIST=100
# Extraction Configuration
# NOTE(review): presumably these token/temperature values override GROQ_MAX_TOKENS and
# GROQ_TEMPERATURE for extraction calls — confirm.
EXTRACTION_MAX_TOKENS=2048
EXTRACTION_TEMPERATURE=0.1
# Lower than VALIDATION_MIN_CONFIDENCE (0.7) in this file.
EXTRACTION_MIN_CONFIDENCE=0.5
EXTRACTION_BATCH_SIZE=10
# Validation Configuration
VALIDATION_MIN_CONFIDENCE=0.7
# NOTE(review): timeout is presumably in seconds — confirm against the settings loader.
VALIDATION_EXTERNAL_TIMEOUT=10
VALIDATION_PARALLEL_CHECKS=5
# Bootstrap Validation (strict external verification for the first 1000 triples)
# The threshold below is the triple count that the "first 1000" refers to; keep the two in sync.
VALIDATION_BOOTSTRAP_THRESHOLD=1000
# Stricter than the regular VALIDATION_MIN_CONFIDENCE (0.7).
VALIDATION_BOOTSTRAP_MIN_CONFIDENCE=0.8
VALIDATION_BOOTSTRAP_REQUIRE_WIKIPEDIA=true
VALIDATION_BOOTSTRAP_REQUIRE_WIKIDATA=true
# Entity Resolution Configuration
# NOTE(review): presumably a similarity score in [0, 1] above which two entities are merged — confirm.
ENTITY_SIMILARITY_THRESHOLD=0.85
# NOTE(review): presumably the number of nearest neighbours fetched from FAISS per entity — confirm.
ENTITY_FAISS_TOP_K=10
# Fusion Configuration
# NOTE(review): the exact meaning of the conflict threshold is not defined in this file — confirm against the fusion code.
FUSION_BATCH_SIZE=100
FUSION_CONFLICT_THRESHOLD=0.8
# Retrieval Configuration
RETRIEVAL_MAX_CHUNKS=10
RETRIEVAL_GRAPH_DEPTH=2
RETRIEVAL_MIN_SIMILARITY=0.5
# The two weights below sum to 1.0.
# NOTE(review): presumably they must keep summing to 1.0 when tuned — confirm whether the code normalises them.
RETRIEVAL_GRAPH_WEIGHT=0.6
RETRIEVAL_SEMANTIC_WEIGHT=0.4
# Query Configuration
# These two values equal GROQ_MAX_TOKENS and GROQ_TEMPERATURE in this file.
# NOTE(review): presumably per-query overrides of the GROQ_* defaults — confirm.
QUERY_MAX_TOKENS=4096
QUERY_TEMPERATURE=0.2
# NOTE(review): presumably seconds; this is twice GROQ_TIMEOUT (30) — confirm how the two timeouts interact.
QUERY_TIMEOUT=60
# GraphVerify Configuration
# NOTE(review): threshold semantics are not defined in this file; presumably scores in [0, 1] — confirm.
GRAPHVERIFY_CONTRADICTION_THRESHOLD=0.7
GRAPHVERIFY_SUPPORT_THRESHOLD=0.8
GRAPHVERIFY_MAX_EDGES_CHECK=50
# Agent Configuration
# Interval values are in seconds. Explanatory comments sit on their own lines because
# some env-file loaders (for example `docker run --env-file`) only recognise comments
# at the start of a line and would read a trailing "# ..." as part of the value.
# 1 hour
AGENT_REVERIFY_INTERVAL_SECONDS=3600
# 2 hours
AGENT_CONFLICT_RESOLUTION_INTERVAL_SECONDS=7200
# 24 hours
AGENT_SCHEMA_SUGGESTION_INTERVAL_SECONDS=86400
AGENT_REVERIFY_BATCH_SIZE=100
AGENT_CONFLICT_BATCH_SIZE=50
AGENT_MIN_PREDICATE_FREQUENCY=5
AGENT_MAX_CONCURRENT=3
# Celery Configuration
# The broker uses Redis database 0, the same database as REDIS_URI in this file;
# results are stored separately in database 1.
CELERY_BROKER_URL=redis://localhost:6379/0
CELERY_RESULT_BACKEND=redis://localhost:6379/1
CELERY_TASK_SERIALIZER=json
CELERY_RESULT_SERIALIZER=json
# Written as a JSON array.
# NOTE(review): presumably the settings loader JSON-decodes list values — confirm.
CELERY_ACCEPT_CONTENT=["json"]
CELERY_TIMEZONE=UTC
CELERY_TASK_TRACK_STARTED=true
# Limits are in seconds. The soft limit (3000) is below the hard limit (3600), leaving
# a task 600 seconds to clean up after the soft limit fires.
CELERY_TASK_TIME_LIMIT=3600
CELERY_TASK_SOFT_TIME_LIMIT=3000
# Monitoring Configuration
# NOTE(review): 9090 is also the default port of a Prometheus server; presumably this is the
# port the application exposes its metrics on — confirm, and change it if both run on one host.
PROMETHEUS_PORT=9090
# Left empty in this example.
# NOTE(review): presumably an empty DSN disables Sentry reporting — confirm.
SENTRY_DSN=
METRICS_ENABLED=true
# Storage Configuration
STORAGE_TEMP_DIR=./data/temp
# NOTE(review): FAISS_INDEX_PATH earlier in this file points at ./data/faiss_index instead —
# confirm which of the two variables the code actually reads.
STORAGE_FAISS_INDEX_PATH=./data/faiss/index.faiss
# NOTE(review): the .pkl extension suggests a pickle file; unpickling untrusted data is unsafe —
# confirm this file is only ever written by the application itself.
STORAGE_CHUNK_MAP_PATH=./data/faiss/chunk_map.pkl
# 104857600 = 100 * 1024 * 1024 (100 MiB, if the unit is bytes — TODO confirm).
STORAGE_MAX_FILE_SIZE=104857600
# Written as a JSON array, unlike CORS_METHODS in this file, which is comma-separated.
STORAGE_ALLOWED_EXTENSIONS=["pdf","html","csv","json","txt"]
# Retry Configuration
# NOTE(review): presumably exponential backoff (delay multiplied by the factor per attempt,
# capped at RETRY_MAX_DELAY seconds) — confirm formula and units against the retry code.
RETRY_MAX_ATTEMPTS=3
RETRY_BACKOFF_FACTOR=2
RETRY_MAX_DELAY=60
# Security Configuration
API_KEY_HEADER=X-API-Key
# The "*" wildcards below allow every origin and every request header. That is convenient
# for local development; restrict them to known origins/headers before deploying.
CORS_ORIGINS=*
# Comma-separated list, unlike the JSON-array values used elsewhere in this file
# (CELERY_ACCEPT_CONTENT, STORAGE_ALLOWED_EXTENSIONS).
CORS_METHODS=GET,POST,PUT,DELETE
CORS_HEADERS=*