payman / config /config.yaml
satyamdev404's picture
Upload 31 files
e0aa230 verified
api_keys:
gemini_api_key: ""
openai_api_key: ""
pinecone_api_key: ""
backup:
enabled: false
include_configuration: true
include_documents: true
include_logs: false
include_vector_db: true
interval_hours: 24
retention_days: 30
storage_path: backups/
customization:
custom_css: ""
default_query_examples:
- What is the main topic of the uploaded documents?
- Can you summarize the key points?
- What are the important findings mentioned?
favicon_url: ""
footer_text: ""
help_text: ""
logo_url: ""
welcome_message: ""
deployment:
auto_scale: true
development:
debug_mode: true
enable_profiling: true
log_level: DEBUG
enable_metrics: true
graceful_shutdown_timeout: 30
health_check_interval: 60
health_endpoint: /health
max_cpu_percent: 80
max_disk_usage_mb: 5120
max_memory_mb: 2048
metrics_endpoint: /metrics
platform: huggingface
production:
debug_mode: false
enable_profiling: false
log_level: WARNING
staging:
debug_mode: true
enable_profiling: true
log_level: INFO
development:
debug_mode: false
enable_test_endpoints: false
mock_apis: false
profiling_enabled: false
save_intermediate_results: false
test_data_path: data/test_data
test_mode: false
document_processing:
chunk_overlap: 200
chunk_size: 1000
detect_language: true
extract_images: false
extract_metadata: true
max_file_size_mb: 50
min_chunk_size: 100
preserve_formatting: true
supported_formats:
- .pdf
- .docx
- .doc
- .csv
- .xlsx
- .xls
- .pptx
- .txt
- .md
supported_languages:
- en
- es
- fr
- de
- it
- pt
- ru
- zh
- ja
- ko
embedding:
batch_size: 1
cache_embeddings: true
fallback_model: sentence-transformers
max_retries: 3
max_tokens: 8192
model: gemini-embedding-exp-03-07
output_dimensionality: 3072
rate_limit_delay: 1.0
retry_delay: 2
task_type: RETRIEVAL_DOCUMENT
title: ""
features:
async_processing: false
audio_processing: false
auto_summarization: false
batch_processing: true
content_recommendation: false
document_upload: true
image_processing: false
live_search: true
multi_language_support: false
query_processing: true
question_generation: false
real_time_updates: false
url_processing: true
video_processing: false
integrations:
aws_s3:
access_key: ""
bucket_name: ""
enabled: false
secret_key: ""
google_analytics:
enabled: false
tracking_id: ""
huggingface:
api_key: ""
enabled: false
models: []
postgresql:
connection_string: ""
enabled: false
sentry:
dsn: ""
enabled: false
logging:
backup_count: 5
component_levels:
document_processing: INFO
embedding: INFO
rag: INFO
ui: INFO
url_processing: INFO
vector_db: INFO
file: logs/rag_ai.log
format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
level: INFO
max_file_size_mb: 10
notifications:
email:
enabled: false
from_address: ""
password: ""
smtp_port: 587
smtp_server: ""
to_addresses: []
username: ""
enabled: false
webhook:
enabled: false
events:
- error
- system_health
- processing_complete
url: ""
performance:
batch_processing_size: 10
cache_ttl: 3600
enable_caching: true
enable_parallel_processing: true
garbage_collection_interval: 300
max_concurrent_requests: 5
max_memory_usage_mb: 1024
max_worker_threads: 4
request_timeout: 30
rag:
confidence_threshold: 0.3
context_window_overlap: 0.1
deduplicate_results: true
enable_query_caching: true
enable_query_expansion: true
fallback_model: gpt-3.5-turbo
include_sources: true
max_context_length: 8000
max_response_length: 2000
max_tokens: 500
model: gemini-2.5-flash-preview-05-20
query_cache_ttl: 7200
rerank_results: true
similarity_threshold: 0.4
temperature: 0.7
top_k: 10
top_p: 0.9
live_search:
enabled: true
enable_caching: true
include_raw_content: true
max_results: 10
search_depth: basic
time_range: month
query_router:
confidence_threshold: 0.5
enable_hybrid_search: true
live_weight: 0.4
local_weight: 0.6
max_hybrid_results: 10
security:
allowed_domains: []
blocked_content_types:
- executable
- script
blocked_domains:
- localhost
- 127.0.0.1
- 0.0.0.0
enable_content_filtering: true
enable_rate_limiting: true
max_text_length: 1000000
max_upload_size_mb: 100
requests_per_hour: 1000
requests_per_minute: 60
sanitize_input: true
ui:
demo_mode: false
description:
Upload documents or provide URLs to build your knowledge base, then
ask questions!
features:
analytics_dashboard: true
confidence_display: true
file_upload: true
knowledge_base_management: true
query_interface: true
source_display: true
system_health_monitoring: true
url_input: true
max_file_uploads: 10
max_query_length: 1000
port: 7860
sample_documents: []
server_name: 0.0.0.0
share: false
show_advanced_options: true
theme: default
title: "\xF0\u0178\xA7\_ AI Embedded Knowledge Agent"
url_processing:
allowed_domains: []
blocked_domains:
- localhost
- 127.0.0.1
- 0.0.0.0
delay_between_requests: 0.5
extract_main_content: true
follow_links: true
max_depth: 1
max_pages: 10
remove_ads: true
remove_navigation: true
requests_per_second: 2
respect_robots_txt: true
timeout: 10
user_agent: RAG-AI-Bot/1.0
vector_db:
batch_size: 100
create_index_if_not_exists: true
dimension: 3072
environment: us-east-1
fallback_provider: memory
index_name: rag-ai-index
max_retries: 3
metric: cosine
provider: pinecone
retry_delay: 1