# all_possible_config.toml

  ################################################################################
  # Global Application Settings (AppConfig)
  ################################################################################
  [app]
  # Global project name (optional)
  project_name = ""
  # Maximum number of documents per user (default from code: 100, sample: 10000)
  default_max_documents_per_user = 100
  # Maximum number of chunks per user (default: 10000)
  default_max_chunks_per_user = 10_000
  # Maximum number of collections per user (default: 5)
  default_max_collections_per_user = 5
  # Maximum upload size in bytes (default: 2000000, roughly 2 MB)
  default_max_upload_size = 2_000_000
  # LLM used for user-facing output (quality)
  quality_llm = ""
  # LLM used for fast internal operations
  fast_llm = ""
  # LLM used for visual inputs
  vlm = ""
  # LLM used for audio transcription
  audio_lm = ""
  # A mapping from file extension to maximum upload size
  # NOTE(review): values are presumably in bytes, like default_max_upload_size
  # in [app] - confirm against the consumer.
  [app.max_upload_size_by_type]
  txt = 2_000_000
  md = 2_000_000
  tsv = 2_000_000
  csv = 5_000_000
  xml = 2_000_000
  html = 5_000_000
  doc = 10_000_000
  docx = 10_000_000
  ppt = 20_000_000
  pptx = 20_000_000
  xls = 10_000_000
  xlsx = 10_000_000
  odt = 5_000_000
  pdf = 30_000_000
  eml = 5_000_000
  msg = 5_000_000
  p7s = 5_000_000
  bmp = 5_000_000
  heic = 5_000_000
  jpeg = 5_000_000
  jpg = 5_000_000
  png = 5_000_000
  tiff = 5_000_000
  epub = 10_000_000
  rtf = 5_000_000
  rst = 5_000_000
  org = 5_000_000
  ################################################################################
  # Agent Settings (Custom configuration used by your system)
  ################################################################################
  [agent]
  # Names of the static and dynamic RAG agent prompts
  rag_agent_static_prompt = "static_rag_agent"
  rag_agent_dynamic_prompt = "dynamic_rag_agent"
  # Tool names listed for the agent
  tools = ["search_file_knowledge", "content"]
  ################################################################################
  # Authentication Settings (AuthConfig)
  ################################################################################
  [auth]
  provider = "r2r"
  # (Optional secret key for signing tokens)
  secret_key = ""
  # Lifetime for access tokens (in minutes)
  # NOTE(review): 60000 minutes is roughly 41.7 days, which is longer than the
  # 7-day refresh token lifetime below - confirm this is intended.
  access_token_lifetime_in_minutes = 60_000
  # Lifetime for refresh tokens (in days)
  refresh_token_lifetime_in_days = 7
  # Whether authentication is required
  require_authentication = false
  # Whether email verification is required
  require_email_verification = false
  # Default admin credentials
  # The password below is a placeholder; replace it before any real deployment.
  default_admin_email = "admin@example.com"
  default_admin_password = "change_me_immediately"
  ################################################################################
  # Completion / LLM Generation Settings (CompletionConfig and nested GenerationConfig)
  ################################################################################
  [completion]
  provider = "r2r"
  # Maximum number of concurrent requests allowed
  concurrent_request_limit = 256

  [completion.generation_config]
  # Generation parameters
  temperature = 0.1
  top_p = 1.0
  max_tokens_to_sample = 4096
  stream = false
  # Additional generation kwargs (empty table by default)
  add_generation_kwargs = {}
  ################################################################################
  # Cryptography Settings (CryptoConfig)
  ################################################################################
  [crypto]
  provider = "bcrypt"
  ################################################################################
  # Database Settings (DatabaseConfig and related nested settings)
  ################################################################################
  [database]
  provider = "postgres"
  # Connection settings
  user = ""
  password = ""
  host = "localhost"
  port = 5432
  db_name = ""
  project_name = ""
  # Default collection metadata
  default_collection_name = "Default"
  default_collection_description = "Your default collection."
  # Prompt names used for collection summaries
  collection_summary_system_prompt = "system"
  collection_summary_prompt = "collection_summary"
  enable_fts = false
  batch_size = 1
  kg_store_path = ""
  # PostgreSQL tuning settings
  # NOTE(review): the memory/WAL values appear to be expressed in PostgreSQL's
  # native units for each parameter (8 kB pages, kB, or MB) rather than bytes -
  # confirm how the consumer applies them before changing any value.
  [database.postgres_configuration_settings]
  checkpoint_completion_target = 0.9
  default_statistics_target = 100
  effective_io_concurrency = 1
  effective_cache_size = 524_288
  huge_pages = "try"
  maintenance_work_mem = 65_536
  max_connections = 256
  max_parallel_workers_per_gather = 2
  max_parallel_workers = 8
  max_parallel_maintenance_workers = 2
  max_wal_size = 1024
  max_worker_processes = 8
  min_wal_size = 80
  shared_buffers = 16_384
  statement_cache_size = 100
  random_page_cost = 4.0
  wal_buffers = 512
  work_mem = 4096
  # Graph creation settings
  [database.graph_creation_settings]
  graph_entity_description_prompt = "graph_entity_description"
  graph_extraction_prompt = "graph_extraction"
  # Empty lists: no entity or relation types are listed here
  entity_types = []
  relation_types = []
  automatic_deduplication = true

  # Graph enrichment settings
  [database.graph_enrichment_settings]
  graph_communities_prompt = "graph_communities"

  # (Optional) Graph search settings - add fields as needed
  [database.graph_search_settings]
  # e.g., search_mode = "default"
  # Rate limiting settings
  [database.limits]
  global_per_min = 60
  route_per_min = 20
  monthly_limit = 10_000

  # Route-specific limits (empty by default)
  [database.route_limits]
  # e.g., "/api/search" = { global_per_min = 30, route_per_min = 10, monthly_limit = 5000 }

  # User-specific limits (empty by default)
  [database.user_limits]
  # e.g., "user_uuid_here" = { global_per_min = 20, route_per_min = 5, monthly_limit = 2000 }
  ################################################################################
  # Embedding Settings (EmbeddingConfig)
  ################################################################################
  [embedding]
  provider = "litellm"
  base_model = "openai/text-embedding-3-small"
  base_dimension = 512
  # Optional reranking settings (leave empty if not used)
  rerank_model = ""
  rerank_url = ""
  batch_size = 1
  # Provide prefix overrides here if needed
  prefixes = {}
  add_title_as_prefix = true
  concurrent_request_limit = 256
  # Retry / backoff settings
  max_retries = 3
  initial_backoff = 1.0
  max_backoff = 64.0
  # Deprecated fields (if still used)
  rerank_dimension = 0
  rerank_transformer_type = ""

  # Vector quantization settings for embeddings
  [embedding.quantization_settings]
  quantization_type = "FP32"
  # (Additional quantization parameters can be added here)
  ################################################################################
  # Completion Embedding Settings
  # (Usually mirrors the embedding settings; override if needed.)
  ################################################################################
  [completion_embedding]
  provider = "litellm"
  base_model = "openai/text-embedding-3-small"
  base_dimension = 512
  batch_size = 1
  add_title_as_prefix = true
  concurrent_request_limit = 256
  ################################################################################
  # File Storage Settings
  ################################################################################
  [file]
  provider = "postgres"
  ################################################################################
  # Ingestion Settings (IngestionConfig and nested settings)
  ################################################################################
  [ingestion]
  provider = "r2r"
  excluded_parsers = ["mp4"]
  chunking_strategy = "recursive"
  chunk_size = 1024
  # Extra field handled by extra_fields - not defined explicitly in IngestionConfig:
  chunk_overlap = 512
  automatic_extraction = true
  # Audio transcription model
  audio_transcription_model = ""
  # Document summary settings
  skip_document_summary = false
  document_summary_system_prompt = "system"
  document_summary_task_prompt = "summary"
  document_summary_max_length = 100_000
  chunks_for_document_summary = 128
  document_summary_model = ""
  parser_overrides = {}

  # Chunk enrichment settings
  [ingestion.chunk_enrichment_settings]
  chunk_enrichment_prompt = "chunk_enrichment"
  enable_chunk_enrichment = false
  n_chunks = 2

  # Extra parsers (mapping from file type to parser name)
  [ingestion.extra_parsers]
  pdf = "zerox"
  ################################################################################
  # Logging Settings
  ################################################################################
  [logging]
  provider = "r2r"
  # Table names used for log storage
  log_table = "logs"
  log_info_table = "log_info"
  ################################################################################
  # Orchestration Settings (OrchestrationConfig)
  ################################################################################
  [orchestration]
  provider = "simple"
  max_runs = 2048
  # Concurrency limits
  kg_creation_concurrency_limit = 32
  ingestion_concurrency_limit = 16
  kg_concurrency_limit = 4
  ################################################################################
  # Prompt Settings
  ################################################################################
  [prompt]
  provider = "r2r"
  ################################################################################
  # Email Settings (EmailConfig)
  ################################################################################
  [email]
  # Supported providers: "smtp", "console", "sendgrid", etc.
  provider = "console"
  # SMTP settings
  smtp_server = ""
  smtp_port = 587
  smtp_username = ""
  smtp_password = ""
  from_email = ""
  use_tls = true
  # Provider API keys (leave empty if not used)
  sendgrid_api_key = ""
  mailersend_api_key = ""
  # Email template identifiers
  verify_email_template_id = ""
  reset_password_template_id = ""
  password_changed_template_id = ""
  frontend_url = ""
  sender_name = ""