# File: r2r_azure.toml
  1. # A config which overrides all instances of `openai` with `azure` in the `r2r.toml` config
  2. [agent]
  3. [agent.generation_config]
  4. model = "azure/gpt-4o"
  5. [completion]
  6. [completion.generation_config]
  7. model = "azure/gpt-4o"
  8. # KG settings
  9. batch_size = 256
  10. [database.graph_creation_settings]
  11. generation_config = { model = "azure/gpt-4o-mini" }
  12. [database.graph_entity_deduplication_settings]
  13. generation_config = { model = "azure/gpt-4o-mini" }
  14. [database.graph_enrichment_settings]
  15. generation_config = { model = "azure/gpt-4o-mini" }
  16. [database.graph_search_settings]
  17. generation_config = { model = "azure/gpt-4o-mini" }
  18. [embedding]
  19. provider = "litellm"
  20. base_model = "openai/text-embedding-3-small" # continue with `openai` for embeddings, due to server rate limit on azure
  21. base_dimension = 512
  22. [file]
  23. provider = "postgres"
  24. [ingestion]
  25. provider = "r2r"
  26. chunking_strategy = "recursive"
  27. chunk_size = 1_024
  28. chunk_overlap = 512
  29. excluded_parsers = ["mp4"]
  30. audio_transcription_model="azure/whisper-1"
  31. document_summary_model = "azure/gpt-4o-mini"
  32. vision_img_model = "azure/gpt-4o"
  33. vision_pdf_model = "azure/gpt-4o"
  34. [ingestion.chunk_enrichment_settings]
  35. generation_config = { model = "azure/gpt-4o-mini" }