r2r.py 1.7 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162
  1. from typing import Optional, Any
  2. from r2r import R2RClient
  3. from app.libs.util import verify_jwt_expiration
  4. from config.llm import tool_settings
  5. import nest_asyncio
  6. import asyncio
  7. # Apply nest_asyncio to allow nested event loops
  8. nest_asyncio.apply()
  9. class R2R:
  10. client: R2RClient
  11. def __init__(self):
  12. self.auth_enabled = tool_settings.R2R_USERNAME and tool_settings.R2R_PASSWORD
  13. self.client = None
  14. async def init(self):
  15. if not self.auth_enabled:
  16. return
  17. if not self.client:
  18. self.client = R2RClient(tool_settings.R2R_BASE_URL)
  19. await self.client.users.login(
  20. tool_settings.R2R_USERNAME, tool_settings.R2R_PASSWORD
  21. )
  22. def ingest_file(self, file_path: str, metadata: Optional[dict]):
  23. self._check_login()
  24. ingest_response = self.client.documents.create(
  25. file_path=file_path, metadata=metadata if metadata else None, id=None
  26. )
  27. return ingest_response.get("results")
  28. def search(self, query: str, filters: dict[str, Any]):
  29. self._check_login()
  30. search_response = self.client.retrieval.search(
  31. query=query,
  32. search_settings={
  33. "filters": filters,
  34. "limit": tool_settings.R2R_SEARCH_LIMIT,
  35. },
  36. )
  37. return search_response.get("results").get("chunk_search_results")
  38. def _check_login(self):
  39. if not self.auth_enabled:
  40. return
  41. if verify_jwt_expiration(self.client.access_token):
  42. return
  43. else:
  44. asyncio.create_task(self.init())
  45. # 创建 R2R 实例
  46. r2r = R2R()
  47. # 在您的应用程序启动时调用 initialize_r2r()
  48. async def initialize_r2r():
  49. await r2r.init()