|
|
@@ -98,7 +98,7 @@ class UnstructuredIngestionProvider(IngestionProvider):
|
|
|
DocumentType.XLSX: [parsers.XLSXParser], # type: ignore
|
|
|
#DocumentType.DOC: [parsers.DOCParser], # type: ignore
|
|
|
DocumentType.PPT: [parsers.PPTParser], # type: ignore
|
|
|
- #DocumentType.CSV: [parsers.CSVParser], # type: ignore
|
|
|
+ DocumentType.CSV: [parsers.CSVParserAdvanced], # type: ignore
|
|
|
}
|
|
|
|
|
|
EXTRA_PARSERS = {
|
|
|
@@ -176,7 +176,7 @@ class UnstructuredIngestionProvider(IngestionProvider):
|
|
|
|
|
|
self.parsers: dict[DocumentType, AsyncParser] = {}
|
|
|
self._initialize_parsers()
|
|
|
-
|
|
|
+
|
|
|
def _initialize_parsers(self):
|
|
|
for doc_type, parsers in self.R2R_FALLBACK_PARSERS.items():
|
|
|
for parser in parsers:
|