fix: Fix issue with detecting docx files, and files with upper case extensions (#1609)
Fix detecting files with uppercase extensions.

Signed-off-by: MoheyElDin Badr <moheyeldin.badr@gmail.com>
This commit is contained in:
parent
0e00a263fa
commit
f4d9d4111b
@ -302,7 +302,7 @@ class _DocumentConversionInput(BaseModel):
|
|||||||
if ("." in obj.name and not obj.name.startswith("."))
|
if ("." in obj.name and not obj.name.startswith("."))
|
||||||
else ""
|
else ""
|
||||||
)
|
)
|
||||||
mime = _DocumentConversionInput._mime_from_extension(ext)
|
mime = _DocumentConversionInput._mime_from_extension(ext.lower())
|
||||||
if mime is not None and mime.lower() == "application/zip":
|
if mime is not None and mime.lower() == "application/zip":
|
||||||
objname = obj.name.lower()
|
objname = obj.name.lower()
|
||||||
if objname.endswith(".xlsx"):
|
if objname.endswith(".xlsx"):
|
||||||
@ -376,6 +376,13 @@ class _DocumentConversionInput(BaseModel):
|
|||||||
mime = FormatToMimeType[InputFormat.JSON_DOCLING][0]
|
mime = FormatToMimeType[InputFormat.JSON_DOCLING][0]
|
||||||
elif ext in FormatToExtensions[InputFormat.PDF]:
|
elif ext in FormatToExtensions[InputFormat.PDF]:
|
||||||
mime = FormatToMimeType[InputFormat.PDF][0]
|
mime = FormatToMimeType[InputFormat.PDF][0]
|
||||||
|
elif ext in FormatToExtensions[InputFormat.DOCX]:
|
||||||
|
mime = FormatToMimeType[InputFormat.DOCX][0]
|
||||||
|
elif ext in FormatToExtensions[InputFormat.PPTX]:
|
||||||
|
mime = FormatToMimeType[InputFormat.PPTX][0]
|
||||||
|
elif ext in FormatToExtensions[InputFormat.XLSX]:
|
||||||
|
mime = FormatToMimeType[InputFormat.XLSX][0]
|
||||||
|
|
||||||
return mime
|
return mime
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
|
Loading…
Reference in New Issue
Block a user