Skip to content

Commit

Permalink
synced base.py updates
Browse files Browse the repository at this point in the history
  • Loading branch information
anoopshrma authored Mar 27, 2024
1 parent c845de7 commit 92c54fb
Showing 1 changed file with 50 additions and 3 deletions.
53 changes: 50 additions & 3 deletions llama_parse/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,9 @@ class ResultType(str, Enum):
"""The result type for the parser."""
TXT = "text"
MD = "markdown"
JSON = "json"

class Language(str, Enum):
"""Language of the document to be parsed"""
BAZA = "abq"
ADYGHE = "ady"
AFRIKAANS = "af"
Expand Down Expand Up @@ -98,12 +98,59 @@ class Language(str, Enum):

# File extensions (lower-case, including the leading dot) listed as supported.
# NOTE: every entry must end with a comma. Python silently concatenates
# adjacent string literals, so a missing comma merges two extensions into one
# bogus entry (e.g. ".xml" ".doc" -> ".xml.doc") and drops both real ones.
SUPPORTED_FILE_TYPES = [
    ".pdf",
    ".xml",
    # Microsoft Word - all versions
    ".doc",
    ".docx",
    ".docm",
    ".dot",
    ".dotx",
    ".dotm",
    # Rich text format
    ".rtf",
    # Microsoft Works
    ".wps",
    # Word Perfect
    ".wpd",
    # Open Office
    ".sxw",
    ".stw",
    ".sxg",
    # Apple
    ".pages",
    # Mac Write
    ".mw",
    ".mcw",
    # Unified Office Format text
    ".uot",
    ".uof",
    ".uos",
    ".uop",
    # Microsoft PowerPoint
    ".ppt",
    ".pptx",
    ".pot",
    ".pptm",
    ".potx",
    ".potm",
    # Apple Keynote
    ".key",
    # Open Office presentations
    ".odp",
    ".odg",
    ".otp",
    ".fopd",
    ".sxi",
    ".sti",
    # ebook
    ".epub",
]

0 comments on commit 92c54fb

Please sign in to comment.