Get supported file formats Leave feedback

Get all supported file formats

Python

from groupdocs.parser.options import FileType

# Get all supported file types. The result is materialized into a list once so
# it can be both sorted and counted below (safe even if the API were to return
# a one-shot iterable).
supported_file_types = list(FileType.get_supported_file_types())

# Iterate through the collection, ordered by extension
for file_type in sorted(supported_file_types, key=lambda x: x.extension):
    print(f"{file_type.extension} - {file_type.file_format}")

# The leading "\n" prints a blank line before the summary; it must be written
# as an escape because a single-quoted f-string cannot span source lines.
print(f"\nTotal supported formats: {len(supported_file_types)}")

Filter supported formats by category

You can filter supported formats based on your needs:

Python

from groupdocs.parser.options import FileType

# Fetch everything the parser reports as supported
supported_file_types = FileType.get_supported_file_types()

# Extension groups used to bucket the formats
word_formats = [".doc", ".docx", ".docm", ".dot", ".dotx", ".dotm", ".odt", ".ott", ".rtf"]
excel_formats = [".xls", ".xlsx", ".xlsm", ".xlsb", ".xlt", ".xltx", ".xltm", ".ods"]
pdf_formats = [".pdf"]

# Print one titled section per category, in a fixed order
for heading, extensions in (
    ("Word Processing Formats:", word_formats),
    ("Spreadsheet Formats:", excel_formats),
    ("PDF Formats:", pdf_formats),
):
    print(heading)
    for file_type in supported_file_types:
        # Extensions are compared case-insensitively against the group
        if file_type.extension.lower() not in extensions:
            continue
        print(f"  {file_type.extension} - {file_type.file_format}")

Check if a specific format is supported

You can check if a particular file format is supported:

Python

from groupdocs.parser.options import FileType

def is_format_supported(extension):
    """Return True when GroupDocs.Parser lists *extension* as supported.

    The given extension is compared, ignoring letter case, with the
    ``extension`` of every entry from ``FileType.get_supported_file_types()``.
    """
    return any(
        candidate.extension.lower() == extension.lower()
        for candidate in FileType.get_supported_file_types()
    )

# Extensions to probe, including one that is deliberately bogus
formats_to_check = [".pdf", ".docx", ".xlsx", ".txt", ".unknown"]

# Report one line per extension
for ext in formats_to_check:
    print(
        f"{ext} - Supported"
        if is_format_supported(ext)
        else f"{ext} - Not Supported"
    )

Get format details

You can retrieve detailed information about each supported format:

Python

from groupdocs.parser.options import FileType

# Fetch everything the parser reports as supported
supported_file_types = FileType.get_supported_file_types()

# Table header: title, column names, then a horizontal rule
print("Supported Document Formats:\n")
print(f"{'Extension':<12} {'Format Name':<50}")
print("-" * 62)

# One left-aligned row per format, ordered by extension
rows = list(supported_file_types)
rows.sort(key=lambda entry: entry.extension)
for file_type in rows:
    print(f"{file_type.extension:<12} {file_type.file_format:<50}")

Practical usage example

Here’s a practical example that checks whether a file’s format is supported before parsing it:

Python

from groupdocs.parser import Parser
from groupdocs.parser.options import FileType
import os

def process_file(file_path):
    """Process a file if its format is supported.

    The file's extension is checked (ignoring case) against the formats
    reported by ``FileType.get_supported_file_types()``. If it matches, the
    file is opened with ``Parser``, basic document info is printed, and a
    text reader is requested.

    Args:
        file_path: Path to the document to process.

    Returns:
        True if the document was opened and a text reader was obtained.
        False if the extension is not supported, no text reader was
        returned, or an exception was raised while processing.
    """
    # Get file extension (os.path.splitext keeps the leading dot and yields
    # an empty string when the path has no extension)
    _, ext = os.path.splitext(file_path)

    # Check if format is supported; lower-case the extension once, not per item
    ext_lower = ext.lower()
    supported_file_types = FileType.get_supported_file_types()
    is_supported = any(ft.extension.lower() == ext_lower for ft in supported_file_types)

    if not is_supported:
        print(f"Error: File format '{ext}' is not supported")
        return False

    try:
        # Process the file
        with Parser(file_path) as parser:
            doc_info = parser.get_document_info()
            print(f"Processing: {file_path}")
            print(f"Format: {doc_info.file_type.file_format}")
            print(f"Pages: {doc_info.page_count}")

            # Extract text
            text_reader = parser.get_text()
            if not text_reader:
                # Report failure explicitly instead of falling off the end of
                # the function and returning None
                print("Text extraction is not available for this file")
                return False

            print("Text extraction successful")
            return True
    except Exception as e:
        # Example-level boundary: report the problem and signal failure
        print(f"Error processing file: {e}")
        return False

# Example usage: run the check-and-parse routine on each sample document
for sample_path in ("sample.pdf", "sample.docx"):
    process_file(sample_path)

sample.pdf

The following sample file is used in this example: sample.pdf

sample.docx

The following sample file is used in this example: sample.docx

More resources

Advanced usage topics

To learn more about document data extraction features, please refer to the advanced usage section.

GitHub examples

You may find more code examples in our GitHub repository:

GroupDocs.Parser for Python via .NET examples

Free online document parser

Along with the full-featured library, we provide a free online document parser app. You are welcome to extract data from PDF, DOCX, XLSX, and more with our Free Online Document Parser App.

We value your opinion. Your feedback will help us improve our documentation.

Get supported file formats Leave feedback

On this page

Get all supported file formats

Filter supported formats by category

Check if a specific format is supported

Get format details

Practical usage example

More resources

Advanced usage topics

GitHub examples

Free online document parser

Was this page helpful?

Any additional feedback you'd like to share with us?

Please tell us how we can improve this page.

Thank you for your feedback!

On this page