diff --git a/src/extractcode/extract.py b/src/extractcode/extract.py index 8c547f2..5dfcf6a 100644 --- a/src/extractcode/extract.py +++ b/src/extractcode/extract.py @@ -9,6 +9,7 @@ import logging import traceback +import zipfile from collections import namedtuple from functools import partial @@ -229,6 +230,15 @@ def extract_files( if TRACE: logger.debug('extract:walk:recurse:extraction event: %(xevent)r' % locals()) yield xevent + +def extract_libre_office_document(location, target): + """Extract Libre Office documents (e.g., .ods files) as ZIP archives.""" + try: + with zipfile.ZipFile(location, 'r') as zip_ref: + zip_ref.extractall(target) + logger.info(f"Extracted Libre Office document from {location} to {target}") + except zipfile.BadZipFile: + raise ValueError(f"File at {location} is not a valid ZIP archive.") def extract_file(