- Extract the content of all Office files.
$ extract_office_content -h
usage: extract_office_content [-h] [-img_dir SAVE_IMG_DIR] file_path
positional arguments:
file_path
optional arguments:
-h, --help show this help message and exit
-img_dir SAVE_IMG_DIR, --save_img_dir SAVE_IMG_DIR
$ extract_office_content tests/test_files
- Extract the content of a Word file.
$ extract_word -h
usage: extract_word [-h] [-img_dir SAVE_IMG_DIR] word_path
positional arguments:
word_path
optional arguments:
-h, --help show this help message and exit
-img_dir SAVE_IMG_DIR, --save_img_dir SAVE_IMG_DIR
$ extract_word tests/test_files/word_example.docx
- Extract the content of a PowerPoint (PPT) file.
$ extract_ppt -h
usage: extract_ppt [-h] [-img_dir SAVE_IMG_DIR] ppt_path
positional arguments:
ppt_path
optional arguments:
-h, --help show this help message and exit
-img_dir SAVE_IMG_DIR, --save_img_dir SAVE_IMG_DIR
$ extract_ppt tests/test_files/ppt_example.pptx
- Extract the content of an Excel file.
$ extract_excel -h
usage: extract_excel [-h] [-f {markdown,html,latex,string}] [-o SAVE_IMG_DIR]
excel_path
positional arguments:
excel_path
optional arguments:
-h, --help show this help message and exit
-f {markdown,html,latex,string}, --output_format {markdown,html,latex,string}
-o SAVE_IMG_DIR, --save_img_dir SAVE_IMG_DIR
$ extract_excel tests/test_files/excel_example.xlsx