new: added ExcelParser (tested) to read .xlsx files

This commit is contained in:
devendra.parihar
2024-10-01 22:03:10 +05:30
parent af1b81097f
commit 7794129929
8 changed files with 116 additions and 27 deletions

25
test.py Normal file
View File

@@ -0,0 +1,25 @@
from pathlib import Path
from application.parser.file.tabular_parser import ExcelParser,PandasCSVParser
# Manual smoke test: run ExcelParser over a local .xlsx workbook and print
# whatever parse_file() returns.
#
# NOTE: the path below is specific to the original author's machine; point
# it at a workbook that exists locally before running this script.
file_path = Path("/home/dev523/DocsGPT/Ledgers in Default Template.xlsx")

# Build the Excel parser with row concatenation enabled and no extra pandas
# options.
parser = ExcelParser(concat_rows=True, pandas_config={})

# To exercise the CSV parser instead, replace the two assignments above with:
#   file_path = Path("/home/dev523/DocsGPT/mlb_teams_2012.csv")
#   parser = PandasCSVParser(concat_rows=True, pandas_config={})

# Initialize the parser configuration before parsing.
parser.init_parser()

# Optional sanity check: report whether the parser config has been set.
if parser.parser_config_set:
    print("Parser config has been set.")

# Parse the file and dump the result for visual inspection.
parsed_data = parser.parse_file(file_path)
print(parsed_data)