in chunking/chunkers/spreadsheet_chunker.py [0:0]
def _get_sheet_data(self, sheet):
"""
Retrieves data and headers from the given sheet. Each row's data is processed into a list format, ensuring that empty rows are excluded.
Args:
sheet (Worksheet): The worksheet object to extract data from.
Returns:
Tuple[List[List[str]], List[str]]: A tuple containing a list of row data and a list of headers.
"""
data = []
for row in sheet.iter_rows(min_row=2): # Start from the second row to skip headers
row_data = []
for cell in row:
cell_value = cell.value
if cell_value is None:
cell_value = ""
cell_text = str(cell_value)
row_data.append(cell_text)
if "".join(row_data).strip() != "":
data.append(row_data)
headers = [cell.value if cell.value is not None else "" for cell in sheet[1]]
return data, headers