dnk8n · January 2, 2025 19:44 · dnk8n · Sep 28, 2021 · splosarek · Feb 2, 2022
diff --git a/dictreader.py b/dictreader.py
 from pathlib import Path
 from typing import Any, Callable, Dict, Iterator, List, Optional, Union

 from openpyxl import load_workbook


 def xlsx_dictreader(
    filename: Union[str, Path],
    sheet_index: int = 0,
    header_row_index: int = 1,
    data_start_row_index: int = 2,
    data_only: bool = True,
    post_process_funcs: Optional[List[Callable[[Any], Any]]] = None,
    null_vals: Optional[List[Union[None, str]]] = None,
 ) -> Iterator[Dict[str, Any]]:
    """Yield the non-empty data rows of an .xlsx worksheet as dicts.

    Each yielded dict maps a header cell value to the (post-processed)
    value found in that header's column for the current row.

    Args:
        filename: Workbook path, passed to ``openpyxl.load_workbook``.
        sheet_index: Zero-based index into ``book.worksheets``.
        header_row_index: One-based row number holding the headers.
        data_start_row_index: One-based row number of the first data row;
            rows are read from here through ``sheet.max_row``.
        data_only: Forwarded unchanged to ``load_workbook``.
        post_process_funcs: One callable per retained header, in header
            order; each is applied to every value of its column. When
            omitted or empty, values are passed through unchanged.
        null_vals: Values treated as "empty". Header cells whose value is
            in this list are skipped, and a row is not yielded when all
            of its processed values are in this list. Defaults to
            ``[None, "None"]``.

    Yields:
        One dict per data row that has at least one non-null value.

    Raises:
        ValueError: If ``post_process_funcs`` is given and its length
            differs from the number of retained headers.
    """
    # Resolve the default here rather than in the signature so that no
    # mutable list object is shared between calls.
    if null_vals is None:
        null_vals = [None, "None"]

    book = load_workbook(filename, data_only=data_only)
    sheet = book.worksheets[sheet_index]

    # Keep each retained header together with its real column number.
    # Filtering the null headers out and then indexing data by position
    # would shift every value that follows a blank header cell under the
    # wrong key. Enumeration starts at 1 to match the one-based column
    # numbers that ``sheet.cell`` expects (the header row is assumed to
    # start at the first column, as the positional indexing always did).
    columns = [
        (col_idx, cell.value)
        for col_idx, cell in enumerate(sheet[header_row_index], start=1)
        if cell.value not in null_vals
    ]

    if not post_process_funcs:
        post_process_funcs = [lambda x: x] * len(columns)
    elif len(post_process_funcs) != len(columns):
        raise ValueError(
            "post-processing functions do not line up with headers"
        )

    for row_idx in range(data_start_row_index, sheet.max_row + 1):
        candidate = {
            name: func(sheet.cell(row=row_idx, column=col_idx).value)
            for (col_idx, name), func in zip(columns, post_process_funcs)
        }
        # Skip rows that are entirely empty after post-processing.
        if not all(value in null_vals for value in candidate.values()):
            yield candidate
	from pathlib import Path
	from typing import Any, Callable, Dict, Iterator, List, Optional, Union

	from openpyxl import load_workbook


	def xlsx_dictreader(
	    filename: Union[str, Path],
	    sheet_index: int = 0,
	    header_row_index: int = 1,
	    data_start_row_index: int = 2,
	    data_only: bool = True,
	    post_process_funcs: Optional[List[Callable[[Any], Any]]] = None,
	    null_vals: Optional[List[Union[None, str]]] = None,
	) -> Iterator[Dict[str, Any]]:
	    """Yield the non-empty data rows of an .xlsx worksheet as dicts.

	    Each yielded dict maps a header cell value to the (post-processed)
	    value found in that header's column for the current row.

	    Args:
	        filename: Workbook path, passed to ``openpyxl.load_workbook``.
	        sheet_index: Zero-based index into ``book.worksheets``.
	        header_row_index: One-based row number holding the headers.
	        data_start_row_index: One-based row number of the first data
	            row; rows are read from here through ``sheet.max_row``.
	        data_only: Forwarded unchanged to ``load_workbook``.
	        post_process_funcs: One callable per retained header, in header
	            order; each is applied to every value of its column. When
	            omitted or empty, values are passed through unchanged.
	        null_vals: Values treated as "empty". Header cells whose value
	            is in this list are skipped, and a row is not yielded when
	            all of its processed values are in this list. Defaults to
	            ``[None, "None"]``.

	    Yields:
	        One dict per data row that has at least one non-null value.

	    Raises:
	        ValueError: If ``post_process_funcs`` is given and its length
	            differs from the number of retained headers.
	    """
	    # Resolve the default here rather than in the signature so that no
	    # mutable list object is shared between calls.
	    if null_vals is None:
	        null_vals = [None, "None"]

	    book = load_workbook(filename, data_only=data_only)
	    sheet = book.worksheets[sheet_index]

	    # Pair every retained header with its real one-based column number
	    # so a blank header cell in the middle of the row cannot shift the
	    # following values under the wrong key (the header row is assumed
	    # to start at the first column).
	    columns = [
	        (col_idx, cell.value)
	        for col_idx, cell in enumerate(sheet[header_row_index], start=1)
	        if cell.value not in null_vals
	    ]

	    if not post_process_funcs:
	        post_process_funcs = [lambda x: x] * len(columns)
	    elif len(post_process_funcs) != len(columns):
	        raise ValueError(
	            "post-processing functions do not line up with headers"
	        )

	    for row_idx in range(data_start_row_index, sheet.max_row + 1):
	        candidate = {
	            name: func(sheet.cell(row=row_idx, column=col_idx).value)
	            for (col_idx, name), func in zip(columns, post_process_funcs)
	        }
	        # Skip rows that are entirely empty after post-processing.
	        if not all(value in null_vals for value in candidate.values()):
	            yield candidate