jymchng · June 15, 2022 16:11
diff --git a/_parse_xlxs_merged_cells b/_parse_xlxs_merged_cells
 from openpyxl.workbook import Workbook
 from openpyxl import load_workbook
 from openpyxl.utils.cell import range_boundaries
 import pandas as pd
 import numpy as np

 def _parse_xlxs_merged_cells(filepath, how='top-left'):
     """
     Reads the first worksheet of an .xlsx file into a pandas DataFrame and fills every
     merged range of that worksheet with the value of the range's source cell.

     Only the first worksheet is processed, because `pd.read_excel(filepath)` called without
     `sheet_name` loads only that sheet; merged ranges of other sheets do not belong to the
     returned frame. The index arithmetic assumes the default `read_excel` layout: Excel
     row 1 is consumed as the header and Excel column A is the first DataFrame column.

     -params-
     filepath: Path-like, the .xlsx file to read
     how: a string, specifying which cell's value is copied to all cells of a merged range,
          default (and currently the only supported value) is 'top-left'

     -returns-
     pandas DataFrame with the cells of each merged range filled with the specified value

     -raises-
     KeyError if `how` is not a supported option
     """
     # Maps `how` to the positions, inside a (min_col, min_row, max_col, max_row) tuple,
     # of the row and of the column of the cell whose value is copied.
     how_mapping = {'top-left': (1, 0)}
     src_row_pos, src_col_pos = how_mapping[how]

     df = pd.read_excel(filepath)
     n_rows, n_cols = df.shape

     wb = load_workbook(filename=filepath)
     st = wb.worksheets[0]  # the sheet pd.read_excel() parsed above

     # Iterating the ranges directly (instead of building a numpy array first) also
     # handles worksheets that contain no merged cells at all.
     for mcr in st.merged_cells.ranges:
         min_col, min_row, max_col, max_row = range_boundaries(mcr.coord)
         # Excel is 1-based; rows lose one more because Excel row 1 became the header.
         pyindex = (min_col - 1, min_row - 2, max_col - 1, max_row - 2)
         src_row, src_col = pyindex[src_row_pos], pyindex[src_col_pos]

         # Skip ranges whose source cell is not a data cell of `df`: it sits in the
         # header row (negative row index) or outside the parsed area.
         if src_row < 0 or src_row >= n_rows or src_col >= n_cols:
             continue

         df.iloc[pyindex[1]:pyindex[3] + 1, pyindex[0]:pyindex[2] + 1] = df.iloc[src_row, src_col]

     return df
	from openpyxl.workbook import Workbook
	from openpyxl import load_workbook
	from openpyxl.utils.cell import range_boundaries
	import pandas as pd
	import numpy as np

	def _parse_xlxs_merged_cells(filepath, how='top-left'):
	    """
	    Reads the first worksheet of an .xlsx file into a pandas DataFrame and fills every
	    merged range of that worksheet with the value of the range's source cell.

	    Only the first worksheet is processed, because `pd.read_excel(filepath)` called without
	    `sheet_name` loads only that sheet; merged ranges of other sheets do not belong to the
	    returned frame. The index arithmetic assumes the default `read_excel` layout: Excel
	    row 1 is consumed as the header and Excel column A is the first DataFrame column.

	    -params-
	    filepath: Path-like, the .xlsx file to read
	    how: a string, specifying which cell's value is copied to all cells of a merged range,
	         default (and currently the only supported value) is 'top-left'

	    -returns-
	    pandas DataFrame with the cells of each merged range filled with the specified value

	    -raises-
	    KeyError if `how` is not a supported option
	    """
	    # Maps `how` to the positions, inside a (min_col, min_row, max_col, max_row) tuple,
	    # of the row and of the column of the cell whose value is copied.
	    how_mapping = {'top-left': (1, 0)}
	    src_row_pos, src_col_pos = how_mapping[how]

	    df = pd.read_excel(filepath)
	    n_rows, n_cols = df.shape

	    wb = load_workbook(filename=filepath)
	    st = wb.worksheets[0]  # the sheet pd.read_excel() parsed above

	    # Iterating the ranges directly (instead of building a numpy array first) also
	    # handles worksheets that contain no merged cells at all.
	    for mcr in st.merged_cells.ranges:
	        min_col, min_row, max_col, max_row = range_boundaries(mcr.coord)
	        # Excel is 1-based; rows lose one more because Excel row 1 became the header.
	        pyindex = (min_col - 1, min_row - 2, max_col - 1, max_row - 2)
	        src_row, src_col = pyindex[src_row_pos], pyindex[src_col_pos]

	        # Skip ranges whose source cell is not a data cell of `df`: it sits in the
	        # header row (negative row index) or outside the parsed area.
	        if src_row < 0 or src_row >= n_rows or src_col >= n_cols:
	            continue

	        df.iloc[pyindex[1]:pyindex[3] + 1, pyindex[0]:pyindex[2] + 1] = df.iloc[src_row, src_col]

	    return df