Fix: rebuild join_excel

This commit is contained in:
Bertrand Benjamin 2023-10-05 15:10:39 +02:00
parent ec9cc19be5
commit f2bcf6241a
2 changed files with 27 additions and 1 deletions

22
pdf_oralia/join.py Normal file
View File

@ -0,0 +1,22 @@
import glob
import pandas as pd
def join_excel(src, dest, file_pattern):
    """Join every Excel file in ``src`` matching ``file_pattern`` into one file.

    Args:
        src: Path prefix (directory) in which the input workbooks are looked up.
        dest: Path the combined workbook is written to.
        file_pattern: Glob pattern, relative to ``src``, selecting the inputs.

    Raises:
        ValueError: If nothing in ``src`` matches ``file_pattern``.
    """
    filenames = list_files(src, file_pattern)
    if not filenames:
        # pd.concat([]) would fail with a bare "No objects to concatenate";
        # keep the exception type but say which directory/pattern was empty.
        raise ValueError(
            f"No file matching {file_pattern!r} found in {src!r}"
        )
    dfs = extract_dfs(filenames)
    # NOTE(review): each frame keeps its own row index and to_excel writes the
    # index by default -- confirm that this column is wanted in the output.
    joined_df = pd.concat(dfs)
    joined_df.to_excel(dest)
def list_files(src, file_glob):
    """Return the paths matching ``file_glob`` inside ``src``, sorted by name.

    Args:
        src: Path prefix (directory) to search.
        file_glob: Glob pattern appended to ``src``.

    Returns:
        A list of matching paths as strings; empty when nothing matches.
    """
    # glob yields entries in arbitrary, filesystem-dependent order; sorting
    # makes the result (and anything built from it) reproducible.
    return sorted(glob.iglob(f"{src}/{file_glob}"))
def extract_dfs(filenames):
    """Load each path in ``filenames`` with ``pd.read_excel``.

    Returns a list holding one loaded object per input path, in the same
    order as ``filenames``.
    """
    return [pd.read_excel(path) for path in filenames]

View File

@ -5,6 +5,7 @@ from pathlib import Path
import click
from .extract import extract_save
from .join import join_excel
logging_config = dict(
version=1,
@ -65,4 +66,7 @@ def all(src, dest):
@click.option("--src", help="Tous les fichiers dans src", default="./")
@click.option("--dest", help="Où mettre les fichiers produits", default="")
def join(src, dest):
    # Merge the "*_charge.xlsx" and "*_locataire.xlsx" workbooks found in src
    # into dest/charge.xlsx and dest/locataire.xlsx respectively.
    # (Plain comments rather than a docstring: click would surface a docstring
    # as the command's help text.)
    from pathlib import Path

    # Join with pathlib instead of f"{dest}/...": with the default dest ("")
    # the f-string form resolves to "/charge.xlsx", i.e. the filesystem root.
    dest_dir = Path(dest)
    for kind in ("charge", "locataire"):
        join_excel(src, str(dest_dir / f"{kind}.xlsx"), f"*_{kind}.xlsx")