Add options for dry run and grouping

This commit is contained in:
Felix Blanke 2023-08-17 22:21:31 +02:00
parent f34e5faecc
commit 0d9774ac00

View File

@@ -74,7 +74,10 @@ bundesland_dict = {
def main( def main(
url: str = "https://beschaeftigtenbefragung.verdi.de/", tag: str = "bez_data_2" url: str = "https://beschaeftigtenbefragung.verdi.de/",
tag: str = "bez_data_2",
dry_run: bool = False,
grouped: bool = False,
) -> pd.DataFrame: ) -> pd.DataFrame:
options = Options() options = Options()
options.add_argument("--headless") options.add_argument("--headless")
@@ -107,6 +110,12 @@ def main(
data["Digitale Befragung"] = pd.Series(tot_col_data, index=tot_col_index) data["Digitale Befragung"] = pd.Series(tot_col_data, index=tot_col_index)
df = pd.DataFrame(data=data) df = pd.DataFrame(data=data)
filename = f"data/{datetime.today().strftime('%Y-%m-%d')}_data.ods" filename = f"data/{datetime.today().strftime('%Y-%m-%d')}_data.ods"
if grouped:
df = df.groupby("Bundesland")[["Digitale Befragung"]].sum()
if dry_run:
df.loc["Total"] = df.sum(numeric_only=True)
print(df)
else:
if Path(filename).exists(): if Path(filename).exists():
print("File already exists!") print("File already exists!")
else: else: