renamed: exel_datein/2024/06/Tagesbericht Beispiel.xlsx -> exel_datein/2024/06/13.xlsx new file: exel_datein/2024/09/4.xlsx
37 lines
1.4 KiB
Python
37 lines
1.4 KiB
Python
import pandas as pd
|
|
import json
|
|
import os
|
|
import re
|
|
|
|
root_dir = "exel_datein"
|
|
# Passe das Pattern an: Jahr/Monat/Tag
|
|
date_pattern = re.compile(r'(\d{4})[\\/](\d{2})[\\/](\d{1,2})')
|
|
|
|
all_notes = []
|
|
|
|
for dirpath, _, filenames in os.walk(root_dir):
|
|
for filename in filenames:
|
|
if filename.lower().endswith(('.xlsx', '.xls')):
|
|
excel_path = os.path.join(dirpath, filename)
|
|
# Versuche, Jahr, Monat und Tag aus dem Pfad zu extrahieren
|
|
match = date_pattern.search(excel_path)
|
|
if match:
|
|
jahr, monat, tag = match.groups()
|
|
else:
|
|
jahr = monat = tag = "unbekannt"
|
|
try:
|
|
df = pd.read_excel(excel_path, sheet_name=0, usecols=[0, 1], names=["Kunde", "Info"])
|
|
df = df.dropna(subset=["Kunde", "Info"])
|
|
for _, row in df.iterrows():
|
|
# Format: Kunde: Info (Jahr: xxxx, Monat: xx, Tag: xx)
|
|
note = f"{row['Kunde']}: {row['Info']} (Jahr: {jahr}, Monat: {monat}, Tag: {tag})"
|
|
all_notes.append(note)
|
|
print(f"Verarbeitet: {excel_path}")
|
|
except Exception as e:
|
|
print(f"Fehler bei {excel_path}: {e}")
|
|
|
|
# Alles als JSON speichern
|
|
with open("background_data.json", "w", encoding="utf-8") as f:
|
|
json.dump(all_notes, f, ensure_ascii=False, indent=2)
|
|
|
|
print("Alle Daten erfolgreich als background_data.json gespeichert.") |