Update project structure and move to beancount

2025-03-02 11:08:33 -05:00
parent 886bcdbdd1
commit 08c50e776e
17 changed files with 1844 additions and 296 deletions
--- a/src/toldg/process.py
+++ b/src/toldg/process.py
@@ -0,0 +1,121 @@
+import csv
+import datetime
+import logging
+import re
+import sys
+from typing import Dict, List
+
+import toldg.models
+import toldg.predict
+import toldg.utils
+import toldg.write
+from toldg.models import Config, CsvConfig, Transaction
+
+
+def process_ldg_files(config: Config):
+    """Append every ledger file of the input directory to the output file.
+
+    The files are the ones returned by ``toldg.utils.get_ldg_files`` for
+    ``config.input_directory``; each is read completely and appended to
+    ``config.output_file``.
+    """
+    for ledger_path in toldg.utils.get_ldg_files(config.input_directory):
+        with open(ledger_path, "r") as source, open(config.output_file, "a") as sink:
+            sink.write(source.read())
+
+
+def get_csv_config(csv_file: str, csv_configs: List[CsvConfig]) -> CsvConfig:
+    """Return the one CSV config whose ``file_match_regex`` matches the file.
+
+    Args:
+        csv_file: Name of the CSV file, matched from its start via ``re.match``.
+        csv_configs: Candidate configurations.
+
+    Returns:
+        The single matching configuration.
+
+    Raises:
+        SystemExit: With exit code 1 when no config or more than one config
+            matches; a critical message is logged first.
+    """
+    matching = []
+    for candidate in csv_configs:
+        if re.match(candidate.file_match_regex, csv_file):
+            matching.append(candidate)
+
+    if len(matching) == 1:
+        return matching[0]
+
+    if matching:
+        logging.critical(f"Multiple CSV configs for {csv_file}.")
+    else:
+        logging.critical(f"No CSV config for {csv_file}.")
+    sys.exit(1)
+
+
+def get_transactions(csv_file: str, config: CsvConfig) -> List[Transaction]:
+    """Parse one CSV file into a list of transactions.
+
+    Args:
+        csv_file: Path of the CSV file to read.
+        config: CSV settings used here: input/output date formats, delimiter,
+            quote character, number of leading rows to skip, the field
+            mapping, the currency and the first account.
+
+    Returns:
+        One Transaction per non-empty row that follows the skipped rows. The
+        second account is always ``toldg.models.UNKNOWN_CATEGORY`` here.
+    """
+
+    def date_to_date(date: str) -> str:
+        """Convert a date string from the input format to the output format."""
+        d = datetime.datetime.strptime(date, config.input_date_format)
+        return d.strftime(config.output_date_format)
+
+    def flip_sign(amount: str) -> str:
+        """Negate an amount string by toggling its leading minus sign."""
+        return amount[1:] if amount.startswith("-") else "-" + amount
+
+    def row_to_transaction(row, fields):
+        """The user can configure the mapping of CSV fields to the three
+        required fields date, amount and description via the CsvConfig."""
+        t = {field: row[index] for index, field in fields}
+        amount = t["amount"]
+        return Transaction(
+            currency=config.currency,
+            debit=flip_sign(amount),
+            credit=amount,
+            date=date_to_date(t["date"]),
+            account1=config.account1,
+            account2=toldg.models.UNKNOWN_CATEGORY,
+            description=t["description"],
+            csv_file=csv_file,
+            # The raw row doubles as the transaction's identity string.
+            row=csv_file + ", " + ", ".join(row),
+        )
+
+    # Keep only the columns that the config names; falsy entries are ignored.
+    fields = [(i, f) for i, f in enumerate(config.fields) if f]
+    # newline="" lets the csv module do its own newline handling, which is
+    # required for quoted fields that contain line breaks.
+    with open(csv_file, "r", newline="") as f:
+        reader = csv.reader(f, delimiter=config.delimiter, quotechar=config.quotechar)
+        for _ in range(config.skip):
+            # A file with fewer rows than config.skip must not raise
+            # StopIteration; it simply yields no transactions.
+            next(reader, None)
+        transactions = [row_to_transaction(row, fields) for row in reader if row]
+    return transactions
+
+
+def find_duplicates(transactions: List[Transaction]):
+    """Abort the program when two transactions share the same ``row`` value.
+
+    Args:
+        transactions: Transactions to check, in order.
+
+    Raises:
+        SystemExit: With exit code 1 at the first repeated ``row``; the
+            offending row is logged at critical level first.
+    """
+    seen = set()
+    for transaction in transactions:
+        key = transaction.row
+        if key not in seen:
+            seen.add(key)
+            continue
+        logging.critical(f"'{key}' is duplicated.")
+        logging.critical("Exit because of duplicated transactions.")
+        sys.exit(1)
+
+
+def apply_mappings(transactions: List[Transaction], mappings: Dict[str, str]):
+    """Set ``account2`` on each transaction from the row-to-account mappings.
+
+    Transactions are modified in place. A warning is logged for every
+    transaction whose ``row`` has no mapping and for every mapping that no
+    transaction used.
+
+    Args:
+        transactions: Transactions to update.
+        mappings: Maps a transaction's ``row`` string to its second account.
+    """
+    remaining = set(mappings.keys())
+    for transaction in transactions:
+        if transaction.row not in mappings:
+            logging.warning(f"No mapping for '{transaction}'.")
+            continue
+        transaction.account2 = mappings[transaction.row]
+        remaining.discard(transaction.row)
+
+    for key in remaining:
+        logging.warning(f"Unused mapping '{key}' -> {mappings[key]}.")
+
+
+def apply_descriptions(transactions: List[Transaction], descriptions: Dict[str, str]):
+    """Override transaction descriptions from the row-to-description table.
+
+    Transactions are modified in place. Transactions whose ``row`` is not in
+    ``descriptions`` keep their description, without any warning. A warning
+    is logged for every entry that no transaction used.
+
+    Args:
+        transactions: Transactions to update.
+        descriptions: Maps a transaction's ``row`` string to the description
+            that should replace the one read from the CSV file.
+    """
+    unused_descriptions = set(descriptions.keys())
+    for t in transactions:
+        if t.row in descriptions:
+            t.description = descriptions[t.row]
+            unused_descriptions.discard(t.row)
+    for row in unused_descriptions:
+        # Say "description", not "mapping", so the warning points at the
+        # descriptions table rather than the account mappings.
+        logging.warning(f"Unused description '{row}' -> {descriptions[row]}.")
+
+
+def process_csv_files(config: Config):
+    """Turn all CSV files of the input directory into rendered output.
+
+    Steps, in order: read the transactions of every CSV file using its
+    matching CSV config, optionally check for duplicated rows, optionally
+    apply description overrides, apply the account mappings, let
+    ``toldg.predict.add_account2`` process the transactions, write the
+    mappings back to ``config.mappings_file`` and render the transactions.
+    """
+    transactions = []
+    for path in toldg.utils.get_csv_files(config.input_directory):
+        file_name = str(path)
+        matching_config = get_csv_config(file_name, config.csv_configs)
+        transactions.extend(get_transactions(file_name, matching_config))
+
+    if config.find_duplicates:
+        find_duplicates(transactions)
+
+    descriptions_file = config.descriptions_file
+    if descriptions_file is not None:
+        apply_descriptions(
+            transactions, toldg.utils.read_descriptions(descriptions_file)
+        )
+
+    apply_mappings(transactions, toldg.utils.read_mappings(config.mappings_file))
+
+    toldg.predict.add_account2(transactions, config.categories)
+    toldg.utils.write_mappings(transactions, config.mappings_file)
+    toldg.write.render_to_file(transactions, config)