diff --git a/src/processor/ledger/beancount_to_jsonl.py b/src/processor/ledger/beancount_to_jsonl.py index 3baa2d54..b2f26b7b 100644 --- a/src/processor/ledger/beancount_to_jsonl.py +++ b/src/processor/ledger/beancount_to_jsonl.py @@ -99,16 +99,16 @@ def extract_beancount_transactions(beancount_files): for entry in re.split(empty_newline, ledger_content, flags=re.MULTILINE) if re.match(transaction_regex, entry)] - transaction_to_file_map += [beancount_file]*len(transactions_per_file) + transaction_to_file_map += zip(transactions_per_file, [beancount_file]*len(transactions_per_file)) entries.extend(transactions_per_file) - return entries, transaction_to_file_map + return entries, dict(transaction_to_file_map) def convert_transactions_to_maps(entries: list[str], transaction_to_file_map) -> list[dict]: "Convert each Beancount transaction into a dictionary" entry_maps = [] - for entry_id, entry in enumerate(entries): - entry_maps.append({'compiled': entry, 'raw': entry, 'file': f'{transaction_to_file_map[entry_id]}'}) + for entry in entries: + entry_maps.append({'compiled': entry, 'raw': entry, 'file': f'{transaction_to_file_map[entry]}'}) logger.info(f"Converted {len(entries)} transactions to dictionaries") diff --git a/src/processor/markdown/markdown_to_jsonl.py b/src/processor/markdown/markdown_to_jsonl.py index 118e66dd..7a91533b 100644 --- a/src/processor/markdown/markdown_to_jsonl.py +++ b/src/processor/markdown/markdown_to_jsonl.py @@ -98,17 +98,17 @@ def extract_markdown_entries(markdown_files): markdown_entries_per_file = [f'#{entry.strip(empty_escape_sequences)}' for entry in re.split(markdown_heading_regex, markdown_content, flags=re.MULTILINE)] - entry_to_file_map += [markdown_file]*len(markdown_entries_per_file) + entry_to_file_map += zip(markdown_entries_per_file, [markdown_file]*len(markdown_entries_per_file)) entries.extend(markdown_entries_per_file) - return entries, entry_to_file_map + return entries, dict(entry_to_file_map) def convert_markdown_entries_to_maps(entries: list[str], entry_to_file_map) -> list[dict]: "Convert each Markdown entries into a dictionary" entry_maps = [] - for entry_id, entry in enumerate(entries): - entry_maps.append({'compiled': entry, 'raw': entry, 'file': f'{entry_to_file_map[entry_id]}'}) + for entry in entries: + entry_maps.append({'compiled': entry, 'raw': entry, 'file': f'{entry_to_file_map[entry]}'}) logger.info(f"Converted {len(entries)} markdown entries to dictionaries") diff --git a/src/processor/org_mode/org_to_jsonl.py b/src/processor/org_mode/org_to_jsonl.py index 47dc54fa..f166810f 100644 --- a/src/processor/org_mode/org_to_jsonl.py +++ b/src/processor/org_mode/org_to_jsonl.py @@ -141,7 +141,7 @@ def convert_org_nodes_to_entries(entries: list[orgnode.Orgnode], entry_to_file_m return entry_maps -def convert_org_entries_to_jsonl(entries) -> str: +def convert_org_entries_to_jsonl(entries: list[dict]) -> str: "Convert each Org-Mode entry to JSON and collate as JSONL" return ''.join([f'{json.dumps(entry_dict, ensure_ascii=False)}\n' for entry_dict in entries])