mirror of
https://github.com/khoaliber/khoj.git
synced 2026-03-02 21:19:12 +00:00
Identify markdown headings by any whitespace character after ^#+
Previously, only lines with a space character after the leading # characters were considered Markdown headings, so a line starting with ^##\t wasn't considered a valid heading.
This commit is contained in:
@@ -146,7 +146,7 @@ class MarkdownToEntries(TextToEntries):
|
||||
else:
|
||||
entry_filename = str(Path(raw_filename))
|
||||
|
||||
heading = parsed_entry.splitlines()[0] if re.search("^#+\s", parsed_entry) else ""
|
||||
heading = parsed_entry.splitlines()[0] if re.search(r"^#+\s", parsed_entry) else ""
|
||||
# Append base filename to compiled entry for context to model
|
||||
# Increment heading level for heading entries and make the filename the top-level heading
|
||||
prefix = f"# {entry_filename}\n#" if heading else f"# {entry_filename}\n"
|
||||
|
||||
Reference in New Issue
Block a user