Implement recursive page crawling
parent 3d7b72e5ef
commit 9fc2e1af53
5 changed files with 47 additions and 26 deletions
@@ -27,7 +27,7 @@ def build_index():
     if len(matching_urls) == 0:
         # if not url.strip() in dictionary[word]:
         entries = dictionary[word]
-        entry = {"url": url.strip(), "count": 1}
+        entry = {"url": url.strip(), "count": 1, "filename": str(path)}
         dictionary[word].append(entry)
     else:
         entries = dictionary[word]
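The hunk above only changes the shape of each index entry, adding a "filename" field so build_index() can record which saved file a URL came from; the recursive crawling named in the commit title is not part of this excerpt. Below is a minimal sketch of how such a crawler could fetch a page, save it locally for indexing, and follow same-host links recursively. The crawl() helper, its parameters, and the use of requests and BeautifulSoup are assumptions for illustration, not the repository's actual code.

# Sketch only: hypothetical crawler feeding pages to build_index().
from pathlib import Path
from urllib.parse import urljoin, urlparse

import requests
from bs4 import BeautifulSoup


def crawl(url, out_dir, visited=None, max_pages=100):
    """Recursively fetch `url` and every same-host page reachable from it."""
    if visited is None:
        visited = set()
    if url in visited or len(visited) >= max_pages:
        return visited
    visited.add(url)

    response = requests.get(url, timeout=10)
    if response.status_code != 200:
        return visited

    # Save the page so the indexer can later store url, count, and filename.
    out_dir = Path(out_dir)
    out_dir.mkdir(parents=True, exist_ok=True)
    name = urlparse(url).path.strip("/").replace("/", "_") or "index"
    (out_dir / name).with_suffix(".html").write_text(response.text, encoding="utf-8")

    # Follow links on the same host, recursing into each unvisited one.
    soup = BeautifulSoup(response.text, "html.parser")
    for anchor in soup.find_all("a", href=True):
        target = urljoin(url, anchor["href"])
        if urlparse(target).netloc == urlparse(url).netloc:
            crawl(target, out_dir, visited, max_pages)
    return visited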