mirror of
https://github.com/donnemartin/system-design-primer.git
synced 2025-12-14 17:08:56 +03:00
Crawler should add page to index and document queue
This commit is contained in:
@@ -159,6 +159,8 @@ class Crawler(object):
|
||||
...
|
||||
|
||||
def crawl_page(self, page):
|
||||
self.reverse_index_queue.add(page.url)
|
||||
self.doc_index_queue.add(page.url)
|
||||
for url in page.child_urls:
|
||||
self.data_store.add_link_to_crawl(url)
|
||||
page.signature = self.create_signature(page)
|
||||
|
||||
Reference in New Issue
Block a user