More robust crawling
parent 5d4bd30e20
commit 968ff6d24c

2 changed files with 3 additions and 1 deletion
@@ -291,6 +291,8 @@ async def async_crawler(url, output_tree, headers=None):
                 if sample_url not in queued
                 and sample_url not in crawled
             ]
+        else:
+            print("No html received")
     print(crawled)
     output_tree += crawl_tree
 
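The first hunk attaches an else branch to what is presumably an `if html:` guard, so a fetch that yields no HTML is reported instead of being skipped silently. Below is a minimal, self-contained sketch of how the surrounding loop plausibly reads after this commit; the `fetch` and `extract_links` helpers, the `while queued:` loop, and everything outside the diff lines are assumptions, not part of the commit.

import asyncio
import re


async def fetch(url, headers=None):
    # Hypothetical stand-in for the project's real HTTP fetch.
    # Returns the page HTML as a string, or None when nothing came back.
    return None


def extract_links(html):
    # Hypothetical stand-in for the project's real link extraction.
    return re.findall(r'href="([^"]+)"', html)


async def async_crawler(url, output_tree, headers=None):
    queued = [url]   # URLs waiting to be fetched
    crawled = []     # URLs already visited
    crawl_tree = []

    while queued:
        current = queued.pop(0)
        crawled.append(current)
        html = await fetch(current, headers=headers)
        if html:
            crawl_tree.append(current)
            # Enqueue only URLs not already queued or visited
            # (the filter lines shown in the diff).
            queued += [
                sample_url
                for sample_url in extract_links(html)
                if sample_url not in queued
                and sample_url not in crawled
            ]
        else:
            # Added in this commit: surface empty responses
            # instead of dropping them silently.
            print("No html received")
    print(crawled)
    output_tree += crawl_tree


asyncio.run(async_crawler("https://example.com", []))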
@@ -244,6 +244,6 @@ def generate_history(user, start_time):
             new_line.full_clean()
             new_line.save()
         except ValidationError:
-            pass
+            continue
 
     return history
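The second hunk swaps `pass` for `continue` inside the except handler. Inside a loop body, `pass` lets execution fall through to whatever follows the try/except, so a line that failed validation could still be processed by the rest of the iteration; `continue` abandons the iteration outright. The toy below illustrates that difference; the `Line` class, its validation rule, and the loop shape are invented for the example and are not the project's actual model code (the real `ValidationError` is presumably Django's).

class ValidationError(Exception):
    # Minimal stand-in for django.core.exceptions.ValidationError.
    pass


class Line:
    def __init__(self, text):
        self.text = text

    def full_clean(self):
        # Hypothetical validation rule: reject empty lines.
        if not self.text:
            raise ValidationError("empty line")

    def save(self):
        pass  # persistence elided for the example


def generate_history(texts):
    history = []
    for text in texts:
        new_line = Line(text)
        try:
            new_line.full_clean()
            new_line.save()
        except ValidationError:
            # `continue` (new) skips the rest of the iteration, so the
            # invalid line never reaches the append below. The old `pass`
            # would have fallen through and appended it anyway.
            continue
        history.append(new_line)

    return history


print(len(generate_history(["a", "", "b"])))  # 2: the empty line is skipped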