diff options
-rw-r--r-- | crocoite/behavior.py | 7 |
1 files changed, 5 insertions, 2 deletions
diff --git a/crocoite/behavior.py b/crocoite/behavior.py index efb2ced..4d89ae7 100644 --- a/crocoite/behavior.py +++ b/crocoite/behavior.py @@ -259,9 +259,12 @@ class DomSnapshot (Behavior): if url in haveUrls: # ignore duplicate URLs. they are usually caused by # javascript-injected iframes (advertising) with no(?) src - self.logger.warning (f'have DOM snapshot for URL {url}, ignoring') + self.logger.warning ('dom snapshot duplicate', + uuid='d44de989-98d4-456e-82e7-9d4c49acab5e') elif url.scheme in ('http', 'https'): - self.logger.debug (f'saving DOM snapshot for url {url}, base {doc["baseURL"]}') + self.logger.debug ('dom snapshot', + uuid='ece7ff05-ccd9-44b5-b6a8-be25a24b96f4', + base=doc["baseURL"]) haveUrls.add (url) walker = ChromeTreeWalker (doc) # remove script, to make the page static and noscript, because at the |