summary refs log tree commit diff
path: root/crocoite
diff options
context:
space:
mode:
Diffstat (limited to 'crocoite')
-rw-r--r-- crocoite/behavior.py 7
1 files changed, 5 insertions, 2 deletions
diff --git a/crocoite/behavior.py b/crocoite/behavior.py
index efb2ced..4d89ae7 100644
--- a/crocoite/behavior.py
+++ b/crocoite/behavior.py
@@ -259,9 +259,12 @@ class DomSnapshot (Behavior):
if url in haveUrls:
# ignore duplicate URLs. they are usually caused by
# javascript-injected iframes (advertising) with no(?) src
- self.logger.warning (f'have DOM snapshot for URL {url}, ignoring')
+ self.logger.warning ('dom snapshot duplicate',
+ uuid='d44de989-98d4-456e-82e7-9d4c49acab5e')
elif url.scheme in ('http', 'https'):
- self.logger.debug (f'saving DOM snapshot for url {url}, base {doc["baseURL"]}')
+ self.logger.debug ('dom snapshot',
+ uuid='ece7ff05-ccd9-44b5-b6a8-be25a24b96f4',
+ base=doc["baseURL"])
haveUrls.add (url)
walker = ChromeTreeWalker (doc)
# remove script, to make the page static and noscript, because at the