From 3787f756f3b8e72ea8d5267e8d3fbb7d42872c8c Mon Sep 17 00:00:00 2001 From: Marco Lents Date: Sun, 16 Nov 2025 13:01:56 +0100 Subject: [PATCH] improve no disclosure handling --- crawler.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/crawler.py b/crawler.py index ff05b46..5b70260 100644 --- a/crawler.py +++ b/crawler.py @@ -303,7 +303,11 @@ def get_disclosures(elem): continue if child.text.strip() == "": continue + if child.text.strip() == "Keine veröffentlichungspflichtigen Angaben.": + continue current_body.append(child.text.strip()) + if current_heading == "" and current_body == []: + continue out.append((current_heading, current_body)) return out