We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 40fd1a8, commit a9c44e2 (Copy full SHA for a9c44e2)
src/fundus/publishers/de/dw.py
@@ -23,7 +23,7 @@ class V2(BaseParser):
23
# https://regex101.com/r/uZLwyb/1
24
# Matches a whole string made of slash-separated 2-3 letter tokens (each token
# all-lowercase or all-uppercase), one whitespace character, and then a
# parenthesised, comma-separated list of lowercase 2-3 letter tokens,
# e.g. "ab/cd (dpa, afp)".
# NOTE(review): presumably the author/agency abbreviation line of an article,
# which the paragraph selector excludes -- confirm against real pages.
_author_regex = r"^([a-z]{2,3}\/|[A-Z]{2,3}\/)*([a-z]{2,3}|[A-Z]{2,3})\s\(([a-z]{2,3}, )*([a-z]{2,3})\)$"
25
_paragraph_selector = XPath(
26
- f"//div[contains(@class, 'rich-text')] /p[not(em) or text() and not(re:test(text(), '{_author_regex}'))]",
+ f"//div[contains(@class, 'rich-text')] /p[text() and not(re:test(text(), '{_author_regex}'))]",
27
namespaces={"re": "http://exslt.org/regular-expressions"},
28
)
29
# Selects <p> elements that are direct children of a <header> element.
_summary_selector = CSSSelector("header > p")
0 commit comments