From 52197be83341ad3b4ed4792d083c3b9f6ad00319 Mon Sep 17 00:00:00 2001 From: Holger <3876469+HolgerAusB@users.noreply.github.com> Date: Thu, 5 Dec 2024 13:20:13 +0000 Subject: [PATCH] Update immub.org.txt (#1518) --- immub.org.txt | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/immub.org.txt b/immub.org.txt index 819630a3..f0f095af 100644 --- a/immub.org.txt +++ b/immub.org.txt @@ -4,7 +4,8 @@ http_header(User-Agent): Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:135.0) Gecko/20100101 Firefox/135.0 body: //article[contains(concat(' ',normalize-space(@class),' '),' article ')] -a +body: //article[contains(concat(' ',normalize-space(@class),' '),' project ')] + #due to JavaScript the real conent is found with a different URL: next_page_link: concat( substring-before( substring-after ( (//script[contains(text(), 'bucket_domain =')]/text()) , "bucket_domain = '") , "'") , substring-before( substring-after ( (//script[contains(text(), 'sarquivo_pt =')]/text()) , "sarquivo_pt = '") , "'") ) @@ -13,6 +14,9 @@ strip_id_or_class: article-header strip_id_or_class: article-footer strip_id_or_class: visible-xs +# prevent FTR to inject picture from og:image +insert_detected_image: no + prune: no tidy: no