From ca13aea547ab4c7eeef66495ce9a2b45823a26e8 Mon Sep 17 00:00:00 2001
From: blankie
Date: Wed, 24 May 2023 21:42:29 +0700
Subject: [PATCH] Remove Gamespot reviews/ads

https://lists.sr.ht/~cadence/breezewiki-discuss/%3C0ad4dbad07a1be394eefe43e33fff860b2d6176e%40disroot.org%3E
---
 lib/tree-updater.rkt | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

diff --git a/lib/tree-updater.rkt b/lib/tree-updater.rkt
index 0dbf695e..e7d48b43 100644
--- a/lib/tree-updater.rkt
+++ b/lib/tree-updater.rkt
@@ -58,7 +58,9 @@
                                   (data-src "https://static.wikia.nocookie.net/nice-image-thumbnail.png")
                                   (class "thumbimage")))))
                     (figcaption "Test figure!"))
-            (iframe (@ (src "https://example.com/iframe-src")))))))
+            (iframe (@ (src "https://example.com/iframe-src")))
+            (div (@ (class "reviews"))
+                 (header "GameSpot Expert Reviews"))))))
 
 (define (updater wikiname #:strict-proxy? [strict-proxy? #f])
   ;; precompute wikiurl regex for efficency
@@ -238,6 +240,9 @@
                         [(list (list 'img _)) #t]
                         [_ #f]))
               return-no-element]
+             ; remove gamespot reviews/ads
+             [(has-class? "reviews" attributes)
+              return-no-element]
              [#t
               (list element-type
                     ;; attributes
@@ -297,6 +302,8 @@
                 "/proxy?dest=https%3A%2F%2Fstatic.wikia.nocookie.net%2Fnice-image.png")
   ; check that noscript images are removed
   (check-equal? ((query-selector (λ (t a c) (eq? t 'noscript)) transformed)) #f)
+  ; check that gamespot reviews/ads are removed
+  (check-equal? ((query-selector (λ (t a c) (has-class? "reviews" a)) transformed)) #f)
   ; benchmark
   (when (file-exists? "../storage/Frog.html")
     (with-input-from-file "../storage/Frog.html"