Replace thread-let with thread-utils

This commit is contained in:
Cadence Ember 2023-02-12 13:55:33 +13:00
parent 5fa6e2fb9e
commit 501dcaa3fc
Signed by untrusted user: cadence
GPG key ID: BC1C2C61CF521B17
9 changed files with 255 additions and 215 deletions

View file

@ -4,8 +4,6 @@
(provide (provide
; help make a nested if. if/in will gain the same false form of its containing if/out. ; help make a nested if. if/in will gain the same false form of its containing if/out.
if/out if/out
; let, but the value for each variable is evaluated within a thread
thread-let
; cond, but values can be defined between conditions ; cond, but values can be defined between conditions
cond/var cond/var
; wrap sql statements into lambdas so they can be executed during migration ; wrap sql statements into lambdas so they can be executed during migration
@ -25,7 +23,6 @@
(provide (provide
transform-if/out transform-if/out
transform-thread-let
transform/out-cond/var) transform/out-cond/var)
(define (transform-if/out stx) (define (transform-if/out stx)
@ -51,26 +48,6 @@
[#t node]))) [#t node])))
(datum->syntax stx (cons 'if result))) (datum->syntax stx (cons 'if result)))
(define (transform-thread-let stx)
(define tree (cdr (syntax->datum stx)))
(define defs (car tree))
(define forms (cdr tree))
(when (eq? (length forms) 0)
(error (format "thread-let: bad syntax (need some forms to execute after the threads)~n forms: ~a" forms)))
(define counter (build-list (length defs) values))
(datum->syntax
stx
`(let ([chv (build-vector ,(length defs) (λ (_) (make-channel)))])
,@(map (λ (n)
(define def (list-ref defs n))
`(thread (λ () (channel-put (vector-ref chv ,n) (let _ () ,@(cdr def))))))
counter)
(let ,(map (λ (n)
(define def (list-ref defs n))
`(,(car def) (channel-get (vector-ref chv ,n))))
counter)
,@forms))))
(define (transform/out-cond/var stx) (define (transform/out-cond/var stx)
(define tree (transform-cond/var (cdr (syntax->datum stx)))) (define tree (transform-cond/var (cdr (syntax->datum stx))))
(datum->syntax (datum->syntax
@ -119,35 +96,6 @@
(check-equal? (if/out #t (if/in #f 'yes) 'no) 'no) (check-equal? (if/out #t (if/in #f 'yes) 'no) 'no)
(check-equal? (if/out #f (if/in #f 'yes) 'no) 'no)) (check-equal? (if/out #f (if/in #f 'yes) 'no) 'no))
(define-syntax (thread-let stx)
(transform-thread-let stx))
(module+ test
; check that it is transformed as expected
(check-syntax-equal?
(transform-thread-let
#'(thread-let ([a (hey "this is a")]
[b (hey "this is b")])
(list a b)))
#'(let ([chv (build-vector 2 (λ (_) (make-channel)))])
(thread (λ () (channel-put (vector-ref chv 0) (let _ () (hey "this is a")))))
(thread (λ () (channel-put (vector-ref chv 1) (let _ () (hey "this is b")))))
(let ([a (channel-get (vector-ref chv 0))]
[b (channel-get (vector-ref chv 1))])
(list a b))))
; check that they actually execute concurrently
(define ch (make-channel))
(check-equal? (thread-let ([a (begin
(channel-put ch 'a)
(channel-get ch))]
[b (begin0
(channel-get ch)
(channel-put ch 'b))])
(list a b))
'(b a))
; check that it assigns the correct value to the correct variable
(check-equal? (thread-let ([a (sleep 0) 'a] [b 'b]) (list a b))
'(a b)))
(define-syntax (cond/var stx) (define-syntax (cond/var stx)
(transform/out-cond/var stx)) (transform/out-cond/var stx))
(module+ test (module+ test

72
lib/thread-utils.rkt Normal file
View file

@ -0,0 +1,72 @@
#lang racket/base
(require (prefix-in easy: net/http-easy)
"../src/data.rkt"
"xexpr-utils.rkt")
(provide
thread-values)
(module+ test
(require rackunit))
(define (thread-values . thunks)
(parameterize-break #t
(define the-exn (box #f))
(define original-thread (current-thread))
(define (break e)
(when (box-cas! the-exn #f e)
(break-thread original-thread))
(sleep 0))
(define-values (threads channels)
(for/fold ([ts null]
[chs null]
#:result (values (reverse ts) (reverse chs)))
([th thunks])
(define ch (make-channel))
(define t
(thread (λ ()
(with-handlers ([exn? break])
(channel-put ch (th))))))
(values (cons t ts) (cons ch chs))))
(apply
values
(with-handlers ([exn:break? (λ (_)
(for ([t threads]) (kill-thread t))
(if (unbox the-exn)
(raise (unbox the-exn))
(error 'thread-values "a thread broke, but without reporting its exception")))])
(for/list ([ch channels])
(channel-get ch))))))
(module+ test
; check that they actually execute concurrently
(define ch (make-channel))
(check-equal? (let-values ([(a b)
(thread-values
(λ ()
(begin
(channel-put ch 'a)
(channel-get ch)))
(λ ()
(begin0
(channel-get ch)
(channel-put ch 'b))))])
(list a b))
'(b a))
; check that it assigns the correct value to the correct variable
(check-equal? (let-values ([(a b)
(thread-values
(λ () (sleep 0) 'a)
(λ () 'b))])
(list a b))
'(a b))
; check that exceptions are passed to the original thread, and other threads are killed
;; TODO: if the other thread was making an HTTP request, could it be left stuck open by the kill?
(check-equal? (let* ([x "!"]
[res
(with-handlers ([exn:fail:user? (λ (e) (exn-message e))])
(thread-values
(λ () (sleep 0) (set! x "?") (println "this side effect should not happen"))
(λ () (raise-user-error "catch me"))))])
(string-append res x))
"catch me!"))

View file

@ -277,8 +277,8 @@
; check that noscript images are removed ; check that noscript images are removed
(check-equal? ((query-selector (λ (t a c) (eq? t 'noscript)) transformed)) #f) (check-equal? ((query-selector (λ (t a c) (eq? t 'noscript)) transformed)) #f)
; benchmark ; benchmark
(when (file-exists? "../misc/Frog.html") (when (file-exists? "../storage/Frog.html")
(with-input-from-file "../misc/Frog.html" (with-input-from-file "../storage/Frog.html"
(λ () (λ ()
(define tree (html->xexp (current-input-port))) (define tree (html->xexp (current-input-port)))
(time (length (update-tree-wiki tree "minecraft"))))))) (time (length (update-tree-wiki tree "minecraft")))))))

View file

@ -201,13 +201,16 @@
,(if (config-true? 'instance_is_official) ,(if (config-true? 'instance_is_official)
(let ([balloon '(img (@ (src "/static/three-balloons.png") (class "bw-balloon") (title "Image Source: pngimg.com/image/4955 | License: CC BY-NC 4.0 | Modifications: Resized") (width "52") (height "56")))] (let ([balloon '(img (@ (src "/static/three-balloons.png") (class "bw-balloon") (title "Image Source: pngimg.com/image/4955 | License: CC BY-NC 4.0 | Modifications: Resized") (width "52") (height "56")))]
[extension-eligible? [extension-eligible?
(and req (let* ([ua-pair (assq 'user-agent (request-headers req))] (cond/var
[ua (string-downcase (cdr ua-pair))]) [(not req) #f]
;; everyone pretends to be chrome, so we do it in reverse (var ua-pair (assq 'user-agent (request-headers req)))
;; this excludes common browsers that don't support the extension [(not ua-pair) #f]
(and (not (string-contains? ua "edge/")) (var ua (string-downcase (cdr ua-pair)))
(not (string-contains? ua "edg/")) ;; everyone pretends to be chrome, so we do it in reverse
(not (string-contains? ua "mobile")))))]) ;; this excludes common browsers that don't support the extension
[#t (and (not (string-contains? ua "edge/"))
(not (string-contains? ua "edg/"))
(not (string-contains? ua "mobile")))])])
`(div (@ (class "bw-top-banner")) `(div (@ (class "bw-top-banner"))
,balloon ,balloon
(div (div

View file

@ -28,7 +28,7 @@
(hash-set! wikis-hash (symbol->string wikiname) w))) (hash-set! wikis-hash (symbol->string wikiname) w)))
(module+ test (module+ test
(check-equal? (cadr (hash-ref wikis-hash "gallowmere")) (check-equal? (cadr (hash-ref wikis-hash "gallowmere"))
"Gallowmere Historia")) "MediEvil Wiki"))
(define (parse-table table) (define (parse-table table)
(define rows (query-selector (λ (t a c) (eq? t 'tr)) table)) (define rows (query-selector (λ (t a c) (eq? t 'tr)) table))

View file

@ -17,6 +17,7 @@
"data.rkt" "data.rkt"
"page-wiki.rkt" "page-wiki.rkt"
"../lib/syntax.rkt" "../lib/syntax.rkt"
"../lib/thread-utils.rkt"
"../lib/url-utils.rkt" "../lib/url-utils.rkt"
"whole-utils.rkt" "whole-utils.rkt"
"../lib/xexpr-utils.rkt") "../lib/xexpr-utils.rkt")
@ -69,55 +70,59 @@
(define origin (format "https://~a.fandom.com" wikiname)) (define origin (format "https://~a.fandom.com" wikiname))
(define source-url (format "~a/wiki/~a" origin prefixed-category)) (define source-url (format "~a/wiki/~a" origin prefixed-category))
(thread-let (define-values (members-data page-data siteinfo)
([members-data (define dest-url (thread-values
(format "~a/api.php?~a" (λ ()
origin (define dest-url
(params->query `(("action" . "query") (format "~a/api.php?~a"
("list" . "categorymembers") origin
("cmtitle" . ,prefixed-category) (params->query `(("action" . "query")
("cmlimit" . "max") ("list" . "categorymembers")
("formatversion" . "2") ("cmtitle" . ,prefixed-category)
("format" . "json"))))) ("cmlimit" . "max")
(log-outgoing dest-url) ("formatversion" . "2")
(define dest-res (easy:get dest-url #:timeouts timeouts)) ("format" . "json")))))
(easy:response-json dest-res)] (log-outgoing dest-url)
[page-data (define dest-url (define dest-res (easy:get dest-url #:timeouts timeouts))
(format "~a/api.php?~a" (easy:response-json dest-res))
origin (λ ()
(params->query `(("action" . "parse") (define dest-url
("page" . ,prefixed-category) (format "~a/api.php?~a"
("prop" . "text|headhtml|langlinks") origin
("formatversion" . "2") (params->query `(("action" . "parse")
("format" . "json"))))) ("page" . ,prefixed-category)
(log-outgoing dest-url) ("prop" . "text|headhtml|langlinks")
(define dest-res (easy:get dest-url #:timeouts timeouts)) ("formatversion" . "2")
(easy:response-json dest-res)] ("format" . "json")))))
[siteinfo (siteinfo-fetch wikiname)]) (log-outgoing dest-url)
(define dest-res (easy:get dest-url #:timeouts timeouts))
(easy:response-json dest-res))
(λ ()
(siteinfo-fetch wikiname))))
(define title (preprocess-html-wiki (jp "/parse/title" page-data prefixed-category))) (define title (preprocess-html-wiki (jp "/parse/title" page-data prefixed-category)))
(define page-html (preprocess-html-wiki (jp "/parse/text" page-data ""))) (define page-html (preprocess-html-wiki (jp "/parse/text" page-data "")))
(define page (html->xexp page-html)) (define page (html->xexp page-html))
(define head-data ((head-data-getter wikiname) page-data)) (define head-data ((head-data-getter wikiname) page-data))
(define body (generate-results-page (define body (generate-results-page
#:req req #:req req
#:source-url source-url #:source-url source-url
#:wikiname wikiname #:wikiname wikiname
#:title title #:title title
#:members-data members-data #:members-data members-data
#:page page #:page page
#:head-data head-data #:head-data head-data
#:siteinfo siteinfo)) #:siteinfo siteinfo))
(when (config-true? 'debug) (when (config-true? 'debug)
; used for its side effects ; used for its side effects
; convert to string with error checking, error will be raised if xexp is invalid ; convert to string with error checking, error will be raised if xexp is invalid
(xexp->html body)) (xexp->html body))
(response/output (response/output
#:code 200 #:code 200
#:headers (build-headers always-headers) #:headers (build-headers always-headers)
(λ (out) (λ (out)
(write-html body out)))))) (write-html body out)))))
(module+ test (module+ test
(check-not-false ((query-selector (attribute-selector 'href "/test/wiki/Ankle_Monitor") (check-not-false ((query-selector (attribute-selector 'href "/test/wiki/Ankle_Monitor")
(generate-results-page (generate-results-page

View file

@ -17,6 +17,7 @@
"data.rkt" "data.rkt"
"page-wiki.rkt" "page-wiki.rkt"
"../lib/syntax.rkt" "../lib/syntax.rkt"
"../lib/thread-utils.rkt"
"../lib/url-utils.rkt" "../lib/url-utils.rkt"
"whole-utils.rkt" "whole-utils.rkt"
"../lib/xexpr-utils.rkt") "../lib/xexpr-utils.rkt")
@ -108,42 +109,45 @@
(define origin (format "https://~a.fandom.com" wikiname)) (define origin (format "https://~a.fandom.com" wikiname))
(define source-url (format "~a/wiki/~a" origin prefixed-title)) (define source-url (format "~a/wiki/~a" origin prefixed-title))
(thread-let (define-values (media-detail siteinfo)
([media-detail (define dest-url (thread-values
(format "~a/wikia.php?~a" (λ ()
origin (define dest-url
(params->query `(("format" . "json") ("controller" . "Lightbox") (format "~a/wikia.php?~a"
("method" . "getMediaDetail") origin
("fileTitle" . ,prefixed-title))))) (params->query `(("format" . "json") ("controller" . "Lightbox")
(log-outgoing dest-url) ("method" . "getMediaDetail")
(define dest-res (easy:get dest-url #:timeouts timeouts)) ("fileTitle" . ,prefixed-title)))))
(easy:response-json dest-res)] (log-outgoing dest-url)
[siteinfo (siteinfo-fetch wikiname)]) (define dest-res (easy:get dest-url #:timeouts timeouts))
(if (not (jp "/exists" media-detail #f)) (easy:response-json dest-res))
(next-dispatcher) (λ ()
(response-handler (siteinfo-fetch wikiname))))
(define file-title (jp "/fileTitle" media-detail "")) (if (not (jp "/exists" media-detail #f))
(define title (next-dispatcher)
(if (non-empty-string? file-title) (format "File:~a" file-title) prefixed-title)) (response-handler
(define image-content-type (define file-title (jp "/fileTitle" media-detail ""))
(if (non-empty-string? (jp "/videoEmbedCode" media-detail "")) (define title
#f (if (non-empty-string? file-title) (format "File:~a" file-title) prefixed-title))
(url-content-type (jp "/imageUrl" media-detail)))) (define image-content-type
(define body (if (non-empty-string? (jp "/videoEmbedCode" media-detail ""))
(generate-results-page #:req req #f
#:source-url source-url (url-content-type (jp "/imageUrl" media-detail))))
#:wikiname wikiname (define body
#:title title (generate-results-page #:req req
#:media-detail media-detail #:source-url source-url
#:image-content-type image-content-type #:wikiname wikiname
#:siteinfo siteinfo)) #:title title
(when (config-true? 'debug) #:media-detail media-detail
; used for its side effects #:image-content-type image-content-type
; convert to string with error checking, error will be raised if xexp is invalid #:siteinfo siteinfo))
(xexp->html body)) (when (config-true? 'debug)
(response/output #:code 200 ; used for its side effects
#:headers (build-headers always-headers) ; convert to string with error checking, error will be raised if xexp is invalid
(λ (out) (write-html body out)))))))) (xexp->html body))
(response/output #:code 200
#:headers (build-headers always-headers)
(λ (out) (write-html body out)))))))
(module+ test (module+ test
(parameterize ([(config-parameter 'strict_proxy) "true"]) (parameterize ([(config-parameter 'strict_proxy) "true"])
(check-equal? (get-media-html "https://static.wikia.nocookie.net/a" "image/jpeg") (check-equal? (get-media-html "https://static.wikia.nocookie.net/a" "image/jpeg")

View file

@ -14,6 +14,7 @@
"config.rkt" "config.rkt"
"data.rkt" "data.rkt"
"../lib/syntax.rkt" "../lib/syntax.rkt"
"../lib/thread-utils.rkt"
"../lib/url-utils.rkt" "../lib/url-utils.rkt"
"whole-utils.rkt" "whole-utils.rkt"
"../lib/xexpr-utils.rkt") "../lib/xexpr-utils.rkt")
@ -72,23 +73,26 @@
("formatversion" . "2") ("formatversion" . "2")
("format" . "json"))))) ("format" . "json")))))
(thread-let (define-values (dest-res siteinfo)
([dest-res (log-outgoing dest-url) (thread-values
(easy:get dest-url #:timeouts timeouts)] (λ ()
[siteinfo (siteinfo-fetch wikiname)]) (log-outgoing dest-url)
(easy:get dest-url #:timeouts timeouts))
(λ ()
(siteinfo-fetch wikiname))))
(define data (easy:response-json dest-res)) (define data (easy:response-json dest-res))
(define body (generate-results-page req dest-url wikiname query data #:siteinfo siteinfo)) (define body (generate-results-page req dest-url wikiname query data #:siteinfo siteinfo))
(when (config-true? 'debug) (when (config-true? 'debug)
; used for its side effects ; used for its side effects
; convert to string with error checking, error will be raised if xexp is invalid ; convert to string with error checking, error will be raised if xexp is invalid
(xexp->html body)) (xexp->html body))
(response/output (response/output
#:code 200 #:code 200
#:headers (build-headers always-headers) #:headers (build-headers always-headers)
(λ (out) (λ (out)
(write-html body out)))))) (write-html body out)))))
(module+ test (module+ test
(parameterize ([(config-parameter 'feature_offline::only) "false"]) (parameterize ([(config-parameter 'feature_offline::only) "false"])
(check-not-false ((query-selector (attribute-selector 'href "/test/wiki/Gacha_Capsule") (check-not-false ((query-selector (attribute-selector 'href "/test/wiki/Gacha_Capsule")

View file

@ -19,6 +19,7 @@
"data.rkt" "data.rkt"
"../lib/pure-utils.rkt" "../lib/pure-utils.rkt"
"../lib/syntax.rkt" "../lib/syntax.rkt"
"../lib/thread-utils.rkt"
"../lib/tree-updater.rkt" "../lib/tree-updater.rkt"
"../lib/url-utils.rkt" "../lib/url-utils.rkt"
"whole-utils.rkt" "whole-utils.rkt"
@ -41,59 +42,62 @@
(define path (string-join (map path/param-path (cddr (url-path (request-uri req)))) "/")) (define path (string-join (map path/param-path (cddr (url-path (request-uri req)))) "/"))
(define source-url (format "https://~a.fandom.com/wiki/~a" wikiname path)) (define source-url (format "https://~a.fandom.com/wiki/~a" wikiname path))
(thread-let (define-values (dest-res siteinfo)
([dest-res (define dest-url (thread-values
(format "~a/api.php?~a" (λ ()
origin (define dest-url
(params->query `(("action" . "parse") (format "~a/api.php?~a"
("page" . ,path) origin
("prop" . "text|headhtml|langlinks") (params->query `(("action" . "parse")
("formatversion" . "2") ("page" . ,path)
("format" . "json"))))) ("prop" . "text|headhtml|langlinks")
(log-outgoing dest-url) ("formatversion" . "2")
(easy:get dest-url ("format" . "json")))))
#:timeouts timeouts (log-outgoing dest-url)
#:headers `#hasheq((cookie . ,(format "theme=~a" (user-cookies^-theme user-cookies)))))] (easy:get dest-url
[siteinfo (siteinfo-fetch wikiname)]) #:timeouts timeouts
#:headers `#hasheq((cookie . ,(format "theme=~a" (user-cookies^-theme user-cookies))))))
(λ ()
(siteinfo-fetch wikiname))))
(cond (cond
[(eq? 200 (easy:response-status-code dest-res)) [(eq? 200 (easy:response-status-code dest-res))
(let* ([data (easy:response-json dest-res)] (let* ([data (easy:response-json dest-res)]
[title (jp "/parse/title" data "")] [title (jp "/parse/title" data "")]
[page-html (jp "/parse/text" data "")] [page-html (jp "/parse/text" data "")]
[page-html (preprocess-html-wiki page-html)] [page-html (preprocess-html-wiki page-html)]
[page (html->xexp page-html)] [page (html->xexp page-html)]
[head-data ((head-data-getter wikiname) data)]) [head-data ((head-data-getter wikiname) data)])
(if (equal? "missingtitle" (jp "/error/code" data #f)) (if (equal? "missingtitle" (jp "/error/code" data #f))
(next-dispatcher) (next-dispatcher)
(response-handler (response-handler
(define body (define body
(generate-wiki-page (generate-wiki-page
(update-tree-wiki page wikiname) (update-tree-wiki page wikiname)
#:req req #:req req
#:source-url source-url #:source-url source-url
#:wikiname wikiname #:wikiname wikiname
#:title title #:title title
#:head-data head-data #:head-data head-data
#:siteinfo siteinfo)) #:siteinfo siteinfo))
(define redirect-msg ((query-selector (attribute-selector 'class "redirectMsg") body))) (define redirect-msg ((query-selector (attribute-selector 'class "redirectMsg") body)))
(define redirect-query-parameter (dict-ref (url-query (request-uri req)) 'redirect "yes")) (define redirect-query-parameter (dict-ref (url-query (request-uri req)) 'redirect "yes"))
(define headers (define headers
(build-headers (build-headers
always-headers always-headers
; redirect-query-parameter: only the string "no" is significant: ; redirect-query-parameter: only the string "no" is significant:
; https://github.com/Wikia/app/blob/fe60579a53f16816d65dad1644363160a63206a6/includes/Wiki.php#L367 ; https://github.com/Wikia/app/blob/fe60579a53f16816d65dad1644363160a63206a6/includes/Wiki.php#L367
(when (and redirect-msg (when (and redirect-msg
(not (equal? redirect-query-parameter "no"))) (not (equal? redirect-query-parameter "no")))
(let* ([dest (get-attribute 'href (bits->attributes ((query-selector (λ (t a c) (eq? t 'a)) redirect-msg))))] (let* ([dest (get-attribute 'href (bits->attributes ((query-selector (λ (t a c) (eq? t 'a)) redirect-msg))))]
[value (bytes-append #"0;url=" (string->bytes/utf-8 dest))]) [value (bytes-append #"0;url=" (string->bytes/utf-8 dest))])
(header #"Refresh" value))))) (header #"Refresh" value)))))
(when (config-true? 'debug) (when (config-true? 'debug)
; used for its side effects ; used for its side effects
; convert to string with error checking, error will be raised if xexp is invalid ; convert to string with error checking, error will be raised if xexp is invalid
(xexp->html body)) (xexp->html body))
(response/output (response/output
#:code 200 #:code 200
#:headers headers #:headers headers
(λ (out) (λ (out)
(write-html body out))))))]))) (write-html body out))))))]))