2019-06-25 00:38:18 +00:00
|
|
|
import xmltree, htmlparser, strtabs, strformat, times
|
2019-06-23 23:34:30 +00:00
|
|
|
import nimquery, regex
|
|
|
|
|
2019-06-24 03:14:14 +00:00
|
|
|
import ./types, ./formatters, ./api
|
2019-06-23 23:34:30 +00:00
|
|
|
|
|
|
|
const
|
|
|
|
thumbRegex = re".+:url\('([^']+)'\)"
|
|
|
|
gifRegex = re".+thumb/([^\.']+)\.jpg.*"
|
|
|
|
|
|
|
|
proc getAttr*(node: XmlNode; attr: string; default=""): string =
|
|
|
|
if node.isNil or node.attrs.isNil: return default
|
|
|
|
return node.attrs.getOrDefault(attr)
|
|
|
|
|
|
|
|
proc selectAttr*(node: XmlNode; selector: string; attr: string; default=""): string =
|
|
|
|
let res = node.querySelector(selector)
|
|
|
|
if res == nil: "" else: res.getAttr(attr, default)
|
|
|
|
|
|
|
|
proc selectText*(node: XmlNode; selector: string): string =
|
|
|
|
let res = node.querySelector(selector)
|
|
|
|
result = if res == nil: "" else: res.innerText()
|
|
|
|
|
2019-06-24 07:30:34 +00:00
|
|
|
proc getHeader(profile: XmlNode): XmlNode =
|
|
|
|
result = profile.querySelector(".permalink-header")
|
|
|
|
if result.isNil:
|
|
|
|
result = profile.querySelector(".stream-item-header")
|
|
|
|
if result.isNil:
|
|
|
|
result = profile.querySelector(".ProfileCard-userFields")
|
|
|
|
|
2019-06-23 23:34:30 +00:00
|
|
|
proc isVerified*(profile: XmlNode): bool =
|
2019-06-24 07:30:34 +00:00
|
|
|
getHeader(profile).selectText(".Icon.Icon--verified").len > 0
|
2019-06-23 23:34:30 +00:00
|
|
|
|
|
|
|
proc isProtected*(profile: XmlNode): bool =
|
2019-06-24 07:30:34 +00:00
|
|
|
getHeader(profile).selectText(".Icon.Icon--protected").len > 0
|
2019-06-23 23:34:30 +00:00
|
|
|
|
|
|
|
proc getName*(profile: XmlNode; selector: string): string =
|
2019-06-25 00:38:18 +00:00
|
|
|
profile.selectText(selector).stripText()
|
2019-06-23 23:34:30 +00:00
|
|
|
|
|
|
|
proc getUsername*(profile: XmlNode; selector: string): string =
|
|
|
|
profile.selectText(selector).strip(chars={'@', ' '})
|
|
|
|
|
2019-06-25 00:38:18 +00:00
|
|
|
proc emojify*(node: XmlNode) =
|
|
|
|
for i in node.querySelectorAll(".Emoji"):
|
|
|
|
i.add newText(i.getAttr("alt"))
|
|
|
|
|
2019-06-25 02:52:38 +00:00
|
|
|
proc getQuoteText*(tweet: XmlNode): string =
|
|
|
|
let
|
|
|
|
text = tweet.querySelector(".QuoteTweet-text")
|
|
|
|
hasEmojis = not text.querySelector(".Emoji").isNil
|
|
|
|
|
|
|
|
if hasEmojis:
|
|
|
|
emojify(text)
|
|
|
|
|
|
|
|
result = stripText(selectText(text, ".tweet-text"))
|
|
|
|
result = stripTwitterUrls(result)
|
|
|
|
|
2019-06-23 23:34:30 +00:00
|
|
|
proc getTweetText*(tweet: XmlNode): string =
|
2019-06-24 07:39:45 +00:00
|
|
|
let
|
|
|
|
selector = ".tweet-text > a.twitter-timeline-link.u-hidden"
|
|
|
|
link = tweet.selectAttr(selector, "data-expanded-url")
|
|
|
|
quote = tweet.querySelector(".QuoteTweet")
|
2019-06-25 00:38:18 +00:00
|
|
|
text = tweet.querySelector(".tweet-text")
|
|
|
|
hasEmojis = not text.querySelector(".Emoji").isNil
|
|
|
|
|
|
|
|
if hasEmojis:
|
|
|
|
emojify(text)
|
|
|
|
|
|
|
|
result = stripText(selectText(text, ".tweet-text"))
|
2019-06-23 23:34:30 +00:00
|
|
|
|
2019-06-24 07:39:45 +00:00
|
|
|
if not quote.isNil and link.len > 0:
|
2019-06-25 00:38:18 +00:00
|
|
|
result = result.replace(link, "")
|
2019-06-23 23:34:30 +00:00
|
|
|
|
2019-06-25 00:38:18 +00:00
|
|
|
result = stripTwitterUrls(result)
|
2019-06-23 23:34:30 +00:00
|
|
|
|
|
|
|
proc getTime(tweet: XmlNode): XmlNode =
|
|
|
|
tweet.querySelector(".js-short-timestamp")
|
|
|
|
|
|
|
|
proc getTimestamp*(tweet: XmlNode): Time =
|
|
|
|
let time = getTime(tweet).getAttr("data-time", "0")
|
|
|
|
fromUnix(parseInt(time))
|
|
|
|
|
|
|
|
proc getShortTime*(tweet: XmlNode): string =
|
|
|
|
getTime(tweet).innerText()
|
|
|
|
|
|
|
|
proc getBio*(profile: XmlNode; selector: string): string =
|
2019-06-25 00:38:18 +00:00
|
|
|
profile.selectText(selector).stripText()
|
2019-06-23 23:34:30 +00:00
|
|
|
|
|
|
|
proc getAvatar*(profile: XmlNode; selector: string): string =
|
|
|
|
profile.selectAttr(selector, "src").getUserpic()
|
|
|
|
|
|
|
|
proc getBanner*(tweet: XmlNode): string =
|
|
|
|
let url = tweet.selectAttr("svg > image", "xlink:href")
|
|
|
|
|
|
|
|
if url.len > 0:
|
|
|
|
result = url.replace("600x200", "1500x500")
|
|
|
|
else:
|
|
|
|
result = tweet.selectAttr(".ProfileCard-bg", "style")
|
|
|
|
|
|
|
|
if result.len == 0:
|
|
|
|
result = "background-color: #161616"
|
|
|
|
|
|
|
|
proc getPopupStats*(profile: var Profile; node: XmlNode) =
|
|
|
|
for s in node.querySelectorAll( ".ProfileCardStats-statLink"):
|
|
|
|
let text = s.getAttr("title").split(" ")[0]
|
|
|
|
case s.getAttr("href").split("/")[^1]
|
|
|
|
of "followers": profile.followers = text
|
|
|
|
of "following": profile.following = text
|
|
|
|
else: profile.tweets = text
|
|
|
|
|
|
|
|
proc getIntentStats*(profile: var Profile; node: XmlNode) =
|
|
|
|
profile.tweets = "?"
|
|
|
|
for s in node.querySelectorAll( "dd.count > a"):
|
|
|
|
let text = s.innerText()
|
|
|
|
case s.getAttr("href").split("/")[^1]
|
|
|
|
of "followers": profile.followers = text
|
|
|
|
of "following": profile.following = text
|
|
|
|
|
2019-06-24 03:14:14 +00:00
|
|
|
proc getTweetStats*(tweet: Tweet; node: XmlNode) =
|
2019-06-23 23:34:30 +00:00
|
|
|
tweet.replies = "0"
|
|
|
|
tweet.retweets = "0"
|
|
|
|
tweet.likes = "0"
|
|
|
|
for action in node.querySelectorAll(".ProfileTweet-actionCountForAria"):
|
|
|
|
let text = action.innerText.split()
|
|
|
|
case text[1]
|
|
|
|
of "replies": tweet.replies = text[0]
|
|
|
|
of "likes": tweet.likes = text[0]
|
|
|
|
of "retweets": tweet.retweets = text[0]
|
|
|
|
|
2019-06-24 03:14:14 +00:00
|
|
|
proc getGif(player: XmlNode): Gif =
|
|
|
|
let
|
|
|
|
thumb = player.getAttr("style").replace(thumbRegex, "$1")
|
|
|
|
id = thumb.replace(gifRegex, "$1")
|
|
|
|
url = fmt"https://video.twimg.com/tweet_video/{id}.mp4"
|
|
|
|
Gif(url: url, thumb: thumb)
|
|
|
|
|
|
|
|
proc getTweetMedia*(tweet: Tweet; node: XmlNode) =
|
2019-06-23 23:34:30 +00:00
|
|
|
for photo in node.querySelectorAll(".AdaptiveMedia-photoContainer"):
|
|
|
|
tweet.photos.add photo.attrs["data-image-url"]
|
|
|
|
|
2019-06-24 03:14:14 +00:00
|
|
|
let player = node.querySelector(".PlayableMedia")
|
|
|
|
if player.isNil:
|
2019-06-23 23:34:30 +00:00
|
|
|
return
|
|
|
|
|
2019-06-24 03:14:14 +00:00
|
|
|
if "gif" in player.getAttr("class"):
|
|
|
|
tweet.gif = some(getGif(player.querySelector(".PlayableMedia-player")))
|
2019-06-24 03:29:47 +00:00
|
|
|
elif "video" in player.getAttr("class"):
|
2019-06-24 03:14:14 +00:00
|
|
|
tweet.video = some(Video())
|
2019-06-24 06:07:36 +00:00
|
|
|
|
|
|
|
proc getQuoteMedia*(quote: var Quote; node: XmlNode) =
|
2019-06-25 00:58:33 +00:00
|
|
|
let sensitive = node.querySelector(".QuoteTweet--sensitive")
|
|
|
|
if not sensitive.isNil:
|
|
|
|
quote.sensitive = true
|
|
|
|
return
|
|
|
|
|
2019-06-24 06:07:36 +00:00
|
|
|
let media = node.querySelector(".QuoteMedia")
|
|
|
|
if not media.isNil:
|
|
|
|
quote.thumb = some(media.selectAttr("img", "src"))
|
|
|
|
|
|
|
|
let badge = node.querySelector(".AdaptiveMedia-badgeText")
|
2019-06-24 22:39:32 +00:00
|
|
|
let gifBadge = node.querySelector(".Icon--gifBadge")
|
|
|
|
|
2019-06-24 06:07:36 +00:00
|
|
|
if not badge.isNil:
|
|
|
|
quote.badge = some(badge.innerText())
|
2019-06-24 22:39:32 +00:00
|
|
|
elif not gifBadge.isNil:
|
|
|
|
quote.badge = some("GIF")
|