438 lines
14 KiB
Nim
438 lines
14 KiB
Nim
# SPDX-License-Identifier: AGPL-3.0-only
|
|
import strutils, options, tables, times, math
|
|
import packedjson, packedjson/deserialiser
|
|
import types, parserutils, utils
|
|
import experimental/parser/unifiedcard
|
|
|
|
proc parseUser(js: JsonNode; id=""): User =
  ## Builds a `User` from a user JSON object.
  ##
  ## A non-empty `id` argument takes precedence over the node's own
  ## `id_str`. When `js` is null, `result` is left at its default value.
  if js.isNull:
    return

  let userId =
    if id.len > 0: id
    else: js{"id_str"}.getStr

  result = User(
    id: userId,
    username: js{"screen_name"}.getStr,
    fullname: js{"name"}.getStr,
    location: js{"location"}.getStr,
    bio: js{"description"}.getStr,
    # Strip the "_normal" marker from the avatar URL.
    userPic: js{"profile_image_url_https"}.getImageStr.replace("_normal", ""),
    banner: js.getBanner,
    following: js{"friends_count"}.getInt,
    followers: js{"followers_count"}.getInt,
    tweets: js{"statuses_count"}.getInt,
    likes: js{"favourites_count"}.getInt,
    media: js{"media_count"}.getInt,
    verified: js{"verified"}.getBool,
    protected: js{"protected"}.getBool,
    joinDate: js{"created_at"}.getTime
  )

  # Post-process the freshly built user with the same JSON node.
  result.expandUserEntities(js)
|
|
|
|
proc parseGraphList*(js: JsonNode): List =
  ## Builds a `List` from a GraphQL response.
  ##
  ## The list object is looked up under `data.user_by_screen_name.list`
  ## first and under `data.list` second. If `js` is null or neither path
  ## holds a value, `result` is left at its default.
  if js.isNull:
    return

  var node = js{"data", "user_by_screen_name", "list"}
  if node.isNull:
    # Fall back to the second known location.
    node = js{"data", "list"}
    if node.isNull:
      return

  result = List(
    id: node{"id_str"}.getStr,
    name: node{"name"}.getStr,
    username: node{"user", "legacy", "screen_name"}.getStr,
    userId: node{"user", "rest_id"}.getStr,
    description: node{"description"}.getStr,
    members: node{"member_count"}.getInt,
    banner: node{"custom_banner_media", "media_info", "url"}.getImageStr
  )
|
|
|
|
proc parsePoll(js: JsonNode): Poll =
  ## Parses a poll card into a `Poll`.
  ##
  ## The card name is expected to look like `pollNchoice_*`; its fifth
  ## character `N` gives the number of choices. For each choice the vote
  ## count and label are read from `binding_values`.
  ##
  ## `status` is the leading unit of the remaining time while the poll
  ## is still open, otherwise "Final results". `leader` is the index of
  ## the first choice with the most votes and `votes` is the total.
  ##
  ## Raises `ValueError` if a choice count is not an integer string.
  let
    vals = js{"binding_values"}
    name = js{"name"}.getStr

  # name format is pollNchoice_*
  # A shorter name has no choice digit; indexing it would raise, so such
  # a card simply yields a poll without choices.
  if name.len > 4:
    for i in '1' .. name[4]:
      let choice = "choice" & i
      result.values.add parseInt(vals{choice & "_count"}.getStrVal("0"))
      result.options.add vals{choice & "_label"}.getStrVal

  let
    endTime = vals{"end_datetime_utc", "string_value"}.getDateTime
    # Sampled once so the comparison and the subtraction use one instant.
    current = now()

  if endTime > current:
    let
      timeLeft = $(endTime - current)
      comma = timeLeft.find(",")
    # Keep only the largest unit. `find` returns -1 when the duration
    # prints as a single unit; in that case use the whole string.
    result.status =
      if comma >= 0: timeLeft[0 ..< comma]
      else: timeLeft
  else:
    result.status = "Final results"

  # `max` cannot be applied to an empty seq; leave `leader` at its default.
  if result.values.len > 0:
    result.leader = result.values.find(max(result.values))
  result.votes = result.values.sum
|
|
|
|
proc parseGif(js: JsonNode): Gif =
  ## Builds a `Gif` from a media entity: the URL comes from the first
  ## entry of `video_info.variants`, the thumbnail from `media_url_https`.
  let firstVariant = js{"video_info", "variants"}[0]

  result = Gif(
    url: firstVariant{"url"}.getImageStr,
    thumb: js{"media_url_https"}.getImageStr
  )
|
|
|
|
proc parseVideo(js: JsonNode): Video =
  ## Builds a `Video` from a media entity, including one `VideoVariant`
  ## per entry of `video_info.variants`.
  ##
  ## `additional_media_info.title` / `.description`, when present,
  ## override the title taken from `ext_alt_text` and set the description.
  let
    # Used when the nested `ext.mediaStats` view count is unavailable.
    fallbackViews = $(js{"mediaStats", "viewCount"}.getInt)
    status = js{"ext_media_availability", "status"}.getStr

  result = Video(
    thumb: js{"media_url_https"}.getImageStr,
    views: js{"ext", "mediaStats", "r", "ok", "viewCount"}.getStr(fallbackViews),
    available: status.toLowerAscii == "available",
    title: js{"ext_alt_text"}.getStr,
    durationMs: js{"video_info", "duration_millis"}.getInt
    # playbackType: mp4
  )

  with mediaTitle, js{"additional_media_info", "title"}:
    result.title = mediaTitle.getStr

  with mediaDescription, js{"additional_media_info", "description"}:
    result.description = mediaDescription.getStr

  for variant in js{"video_info", "variants"}:
    let
      variantUrl = variant{"url"}.getStr
      variantType =
        parseEnum[VideoType](variant{"content_type"}.getStr("summary"))
      # Only mp4 variants get a resolution derived from their URL.
      variantResolution =
        if variantType == mp4: getMp4Resolution(variantUrl)
        else: 0

    result.variants.add VideoVariant(
      contentType: variantType,
      bitrate: variant{"bitrate"}.getInt,
      url: variantUrl,
      resolution: variantResolution
    )
|
|
|
|
proc parsePromoVideo(js: JsonNode): Video =
  ## Builds a `Video` with a single variant from a card's binding values.
  ##
  ## The variant URL is taken from `player_hls_url`, falling back to
  ## `player_stream_url` and then `amplify_url_vmap`. The video is typed
  ## as `vmap` unless the URL contains "m3u8", in which case both the
  ## variant and the playback type become `m3u8`.
  let
    seconds = js{"content_duration_seconds"}.getStrVal("0").parseInt
    vmapUrl = js{"amplify_url_vmap"}.getStrVal()
    streamUrl = js{"player_stream_url"}.getStrVal(vmapUrl)
    playerUrl = js{"player_hls_url"}.getStrVal(streamUrl)

  result = Video(
    thumb: js{"player_image_large"}.getImageVal,
    available: true,
    durationMs: seconds * 1000,
    playbackType: vmap
  )

  var variant = VideoVariant(contentType: vmap, url: playerUrl)

  if "m3u8" in variant.url:
    variant.contentType = m3u8
    result.playbackType = m3u8

  result.variants.add variant
|
|
|
|
proc parseBroadcast(js: JsonNode): Card =
  ## Builds a `broadcast` card from binding values. The large broadcast
  ## thumbnail serves both as the card image and as the thumbnail of the
  ## attached video.
  let thumbnail = js{"broadcast_thumbnail_large"}.getImageVal

  result = Card(
    kind: broadcast,
    url: js{"broadcast_url"}.getStrVal,
    title: js{"broadcaster_display_name"}.getStrVal,
    text: js{"broadcast_title"}.getStrVal,
    image: thumbnail,
    video: some(Video(thumb: thumbnail))
  )
|
|
|
|
proc parseCard(js: JsonNode; urls: JsonNode): Card =
  ## Builds a `Card` from a card JSON object.
  ##
  ## `urls` is the tweet's URL entity list; it is used to swap the card
  ## URL for its `expanded_url` when a matching entry exists.
  ##
  ## The card kind is parsed from the part of `name` after the first ":"
  ## (the whole name if there is none), defaulting to `unknown`. Unified
  ## cards are delegated to `parseUnifiedCard`.
  const imageTypes = ["summary_photo_image", "player_image", "promo_image",
                      "photo_image_full_size", "thumbnail_image", "thumbnail",
                      "event_thumbnail", "image"]

  let
    # NOTE(review): `?` presumably returns from the proc when the node
    # is null - confirm against its definition in parserutils.
    vals = ? js{"binding_values"}
    name = js{"name"}.getStr
    kind = parseEnum[CardKind](name.substr(name.find(":") + 1), unknown)

  if kind == unified:
    return parseUnifiedCard(vals{"unified_card", "string_value"}.getStr)

  result = Card(
    kind: kind,
    url: vals.getCardUrl(kind),
    dest: vals.getCardDomain(kind),
    title: vals.getCardTitle(kind),
    text: vals{"description"}.getStrVal
  )

  if result.url.len == 0:
    result.url = js{"url"}.getStr

  case kind
  of promoVideo, promoVideoConvo, videoDirectMessage:
    result.video = some parsePromoVideo(vals)
  of appPlayer:
    result.video = some parsePromoVideo(vals)
    # Prefer the app category as text, keeping the description otherwise.
    result.text = vals{"app_category"}.getStrVal(result.text)
  of broadcast:
    result = parseBroadcast(vals)
  of liveEvent:
    result.text = vals{"event_title"}.getStrVal
  of player:
    result.url = vals{"player_url"}.getStrVal
    if "youtube.com" in result.url:
      result.url = result.url.replace("/embed/", "/watch?v=")
  of audiospace, unknown:
    result.title = "This card type is not supported."
  else:
    discard

  # Take the first "<type>_large" image that exists, in priority order.
  for imageType in imageTypes:
    with img, vals{imageType & "_large"}:
      result.image = img.getImageVal
      break

  # Replace the card URL by its expanded form when listed in `urls`.
  for entity in ? urls:
    if entity{"url"}.getStr == result.url:
      result.url = entity{"expanded_url"}.getStr
      break

  if kind in {videoDirectMessage, imageDirectMessage}:
    result.url.setLen 0

  # `and` binds tighter than `or`: a "card://" URL is replaced for every
  # kind, an empty URL only for the image card kinds listed here.
  let
    isImageCard = kind in {promoImageConvo, promoImageApp, imageDirectMessage}
    isCardScheme = result.url.startsWith("card://")
  if (isImageCard and result.url.len == 0) or isCardScheme:
    result.url = getPicUrl(result.image)
|
|
|
|
proc parseTweet(js: JsonNode; jsCard: JsonNode = newJNull()): Tweet =
  ## Builds a `Tweet` from a tweet JSON object and an optional card node.
  ##
  ## Quotes and retweets are stored as placeholder tweets carrying only
  ## an id. A retweet ends parsing early: card, media and withheld
  ## handling are skipped for it. When `js` is null, `result` is left at
  ## its default value.
  if js.isNull:
    return

  let stats = TweetStats(
    replies: js{"reply_count"}.getInt,
    retweets: js{"retweet_count"}.getInt,
    likes: js{"favorite_count"}.getInt,
    quotes: js{"quote_count"}.getInt
  )

  result = Tweet(
    id: js{"id_str"}.getId,
    threadId: js{"conversation_id_str"}.getId,
    replyId: js{"in_reply_to_status_id_str"}.getId,
    text: js{"full_text"}.getStr,
    time: js{"created_at"}.getTime,
    hasThread: js{"self_thread"}.notNull,
    available: true,
    user: User(id: js{"user_id_str"}.getStr),
    stats: stats
  )

  # fix for pinned threads
  if result.hasThread and result.threadId == 0:
    result.threadId = js{"self_thread", "id_str"}.getId

  result.expandTweetEntities(js)

  if js{"is_quote_status"}.getBool:
    result.quote = some(Tweet(id: js{"quoted_status_id_str"}.getId))

  with retweetId, js{"retweeted_status_id_str"}:
    result.retweet = some(Tweet(id: retweetId.getId))
    return

  if jsCard.notNull:
    let cardName = jsCard{"name"}.getStr
    if "poll" in cardName:
      # Image polls carry their picture in the card's binding values.
      if "image" in cardName:
        result.photos.add jsCard{"binding_values", "image_large"}.getImageVal
      result.poll = some(parsePoll(jsCard))
    elif cardName == "amplify":
      result.video = some(parsePromoVideo(jsCard{"binding_values"}))
    else:
      result.card = some(parseCard(jsCard, js{"entities", "urls"}))

  with mediaList, js{"extended_entities", "media"}:
    for media in mediaList:
      case media{"type"}.getStr
      of "photo":
        result.photos.add media{"media_url_https"}.getImageStr
      of "video":
        result.video = some(parseVideo(media))
        with sourceUser, media{"additional_media_info", "source_user"}:
          result.attribution = some(parseUser(sourceUser))
      of "animated_gif":
        result.gif = some(parseGif(media))
      else:
        discard

  with jsWithheld, js{"withheld_in_countries"}:
    var countries: seq[string]
    if jsWithheld.kind == JArray:
      countries = jsWithheld.to(seq[string])

    # XX - Content is withheld in all countries
    # XY - Content is withheld due to a DMCA request.
    let
      listedCode = "XX" in countries or "XY" in countries
      mentionsWithheld = "withheld" in result.text
      isWithheld = js{"withheld_copyright"}.getBool or
                   (countries.len > 0 and (listedCode or mentionsWithheld))

    if isWithheld:
      result.text.removeSuffix(" Learn more.")
      result.available = false
|
|
|
|
proc finalizeTweet(global: GlobalObjects; id: string): Tweet =
  ## Looks up tweet `id` in `global.tweets` and resolves its quote and
  ## retweet placeholders against the same table.
  ##
  ## An unknown `id` yields a fresh `Tweet` carrying only the parsed id.
  ## A quote or retweet that is not in the table is replaced by an empty
  ## `Tweet`. Retweets are finalized recursively; quotes are taken from
  ## the table as stored.
  ##
  ## Raises `ValueError` if a non-empty `id` is not an integer string.
  let numericId =
    if id.len > 0: parseBiggestInt(id)
    else: 0
  result = global.tweets.getOrDefault(id, Tweet(id: numericId))

  if result.quote.isSome:
    let quoteKey = $get(result.quote).id
    result.quote =
      if quoteKey in global.tweets: some(global.tweets[quoteKey])
      else: some(Tweet())

  if result.retweet.isSome:
    let retweetKey = $get(result.retweet).id
    result.retweet =
      if retweetKey in global.tweets: some(finalizeTweet(global, retweetKey))
      else: some(Tweet())
|
|
|
|
proc parsePin(js: JsonNode; global: GlobalObjects): Tweet =
  ## Resolves the pinned tweet referenced by a `pinEntry` instruction.
  ##
  ## The tweet stored in `global.tweets` is flagged as pinned and then
  ## finalized. `result` is left at its default when the instruction has
  ## no entry id or the tweet is not in the table.
  let entryId = js{"pinEntry", "entry", "entryId"}.getStr
  if entryId.len > 0:
    let id = entryId.getId
    if id in global.tweets:
      global.tweets[id].pinned = true
      result = finalizeTweet(global, id)
|
|
|
|
proc parseGlobalObjects(js: JsonNode): GlobalObjects =
  ## Parses the `globalObjects` section of a response into lookup tables
  ## of users and tweets, both keyed by the JSON object key.
  ##
  ## Users are parsed first so each tweet's placeholder user can be
  ## replaced by the full user when that user id is known.
  result = GlobalObjects()

  let
    # NOTE(review): `?` presumably returns early (with the empty
    # `GlobalObjects`) on a null node - confirm in parserutils.
    tweets = ? js{"globalObjects", "tweets"}
    users = ? js{"globalObjects", "users"}

  for userId, userNode in users:
    result.users[userId] = parseUser(userNode, userId)

  for tweetId, tweetNode in tweets:
    let
      tweet = parseTweet(tweetNode, tweetNode{"card"})
      authorId = tweet.user.id
    if authorId in result.users:
      tweet.user = result.users[authorId]
    result.tweets[tweetId] = tweet
|
|
|
|
proc parseStatus*(js: JsonNode): Tweet =
  ## Parses a single status object, including its user and, recursively,
  ## its quoted status.
  ##
  ## `result` is left at its default when the response reports
  ## `tweetNotFound` or when `parseTweet` yields nil.
  with errors, js{"errors"}:
    if errors.getError == tweetNotFound:
      return

  result = parseTweet(js, js{"card"})
  if result.isNil:
    return

  result.user = parseUser(js{"user"})

  with quoted, js{"quoted_status"}:
    result.quote = some(parseStatus(quoted))
|
|
|
|
proc parseInstructions[T](res: var Result[T]; global: GlobalObjects;
                          js: JsonNode) =
  ## Applies timeline instructions to `res`.
  ##
  ## For tweet results at the beginning of a timeline, a `pinEntry`
  ## instruction adds the pinned tweet to `res.content`. `replaceEntry`
  ## instructions update the top or bottom cursor depending on whether
  ## the entry id contains "top" or "bottom".
  ##
  ## Does nothing unless `js` is a non-empty array.
  if js.kind != JArray or js.len == 0:
    return

  for instruction in js:
    when T is Tweet:
      if res.beginning and instruction{"pinEntry"}.notNull:
        with pinnedTweet, parsePin(instruction, global):
          res.content.add pinnedTweet

    with replacement, instruction{"replaceEntry", "entry"}:
      let entryId = replacement{"entryId"}.getStr
      if "top" in entryId:
        res.top = replacement.getCursor
      elif "bottom" in entryId:
        res.bottom = replacement.getCursor
|
|
|
|
proc parseTimeline*(js: JsonNode; after=""): Timeline =
  ## Parses a timeline response into tweets plus top/bottom cursors.
  ##
  ## `after` is the cursor the page was requested with; an empty value
  ## marks the result as the beginning of the timeline.
  ##
  ## Entries come from the last instruction that contains `addEntries`.
  ## Tweets that are not available are left out of `content`.
  result = Timeline(beginning: after.len == 0)

  let
    global = parseGlobalObjects(? js)
    instructions = ? js{"timeline", "instructions"}
  if instructions.len == 0:
    return

  result.parseInstructions(global, instructions)

  var entries: JsonNode
  for instruction in instructions:
    if "addEntries" in instruction:
      entries = instruction{"addEntries", "entries"}

  for e in ? entries:
    let entryId = e{"entryId"}.getStr
    if "tweet" in entryId or entryId.startsWith("sq-I-t") or
       "tombstone" in entryId:
      let tweet = finalizeTweet(global, e.getEntryId)
      if tweet.available:
        result.content.add tweet
    elif "cursor-top" in entryId:
      result.top = e.getCursor
    elif "cursor-bottom" in entryId:
      result.bottom = e.getCursor
    elif entryId.startsWith("sq-C"):
      with cursor, e{"content", "operation", "cursor"}:
        let value = cursor{"value"}.getStr
        # Any cursor type other than "Bottom" is stored as the top cursor.
        if cursor{"cursorType"}.getStr == "Bottom":
          result.bottom = value
        else:
          result.top = value
|
|
|
|
proc parsePhotoRail*(js: JsonNode): PhotoRail =
  ## Builds the photo rail from an array of tweet objects.
  ##
  ## Each tweet contributes at most one picture, chosen in this order:
  ## first photo, video thumbnail, gif thumbnail, card image. Tweets
  ## without any usable picture are skipped.
  for tweet in js:
    # The card belongs to the individual tweet. Looking it up on the
    # enclosing array, as was done before, never finds one, which made
    # the card-image fallback below unreachable.
    let t = parseTweet(tweet, tweet{"card"})

    # `parseTweet` leaves its result nil for a null node; skip those
    # instead of dereferencing nil.
    if t.isNil:
      continue

    let url =
      if t.photos.len > 0: t.photos[0]
      elif t.video.isSome: get(t.video).thumb
      elif t.gif.isSome: get(t.gif).thumb
      elif t.card.isSome: get(t.card).image
      else: ""

    if url.len == 0:
      continue
    result.add GalleryPhoto(url: url, tweetId: $t.id)
|
|
|
|
proc parseGraphTweet(js: JsonNode): Tweet =
  ## Parses a GraphQL tweet result into a `Tweet`.
  ##
  ## A null node, a `TweetUnavailable` result, or a result whose
  ## `legacy` payload cannot be parsed yields `Tweet(available: false)`.
  ##
  ## The card's `binding_values` arrive as a list of key/value pairs and
  ## are converted into an object keyed by `key` before the card is
  ## handed to `parseTweet`. A quoted tweet is parsed recursively from
  ## `quoted_status_result.result`.
  if js.kind == JNull or js{"__typename"}.getStr == "TweetUnavailable":
    return Tweet(available: false)

  var jsCard = copy(js{"card", "legacy"})
  if jsCard.kind != JNull:
    var values = newJObject()
    for val in jsCard["binding_values"]:
      values[val["key"].getStr] = val["value"]
    jsCard["binding_values"] = values

  result = parseTweet(js{"legacy"}, jsCard)

  # `parseTweet` leaves its result nil when `legacy` is null. Report
  # the tweet as unavailable rather than dereferencing nil below.
  if result.isNil:
    return Tweet(available: false)

  result.user = parseUser(js{"core", "user_results", "result", "legacy"})

  let noteTweet = js{"note_tweet", "note_tweet_results", "result"}
  if noteTweet.kind != JNull:
    result.expandNoteTweetEntities(noteTweet)

  if result.quote.isSome:
    result.quote = some(parseGraphTweet(js{"quoted_status_result", "result"}))
|
|
|
|
proc parseGraphThread(js: JsonNode): tuple[thread: Chain; self: bool] =
  ## Parses a conversation-thread entry into a `Chain`.
  ##
  ## Items whose entry id contains "cursor-showmore" set the chain's
  ## cursor and mark it as having more content; items whose entry id
  ## contains "tweet" are parsed and appended to the chain.
  ##
  ## `self` becomes true when a tweet item has the display type
  ## "SelfThread".
  # The former `thread` local duplicated this lookup and was never read.
  for item in js{"content", "items"}:
    let
      entryId = item{"entryId"}.getStr
      content = item{"item", "itemContent"}

    if "cursor-showmore" in entryId:
      result.thread.cursor = content{"value"}.getStr
      result.thread.hasMore = true
    elif "tweet" in entryId:
      result.thread.content.add parseGraphTweet(content{"tweet_results", "result"})

      if content{"tweetDisplayType"}.getStr == "SelfThread":
        result.self = true
|
|
|
|
proc parseGraphConversation*(js: JsonNode; tweetId: string): Conversation =
  ## Parses a GraphQL threaded-conversation response.
  ##
  ## Entries of the first instruction are sorted by entry id prefix:
  ## * "tweet": the tweet whose id equals `tweetId` becomes the main
  ##   tweet, any other is appended to `before`. An unavailable tweet
  ##   takes its id from the entry id.
  ## * "conversationthread": a self thread becomes `after`, any other
  ##   thread is appended to the replies.
  ## * "cursor-bottom": sets the bottom cursor of the replies.
  result = Conversation(replies: Result[Chain](beginning: true))

  let instructions =
    ? js{"data", "threaded_conversation_with_injections_v2", "instructions"}
  if instructions.len == 0:
    return

  for entry in instructions[0]{"entries"}:
    let entryId = entry{"entryId"}.getStr

    if entryId.startsWith("tweet"):
      let tweet = parseGraphTweet(
        entry{"content", "itemContent", "tweet_results", "result"})

      if not tweet.available:
        tweet.id = parseBiggestInt(entryId.getId())

      if $tweet.id == tweetId:
        result.tweet = tweet
      else:
        result.before.content.add tweet
    elif entryId.startsWith("conversationthread"):
      let (chain, isSelfThread) = parseGraphThread(entry)
      if isSelfThread:
        result.after = chain
      else:
        result.replies.content.add chain
    elif entryId.startsWith("cursor-bottom"):
      result.replies.bottom = entry{"content", "itemContent", "value"}.getStr
|