# SPDX-License-Identifier: AGPL-3.0-only
import strutils, options, tables, times, math
import packedjson, packedjson/deserialiser
import types, parserutils, utils
import experimental/parser/unifiedcard

# Forward declaration: parseTweet and parseGraphTweet call each other.
proc parseGraphTweet(js: JsonNode): Tweet

proc parseUser(js: JsonNode; id=""): User =
  ## Builds a `User` from a legacy user object. A non-empty `id` takes
  ## precedence over the object's own `id_str`. Returns the default result
  ## when `js` is null.
  if js.isNull: return
  result = User(
    id: if id.len > 0: id else: js{"id_str"}.getStr,
    username: js{"screen_name"}.getStr,
    fullname: js{"name"}.getStr,
    location: js{"location"}.getStr,
    bio: js{"description"}.getStr,
    userPic: js{"profile_image_url_https"}.getImageStr.replace("_normal", ""),
    banner: js.getBanner,
    following: js{"friends_count"}.getInt,
    followers: js{"followers_count"}.getInt,
    tweets: js{"statuses_count"}.getInt,
    likes: js{"favourites_count"}.getInt,
    media: js{"media_count"}.getInt,
    verified: js{"verified"}.getBool or js{"ext_is_blue_verified"}.getBool,
    protected: js{"protected"}.getBool,
    joinDate: js{"created_at"}.getTime
  )

  result.expandUserEntities(js)

proc parseGraphUser(js: JsonNode): User =
  ## Parses the user found under `user_results.result`, delegating the
  ## `legacy` sub-object to `parseUser`.
  let user = ? js{"user_results", "result"}
  result = parseUser(user{"legacy"})

  # Check the flag's value, not merely its presence: an object carrying
  # `is_blue_verified: false` must not be marked verified.
  if user{"is_blue_verified"}.getBool:
    result.verified = true

proc parseGraphList*(js: JsonNode): List =
  ## Parses a list from either `data.user_by_screen_name.list` or
  ## `data.list`. Returns the default result when neither is present.
  if js.isNull: return

  var list = js{"data", "user_by_screen_name", "list"}
  if list.isNull:
    list = js{"data", "list"}

  if list.isNull:
    return

  result = List(
    id: list{"id_str"}.getStr,
    name: list{"name"}.getStr,
    username: list{"user_results", "result", "legacy", "screen_name"}.getStr,
    userId: list{"user_results", "result", "rest_id"}.getStr,
    description: list{"description"}.getStr,
    members: list{"member_count"}.getInt,
    banner: list{"custom_banner_media", "media_info",
                 "original_img_url"}.getImageStr
  )

proc parsePoll(js: JsonNode): Poll =
  ## Parses a poll card: per-choice labels and counts, the remaining time
  ## (or "Final results"), the index of the leading choice and the vote total.
  let vals = js{"binding_values"}
  # name format is pollNchoice_*, so the character at index 4 is the
  # number of choices
  for i in '1' .. js{"name"}.getStr[4]:
    let choice = "choice" & i
    result.values.add parseInt(vals{choice & "_count"}.getStrVal("0"))
    result.options.add vals{choice & "_label"}.getStrVal

  let time = vals{"end_datetime_utc", "string_value"}.getDateTime
  if time > now():
    let
      timeLeft = $(time - now())
      cut = timeLeft.find(",")
    # Keep only the leading unit. When the duration string has no comma,
    # `find` returns -1; use the whole string instead of an invalid slice.
    result.status = if cut >= 0: timeLeft[0 ..< cut] else: timeLeft
  else:
    result.status = "Final results"

  result.leader = result.values.find(max(result.values))
  result.votes = result.values.sum

proc parseGif(js: JsonNode): Gif =
  ## Parses an animated GIF media entry, using its first video variant
  ## as the URL.
  result = Gif(
    url: js{"video_info", "variants"}[0]{"url"}.getImageStr,
    thumb: js{"media_url_https"}.getImageStr
  )

proc parseVideo(js: JsonNode): Video =
  ## Parses a video media entry together with all of its variants.
  result = Video(
    thumb: js{"media_url_https"}.getImageStr,
    views: js{"ext", "mediaStats", "r", "ok", "viewCount"}.getStr(
      $js{"mediaStats", "viewCount"}.getInt),
    available:
      js{"ext_media_availability", "status"}.getStr.toLowerAscii == "available",
    title: js{"ext_alt_text"}.getStr,
    durationMs: js{"video_info", "duration_millis"}.getInt
    # playbackType: mp4
  )

  # additional_media_info, when present, overrides the alt-text title.
  with title, js{"additional_media_info", "title"}:
    result.title = title.getStr

  with description, js{"additional_media_info", "description"}:
    result.description = description.getStr

  for v in js{"video_info", "variants"}:
    let
      contentType = parseEnum[VideoType](v{"content_type"}.getStr("summary"))
      url = v{"url"}.getStr

    result.variants.add VideoVariant(
      contentType: contentType,
      bitrate: v{"bitrate"}.getInt,
      url: url,
      resolution: if contentType == mp4: getMp4Resolution(url) else: 0
    )

proc parsePromoVideo(js: JsonNode): Video =
  ## Parses a promo/amplify video from card binding values. The variant URL
  ## is taken from `player_hls_url`, then `player_stream_url`, then
  ## `amplify_url_vmap`.
  result = Video(
    thumb: js{"player_image_large"}.getImageVal,
    available: true,
    durationMs: js{"content_duration_seconds"}.getStrVal("0").parseInt * 1000,
    playbackType: vmap
  )

  var variant = VideoVariant(
    contentType: vmap,
    url: js{"player_hls_url"}.getStrVal(js{"player_stream_url"}.getStrVal(
      js{"amplify_url_vmap"}.getStrVal()))
  )

  # A URL containing "m3u8" switches both variant and playback type.
  if "m3u8" in variant.url:
    variant.contentType = m3u8
    result.playbackType = m3u8

  result.variants.add variant

proc parseBroadcast(js: JsonNode): Card =
  ## Builds a broadcast card; the thumbnail doubles as the video thumb.
  let image = js{"broadcast_thumbnail_large"}.getImageVal
  result = Card(
    kind: broadcast,
    url: js{"broadcast_url"}.getStrVal,
    title: js{"broadcaster_display_name"}.getStrVal,
    text: js{"broadcast_title"}.getStrVal,
    image: image,
    video: some Video(thumb: image)
  )

proc parseCard(js: JsonNode; urls: JsonNode): Card =
  ## Parses a card object. `urls` is the tweet's URL entity list and is used
  ## to replace a shortened card URL with its `expanded_url`.
  const imageTypes = ["summary_photo_image", "player_image", "promo_image",
                      "photo_image_full_size", "thumbnail_image", "thumbnail",
                      "event_thumbnail", "image"]

  let
    vals = ? js{"binding_values"}
    name = js{"name"}.getStr
    # The kind is whatever follows the first ':' (or the whole name).
    kind = parseEnum[CardKind](name[(name.find(":") + 1) ..< name.len], unknown)

  if kind == unified:
    return parseUnifiedCard(vals{"unified_card", "string_value"}.getStr)

  result = Card(
    kind: kind,
    url: vals.getCardUrl(kind),
    dest: vals.getCardDomain(kind),
    title: vals.getCardTitle(kind),
    text: vals{"description"}.getStrVal
  )

  if result.url.len == 0:
    result.url = js{"url"}.getStr

  case kind
  of promoVideo, promoVideoConvo, appPlayer, videoDirectMessage:
    result.video = some parsePromoVideo(vals)
    if kind == appPlayer:
      result.text = vals{"app_category"}.getStrVal(result.text)
  of broadcast:
    result = parseBroadcast(vals)
  of liveEvent:
    result.text = vals{"event_title"}.getStrVal
  of player:
    result.url = vals{"player_url"}.getStrVal
    if "youtube.com" in result.url:
      result.url = result.url.replace("/embed/", "/watch?v=")
  of audiospace, unknown:
    result.title = "This card type is not supported."
  else: discard

  # Use the first image type that is present.
  for typ in imageTypes:
    with img, vals{typ & "_large"}:
      result.image = img.getImageVal
      break

  for u in ? urls:
    if u{"url"}.getStr == result.url:
      result.url = u{"expanded_url"}.getStr
      break

  if kind in {videoDirectMessage, imageDirectMessage}:
    result.url.setLen 0

  # Parentheses make the existing `and`-before-`or` grouping explicit.
  if (kind in {promoImageConvo, promoImageApp, imageDirectMessage} and
      result.url.len == 0) or result.url.startsWith("card://"):
    result.url = getPicUrl(result.image)

proc parseTweet(js: JsonNode; jsCard: JsonNode = newJNull()): Tweet =
  ## Parses a legacy tweet object. `jsCard` is the tweet's card, if any.
  ## Retweets return early with only a retweet reference set, so their
  ## card, media and withheld information are not parsed.
  if js.isNull: return
  result = Tweet(
    id: js{"id_str"}.getId,
    threadId: js{"conversation_id_str"}.getId,
    replyId: js{"in_reply_to_status_id_str"}.getId,
    text: js{"full_text"}.getStr,
    time: js{"created_at"}.getTime,
    hasThread: js{"self_thread"}.notNull,
    available: true,
    user: User(id: js{"user_id_str"}.getStr),
    stats: TweetStats(
      replies: js{"reply_count"}.getInt,
      retweets: js{"retweet_count"}.getInt,
      likes: js{"favorite_count"}.getInt,
      quotes: js{"quote_count"}.getInt
    )
  )

  result.expandTweetEntities(js)

  # fix for pinned threads
  if result.hasThread and result.threadId == 0:
    result.threadId = js{"self_thread", "id_str"}.getId

  # Only the id is stored here; callers resolve the quoted tweet later.
  if js{"is_quote_status"}.getBool:
    result.quote = some Tweet(id: js{"quoted_status_id_str"}.getId)

  # legacy
  with rt, js{"retweeted_status_id_str"}:
    result.retweet = some Tweet(id: rt.getId)
    return

  # graphql
  with rt, js{"retweeted_status_result", "result"}:
    # needed due to weird edgecase where the actual tweet data isn't included
    if "legacy" in rt:
      result.retweet = some parseGraphTweet(rt)
      return

  if jsCard.kind != JNull:
    let name = jsCard{"name"}.getStr
    if "poll" in name:
      if "image" in name:
        result.photos.add jsCard{"binding_values", "image_large"}.getImageVal

      result.poll = some parsePoll(jsCard)
    elif name == "amplify":
      result.video = some(parsePromoVideo(jsCard{"binding_values"}))
    else:
      result.card = some parseCard(jsCard, js{"entities", "urls"})

  with jsMedia, js{"extended_entities", "media"}:
    for m in jsMedia:
      case m{"type"}.getStr
      of "photo":
        result.photos.add m{"media_url_https"}.getImageStr
      of "video":
        result.video = some(parseVideo(m))
        with user, m{"additional_media_info", "source_user"}:
          # A positive numeric `id` selects the legacy user parser;
          # otherwise the graph user parser is used.
          if user{"id"}.getInt > 0:
            result.attribution = some(parseUser(user))
          else:
            result.attribution = some(parseGraphUser(user))
      of "animated_gif":
        result.gif = some(parseGif(m))
      else: discard

  with jsWithheld, js{"withheld_in_countries"}:
    let withheldInCountries: seq[string] =
      if jsWithheld.kind != JArray: @[]
      else: jsWithheld.to(seq[string])

    # XX - Content is withheld in all countries
    # XY - Content is withheld due to a DMCA request.
    # Parentheses make the existing `and`-before-`or` grouping explicit.
    if js{"withheld_copyright"}.getBool or
       (withheldInCountries.len > 0 and ("XX" in withheldInCountries or
                                         "XY" in withheldInCountries or
                                         "withheld" in result.text)):
      result.text.removeSuffix(" Learn more.")
      result.available = false

proc finalizeTweet(global: GlobalObjects; id: string): Tweet =
  ## Looks up `id` in `global.tweets`, falling back to a stub tweet that only
  ## carries the id, then resolves its quote and retweet references against
  ## the same table. References that cannot be resolved become an empty
  ## `Tweet()`.
  let intId = if id.len > 0: parseBiggestInt(id) else: 0
  result = global.tweets.getOrDefault(id, Tweet(id: intId))

  if result.quote.isSome:
    let quote = get(result.quote).id
    if $quote in global.tweets:
      result.quote = some global.tweets[$quote]
    else:
      result.quote = some Tweet()

  if result.retweet.isSome:
    let rt = get(result.retweet).id
    if $rt in global.tweets:
      # Retweets are finalized recursively so their own quote is resolved.
      result.retweet = some finalizeTweet(global, $rt)
    else:
      result.retweet = some Tweet()

proc parsePin(js: JsonNode; global: GlobalObjects): Tweet =
  ## Returns the finalized pinned tweet referenced by a `pinEntry`
  ## instruction, flagging it as pinned. Returns the default result when the
  ## entry id is empty or the tweet is not in `global.tweets`.
  let pin = js{"pinEntry", "entry", "entryId"}.getStr
  if pin.len == 0: return

  let id = pin.getId
  if id notin global.tweets: return

  global.tweets[id].pinned = true
  return finalizeTweet(global, id)

proc parseGlobalObjects(js: JsonNode): GlobalObjects =
  ## Parses the `globalObjects.users` and `globalObjects.tweets` maps,
  ## attaching the parsed user to each tweet whose author id is known.
  result = GlobalObjects()
  let
    tweets = ? js{"globalObjects", "tweets"}
    users = ? js{"globalObjects", "users"}

  for k, v in users:
    result.users[k] = parseUser(v, k)

  for k, v in tweets:
    var tweet = parseTweet(v, v{"card"})
    if tweet.user.id in result.users:
      tweet.user = result.users[tweet.user.id]
    result.tweets[k] = tweet

proc parseInstructions[T](res: var Result[T]; global: GlobalObjects;
                          js: JsonNode) =
  ## Applies timeline instructions to `res`: adds the pinned tweet (tweet
  ## results only, and only at the beginning of a timeline) and updates the
  ## top/bottom cursors from `replaceEntry` instructions.
  if js.kind != JArray or js.len == 0:
    return

  for i in js:
    when T is Tweet:
      if res.beginning and i{"pinEntry"}.notNull:
        with pin, parsePin(i, global):
          res.content.add pin

    with r, i{"replaceEntry", "entry"}:
      if "top" in r{"entryId"}.getStr:
        res.top = r.getCursor
      elif "bottom" in r{"entryId"}.getStr:
        res.bottom = r.getCursor

proc parseTimeline*(js: JsonNode; after=""): Timeline =
  ## Parses a legacy timeline response. `after` is the cursor that was used
  ## for the request; an empty value marks the result as the beginning.
  result = Timeline(beginning: after.len == 0)
  let global = parseGlobalObjects(? js)

  let instructions = ? js{"timeline", "instructions"}
  if instructions.len == 0: return

  result.parseInstructions(global, instructions)

  # If several instructions carry `addEntries`, the last one wins.
  var entries: JsonNode
  for i in instructions:
    if "addEntries" in i:
      entries = i{"addEntries", "entries"}

  for e in ? entries:
    let entry = e{"entryId"}.getStr
    if "tweet" in entry or entry.startsWith("sq-I-t") or "tombstone" in entry:
      let tweet = finalizeTweet(global, e.getEntryId)
      if not tweet.available: continue
      result.content.add tweet
    elif "cursor-top" in entry:
      result.top = e.getCursor
    elif "cursor-bottom" in entry:
      result.bottom = e.getCursor
    elif entry.startsWith("sq-cursor"):
      with cursor, e{"content", "operation", "cursor"}:
        if cursor{"cursorType"}.getStr == "Bottom":
          result.bottom = cursor{"value"}.getStr
        else:
          result.top = cursor{"value"}.getStr

proc parsePhotoRail*(js: JsonNode): PhotoRail =
  ## Builds the photo rail from an array of legacy tweets, picking one
  ## preview image per tweet (photo, video thumb, gif thumb, then card image)
  ## and skipping tweets that have none.
  for tweet in js:
    let
      # The card belongs to the individual tweet. Reading it from the
      # enclosing array `js` never yields a card, which would make the
      # card-image fallback below unreachable.
      t = parseTweet(tweet, tweet{"card"})
      url = if t.photos.len > 0: t.photos[0]
            elif t.video.isSome: get(t.video).thumb
            elif t.gif.isSome: get(t.gif).thumb
            elif t.card.isSome: get(t.card).image
            else: ""

    if url.len == 0: continue
    result.add GalleryPhoto(url: url, tweetId: $t.id)

proc parseGraphTweet(js: JsonNode): Tweet =
  ## Parses a GraphQL tweet result. Unavailable, preview and tombstone
  ## results yield a tweet with `available: false`; visibility wrappers are
  ## unwrapped recursively.
  if js.kind == JNull:
    return Tweet(available: false)

  case js{"__typename"}.getStr
  of "TweetUnavailable", "TweetPreviewDisplay":
    return Tweet(available: false)
  of "TweetTombstone":
    return Tweet(
      available: false,
      text: js{"tombstone", "text"}.getTombstone
    )
  of "TweetWithVisibilityResults":
    return parseGraphTweet(js{"tweet"})

  # Convert the card's binding_values from a list of key/value entries into
  # an object keyed by name, which is the shape parseTweet's card handling
  # reads.
  var jsCard = copy(js{"card", "legacy"})
  if jsCard.kind != JNull:
    var values = newJObject()
    for val in jsCard["binding_values"]:
      values[val["key"].getStr] = val["value"]
    jsCard["binding_values"] = values

  result = parseTweet(js{"legacy"}, jsCard)
  result.user = parseGraphUser(js{"core"})

  with noteTweet, js{"note_tweet", "note_tweet_results", "result"}:
    result.expandNoteTweetEntities(noteTweet)

  # Replace the id-only quote placeholder with the fully parsed tweet.
  if result.quote.isSome:
    result.quote = some(parseGraphTweet(js{"quoted_status_result", "result"}))

proc parseGraphThread(js: JsonNode): tuple[thread: Chain; self: bool] =
  ## Parses a conversation thread entry into a `Chain`. `self` is set when
  ## any item has the "SelfThread" display type.
  let threadItems = js{"content", "items"}
  for t in threadItems:
    let entryId = t{"entryId"}.getStr
    if "cursor-showmore" in entryId:
      let cursor = t{"item", "itemContent", "value"}
      result.thread.cursor = cursor.getStr
      result.thread.hasMore = true
    elif "tweet" in entryId:
      let tweet = parseGraphTweet(
        t{"item", "itemContent", "tweet_results", "result"})
      result.thread.content.add tweet

      if t{"item", "itemContent", "tweetDisplayType"}.getStr == "SelfThread":
        result.self = true

proc parseGraphTweetResult*(js: JsonNode): Tweet =
  ## Parses the tweet under `data.tweetResult.result`, if present.
  with tweet, js{"data", "tweetResult", "result"}:
    result = parseGraphTweet(tweet)

proc parseGraphConversation*(js: JsonNode; tweetId: string): Conversation =
  ## Parses a GraphQL conversation from the entries of the first instruction.
  ## The entry matching `tweetId` becomes the main tweet, other tweets and
  ## tombstones go to `before`, a self-thread goes to `after`, and every
  ## other thread is added to `replies`.
  result = Conversation(replies: Result[Chain](beginning: true))

  let instructions = ? js{"data", "threaded_conversation_with_injections",
                          "instructions"}
  if instructions.len == 0:
    return

  for e in instructions[0]{"entries"}:
    let entryId = e{"entryId"}.getStr
    if entryId.startsWith("tweet"):
      with tweetResult, e{"content", "itemContent", "tweet_results", "result"}:
        let tweet = parseGraphTweet(tweetResult)

        # Unavailable tweets carry no id, so recover it from the entry id.
        if not tweet.available:
          tweet.id = parseBiggestInt(entryId.getId())

        if $tweet.id == tweetId:
          result.tweet = tweet
        else:
          result.before.content.add tweet
    elif entryId.startsWith("tombstone"):
      let id = entryId.getId()
      let tweet = Tweet(
        id: parseBiggestInt(id),
        available: false,
        text: e{"content", "itemContent", "tombstoneInfo",
                "richText"}.getTombstone
      )

      if id == tweetId:
        result.tweet = tweet
      else:
        result.before.content.add tweet
    elif entryId.startsWith("conversationthread"):
      let (thread, self) = parseGraphThread(e)
      if self:
        result.after = thread
      else:
        result.replies.content.add thread
    elif entryId.startsWith("cursor-bottom"):
      result.replies.bottom = e{"content", "itemContent", "value"}.getStr

proc parseGraphTimeline*(js: JsonNode; root: string; after=""): Timeline =
  ## Parses a GraphQL timeline. `root` selects the response layout: "list"
  ## reads the list timeline path, any other value reads the user timeline
  ## path. An empty `after` marks the result as the beginning.
  result = Timeline(beginning: after.len == 0)

  let instructions =
    if root == "list":
      ? js{"data", "list", "tweets_timeline", "timeline", "instructions"}
    else:
      ? js{"data", "user", "result", "timeline_v2", "timeline", "instructions"}

  if instructions.len == 0:
    return

  for i in instructions:
    if i{"type"}.getStr == "TimelineAddEntries":
      for e in i{"entries"}:
        let entryId = e{"entryId"}.getStr
        if entryId.startsWith("tweet"):
          with tweetResult,
               e{"content", "itemContent", "tweet_results", "result"}:
            let tweet = parseGraphTweet(tweetResult)
            # Unavailable tweets carry no id; recover it from the entry id.
            if not tweet.available:
              tweet.id = parseBiggestInt(entryId.getId())
            result.content.add tweet
        elif entryId.startsWith("cursor-bottom"):
          result.bottom = e{"content", "value"}.getStr

proc parseGraphSearch*(js: JsonNode; after=""): Timeline =
  ## Parses a GraphQL search timeline. Tweets and the bottom cursor come from
  ## `TimelineAddEntries` instructions; a `TimelineReplaceEntry` instruction
  ## targeting the bottom cursor updates it.
  result = Timeline(beginning: after.len == 0)

  let instructions = ? js{"data", "search_by_raw_query", "search_timeline",
                          "timeline", "instructions"}
  if instructions.len == 0:
    return

  for instruction in instructions:
    let typ = instruction{"type"}.getStr
    if typ == "TimelineAddEntries":
      # Read the entries of the instruction being visited rather than
      # always those of the first instruction.
      for e in instruction{"entries"}:
        let entryId = e{"entryId"}.getStr
        if entryId.startsWith("tweet"):
          with tweetResult,
               e{"content", "itemContent", "tweet_results", "result"}:
            let tweet = parseGraphTweet(tweetResult)
            # Unavailable tweets carry no id; recover it from the entry id.
            if not tweet.available:
              tweet.id = parseBiggestInt(entryId.getId())
            result.content.add tweet
        elif entryId.startsWith("cursor-bottom"):
          result.bottom = e{"content", "value"}.getStr
    elif typ == "TimelineReplaceEntry":
      if instruction{"entry_id_to_replace"}.getStr.startsWith("cursor-bottom"):
        result.bottom = instruction{"entry", "content", "value"}.getStr