Small refactoring & user feed API WIP
This commit is contained in:
parent
8438ddc3dd
commit
22433cdab5
@ -48,7 +48,7 @@ def test_twextract_UserExtract():
|
||||
assert user["created_at"] == "Tue Mar 21 20:50:14 +0000 2006"
|
||||
|
||||
def test_twextract_UserExtractID():
|
||||
user = twExtract.extractUser(testUserID,workaroundTokens=tokens)
|
||||
user = twExtract.extractUser(testUserIDUrl,workaroundTokens=tokens)
|
||||
assert user["screen_name"]=="jack"
|
||||
assert user["id"]==12
|
||||
assert user["created_at"] == "Tue Mar 21 20:50:14 +0000 2006"
|
||||
@ -99,4 +99,9 @@ def test_twextract_pollTweetExtract(): # basic check if poll data exists
|
||||
assert tweet['card']['name']=="poll2choice_text_only"
|
||||
|
||||
def test_twextract_NSFW_TweetExtract():
|
||||
tweet = twExtract.extractStatus(testNSFWTweet,workaroundTokens=tokens) # For now just test that there's no error
|
||||
tweet = twExtract.extractStatus(testNSFWTweet,workaroundTokens=tokens) # For now just test that there's no error
|
||||
|
||||
'''
|
||||
def test_twextract_feed():
|
||||
tweet = twExtract.extractUserFeedFromId(testUserID,workaroundTokens=tokens)
|
||||
'''
|
@ -1,8 +1,9 @@
|
||||
import twitfix, cache, twExtract
|
||||
from vx_testdata import *
|
||||
from twExtract import twUtils
|
||||
|
||||
def test_calcSyndicationToken():
|
||||
assert twExtract.calcSyndicationToken("1691389765483200513") == "43lnobuxzql"
|
||||
assert twUtils.calcSyndicationToken("1691389765483200513") == "43lnobuxzql"
|
||||
|
||||
def test_addToCache():
|
||||
cache.clearCache()
|
||||
|
@ -5,8 +5,10 @@ import re
|
||||
import os
|
||||
import random
|
||||
import urllib.parse
|
||||
import math
|
||||
from oauthlib import oauth1
|
||||
import sys
|
||||
sys.path.append(os.path.dirname(os.path.realpath(__file__)))
|
||||
import twUtils
|
||||
bearer="Bearer AAAAAAAAAAAAAAAAAAAAAPYXBAAAAAAACLXUNDekMxqa8h%2F40K4moUkGsoc%3DTYfbDKbT3jJPCEVnMYqilB28NHfOPqkca3qaAxGfsyKCs0wRbw"
|
||||
v2bearer="Bearer AAAAAAAAAAAAAAAAAAAAANRILgAAAAAAnNwIzUejRCOuH5E6I8xnZz4puTs%3D1Zv7ttfk8LF81IUq16cHjhLTvJu4FA33AGWWjCpTnA"
|
||||
androidBearer="Bearer AAAAAAAAAAAAAAAAAAAAAFXzAwAAAAAAMHCxpeSDG1gLNLghVe8d74hl6k4%3DRUMF4xAQLsbeBhTSRrCiQpJtxoGWeyHrDb5te2jpGskWDFW82F"
|
||||
@ -33,6 +35,10 @@ androidGraphql_api="llQH5PFIRlenVrlKJU8jNA"
|
||||
tweetDetailGraphqlFeatures='{"rweb_tipjar_consumption_enabled":true,"responsive_web_graphql_exclude_directive_enabled":true,"verified_phone_label_enabled":false,"creator_subscriptions_tweet_preview_api_enabled":true,"responsive_web_graphql_timeline_navigation_enabled":true,"responsive_web_graphql_skip_user_profile_image_extensions_enabled":false,"communities_web_enable_tweet_community_results_fetch":true,"c9s_tweet_anatomy_moderator_badge_enabled":true,"articles_preview_enabled":true,"tweetypie_unmention_optimization_enabled":true,"responsive_web_edit_tweet_api_enabled":true,"graphql_is_translatable_rweb_tweet_is_translatable_enabled":true,"view_counts_everywhere_api_enabled":true,"longform_notetweets_consumption_enabled":true,"responsive_web_twitter_article_tweet_consumption_enabled":true,"tweet_awards_web_tipping_enabled":false,"creator_subscriptions_quote_tweet_preview_enabled":false,"freedom_of_speech_not_reach_fetch_enabled":true,"standardized_nudges_misinfo":true,"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled":true,"rweb_video_timestamps_enabled":true,"longform_notetweets_rich_text_read_enabled":true,"longform_notetweets_inline_media_enabled":true,"responsive_web_enhance_cards_enabled":false}'
|
||||
tweetDetailGraphql_api="e7RKseIxLu7HgkWNKZ6qnw"
|
||||
|
||||
# this is for UserTweets endpoint
|
||||
tweetFeedGraphqlFeatures='{"profile_label_improvements_pcf_label_in_post_enabled":true,"rweb_tipjar_consumption_enabled":true,"responsive_web_graphql_exclude_directive_enabled":true,"verified_phone_label_enabled":false,"creator_subscriptions_tweet_preview_api_enabled":true,"responsive_web_graphql_timeline_navigation_enabled":true,"responsive_web_graphql_skip_user_profile_image_extensions_enabled":false,"premium_content_api_read_enabled":false,"communities_web_enable_tweet_community_results_fetch":true,"c9s_tweet_anatomy_moderator_badge_enabled":true,"responsive_web_grok_analyze_button_fetch_trends_enabled":false,"responsive_web_grok_analyze_post_followups_enabled":true,"responsive_web_jetfuel_frame":false,"responsive_web_grok_share_attachment_enabled":true,"articles_preview_enabled":true,"responsive_web_edit_tweet_api_enabled":true,"graphql_is_translatable_rweb_tweet_is_translatable_enabled":true,"view_counts_everywhere_api_enabled":true,"longform_notetweets_consumption_enabled":true,"responsive_web_twitter_article_tweet_consumption_enabled":true,"tweet_awards_web_tipping_enabled":false,"responsive_web_grok_analysis_button_from_backend":true,"creator_subscriptions_quote_tweet_preview_enabled":false,"freedom_of_speech_not_reach_fetch_enabled":true,"standardized_nudges_misinfo":true,"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled":true,"rweb_video_timestamps_enabled":true,"longform_notetweets_rich_text_read_enabled":true,"longform_notetweets_inline_media_enabled":true,"responsive_web_grok_image_annotation_enabled":true,"responsive_web_enhance_cards_enabled":false}'
|
||||
tweetFeedGraphql_api="Y9WM4Id6UcGFE8Z-hbnixw"
|
||||
|
||||
twitterUrl = "x.com" # doubt this will change but just in case
|
||||
class TwExtractError(Exception):
|
||||
def __init__(self, code, message):
|
||||
@ -166,41 +172,13 @@ def extractStatus_guestToken(url):
|
||||
raise TwExtractError(error["code"], error["message"])
|
||||
return output
|
||||
|
||||
digits = "0123456789abcdefghijklmnopqrstuvwxyz"
|
||||
|
||||
def baseConversion(x, base):
|
||||
result = ''
|
||||
i = int(x)
|
||||
while i > 0:
|
||||
result = digits[i % base] + result
|
||||
i = i // base
|
||||
if int(x) != x:
|
||||
result += '.'
|
||||
i = x - int(x)
|
||||
d = 0
|
||||
while i != int(i):
|
||||
result += digits[int(i * base % base)]
|
||||
i = i * base
|
||||
d += 1
|
||||
if d >= 8:
|
||||
break
|
||||
return result
|
||||
|
||||
def calcSyndicationToken(idStr):
|
||||
id = int(idStr) / 1000000000000000 * math.pi
|
||||
o = baseConversion(x=id, base=int(math.pow(6, 2)))
|
||||
c = o.replace('0', '').replace('.', '')
|
||||
if c == '':
|
||||
c = '0'
|
||||
return c
|
||||
|
||||
def extractStatus_syndication(url,workaroundTokens=None):
|
||||
# https://github.com/mikf/gallery-dl/blob/46cae04aa3a113c7b6bbee1bb468669564b14ae8/gallery_dl/extractor/twitter.py#L1784
|
||||
m = re.search(pathregex, url)
|
||||
if m is None:
|
||||
raise TwExtractError(400, "Extract error")
|
||||
twid = m.group(2)
|
||||
tweet = requests.get("https://cdn.syndication.twimg.com/tweet-result?id=" + twid+"&token="+calcSyndicationToken(twid))
|
||||
tweet = requests.get("https://cdn.syndication.twimg.com/tweet-result?id=" + twid+"&token="+twUtils.calcSyndicationToken(twid))
|
||||
|
||||
|
||||
if tweet.status_code == 404:
|
||||
@ -524,8 +502,32 @@ def extractUser(url,workaroundTokens):
|
||||
continue
|
||||
raise TwExtractError(400, "Extract error")
|
||||
|
||||
#def extractUserByID(id):
|
||||
|
||||
def extractUserFeedFromId(userId,workaroundTokens):
|
||||
tokens = workaroundTokens
|
||||
random.shuffle(tokens)
|
||||
for authToken in tokens:
|
||||
if authToken.startswith("oa|"): # oauth token not supported atm
|
||||
# TODO: https://api.twitter.com/graphql/x31u1gdnjcqtiVZFc1zWnQ/UserWithProfileTweetsQueryV2?variables={"cursor":"?","includeTweetImpression":true,"includeHasBirdwatchNotes":false,"includeEditPerspective":false,"includeEditControl":true,"count":40,"rest_id":"12","includeTweetVisibilityNudge":true,"autoplay_enabled":true}&features={"longform_notetweets_inline_media_enabled":true,"super_follow_badge_privacy_enabled":true,"longform_notetweets_rich_text_read_enabled":true,"super_follow_user_api_enabled":true,"unified_cards_ad_metadata_container_dynamic_card_content_query_enabled":true,"super_follow_tweet_api_enabled":true,"articles_api_enabled":true,"android_graphql_skip_api_media_color_palette":true,"creator_subscriptions_tweet_preview_api_enabled":true,"freedom_of_speech_not_reach_fetch_enabled":true,"tweetypie_unmention_optimization_enabled":true,"longform_notetweets_consumption_enabled":true,"subscriptions_verification_info_enabled":true,"blue_business_profile_image_shape_enabled":true,"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled":true,"immersive_video_status_linkable_timestamps":false,"super_follow_exclusive_tweet_notifications_enabled":true}
|
||||
continue
|
||||
try:
|
||||
vars = json.loads('{"userId":"x","count":20,"includePromotedContent":true,"withQuickPromoteEligibilityTweetFields":true,"withVoice":true,"withV2Timeline":true}')
|
||||
vars['userId'] = str(userId)
|
||||
vars['includePromotedContent'] = False # idk if this works
|
||||
reqHeaders = getAuthHeaders(bearer,authToken=authToken)
|
||||
reqHeaders["x-client-transaction-id"] = twUtils.generate_transaction_id("GET","/i/api/graphql/x31u1gdnjcqtiVZFc1zWnQ/UserWithProfileTweetsQueryV2")
|
||||
feed = requests.get(f"https://{twitterUrl}/i/api/graphql/{tweetFeedGraphql_api}/UserTweets?variables={urllib.parse.quote(json.dumps(vars))}&features={urllib.parse.quote(tweetFeedGraphqlFeatures)}", reqHeaders)
|
||||
output = feed.json()
|
||||
if "errors" in output:
|
||||
# pick the first error and create a twExtractError
|
||||
error = output["errors"][0]
|
||||
raise TwExtractError(error["code"], error["message"])
|
||||
return output
|
||||
except Exception as e:
|
||||
continue
|
||||
raise TwExtractError(400, "Extract error")
|
||||
|
||||
def extractUserFeed(username,workaroundTokens):
|
||||
pass
|
||||
|
||||
def lambda_handler(event, context):
|
||||
if ("queryStringParameters" not in event):
|
||||
|
35
twExtract/twUtils.py
Normal file
35
twExtract/twUtils.py
Normal file
@ -0,0 +1,35 @@
|
||||
import math
|
||||
import hashlib
|
||||
import base64
|
||||
import uuid
|
||||
digits = "0123456789abcdefghijklmnopqrstuvwxyz"
|
||||
|
||||
def baseConversion(x, base):
|
||||
result = ''
|
||||
i = int(x)
|
||||
while i > 0:
|
||||
result = digits[i % base] + result
|
||||
i = i // base
|
||||
if int(x) != x:
|
||||
result += '.'
|
||||
i = x - int(x)
|
||||
d = 0
|
||||
while i != int(i):
|
||||
result += digits[int(i * base % base)]
|
||||
i = i * base
|
||||
d += 1
|
||||
if d >= 8:
|
||||
break
|
||||
return result
|
||||
|
||||
|
||||
def calcSyndicationToken(idStr):
|
||||
id = int(idStr) / 1000000000000000 * math.pi
|
||||
o = baseConversion(x=id, base=int(math.pow(6, 2)))
|
||||
c = o.replace('0', '').replace('.', '')
|
||||
if c == '':
|
||||
c = '0'
|
||||
return c
|
||||
|
||||
def generate_transaction_id(method: str, path: str) -> str:
|
||||
return "?" # not implemented
|
@ -26,7 +26,8 @@ testMixedMediaTweet_compare={'text': 'Some of us here are definitely big nerds a
|
||||
testVinePlayerTweet_compare={'text': 'You wanted old ROBLOX back, you got it. Check out our sweet "new" look! #BringBackOldROBLOX https://vine.co/v/OL9VqvM6wJh', 'date': 'Wed Apr 01 16:17:13 +0000 2015', 'tweetURL': 'https://twitter.com/Roblox/status/583302104342638592', 'tweetID': '583302104342638592', 'conversationID': '583302104342638592', 'mediaURLs': ['https://v.cdn.vine.co/r/videos/20A1BE53011195086166081318912_3fe3b526b1a.1.5.3156516531034157495.mp4?versionId=DI1mMu7EI6zcLbvgucyp3GHebdz8.9cQ'], 'media_extended': [{'url': 'https://v.cdn.vine.co/r/videos/20A1BE53011195086166081318912_3fe3b526b1a.1.5.3156516531034157495.mp4?versionId=DI1mMu7EI6zcLbvgucyp3GHebdz8.9cQ', 'type': 'video', 'size': {'width': 435, 'height': 435}}], 'possibly_sensitive': False, 'hashtags': [], 'qrtURL': None, 'allSameType': True, 'hasMedia': True, 'combinedMediaUrl': None, 'pollData': {'options': []}, 'article': None, 'date_epoch': 1427905033}
|
||||
|
||||
testUser="https://twitter.com/jack"
|
||||
testUserID = "https://twitter.com/i/user/12"
|
||||
testUserID=12 # could also be 170824883
|
||||
testUserIDUrl = "https://twitter.com/i/user/"+str(testUserID)
|
||||
testUserWeirdURLs=["https://twitter.com/jack?lang=en","https://twitter.com/jack/with_replies","https://twitter.com/jack/media","https://twitter.com/jack/likes","https://twitter.com/jack/with_replies?lang=en","https://twitter.com/jack/media?lang=en","https://twitter.com/jack/likes?lang=en","https://twitter.com/jack/"]
|
||||
testTextTweet="https://twitter.com/jack/status/20"
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user