searxng/searx/engines/twitter.py

76 lines
2.4 KiB
Python
Raw Normal View History

2022-08-14 01:39:41 +00:00
# SPDX-License-Identifier: AGPL-3.0-or-later
# lint: pylint
"""Twitter (microblogging platform)"""
from json import loads
from urllib.parse import urlencode
from datetime import datetime
# Engine metadata.
about = {
    "website": "https://twitter.com",
    "wikidata_id": None,
    "official_api_documentation": "https://developer.twitter.com/en/docs/twitter-api",
    "use_official_api": True,
    "require_api_key": False,
    "results": "JSON",
}

# Categories this engine is listed under.
categories = ["social media"]

# Base URL of the API host; substituted into ``search_url`` as ``{url}``.
url = "https://api.twitter.com"

# Template for the search endpoint.  ``{query}`` is replaced with the
# already URL-encoded ``q=...`` pair; the remaining parameters are fixed.
search_url = (
    "{url}/2/search/adaptive.json?{query}"
    "&tweet_mode=extended"
    "&query_source=typed_query"
    "&pc=1"
    "&spelling_corrections=1"
)
def request(query, params):
    """Fill in the outgoing request for a Twitter search.

    Sets ``params['url']`` to the search endpoint with *query* URL-encoded
    as the ``q`` parameter, and replaces ``params['headers']`` with a dict
    holding only the ``Authorization`` header.  Returns the same *params*
    object that was passed in.
    """
    encoded_query = urlencode({'q': query})

    # This token is used in the Twitter web interface (twitter.com). Without this header, the API doesn't work.
    # The value of the token has never changed (or maybe once a long time ago).
    # https://github.com/zedeus/nitter/blob/5f31e86e0e8578377fa7d5aeb9631bbb2d35ef1e/src/consts.nim#L5
    bearer_token = (
        "Bearer AAAAAAAAAAAAAAAAAAAAAPYXBAAAAAAACLXUNDekMxqa8h%2F40K4moUkGsoc%3DTYfbDKb"
        "T3jJPCEVnMYqilB28NHfOPqkca3qaAxGfsyKCs0wRbw"
    )

    params['url'] = search_url.format(url=url, query=encoded_query)
    params['headers'] = {'Authorization': bearer_token}
    return params
def response(resp):
    """Convert a Twitter search reply into a list of result dicts.

    ``resp.text`` must be a JSON document with a top-level ``globalObjects``
    mapping.  Its optional ``tweets`` and ``users`` sub-mappings are walked
    in that order; a missing or null section is treated as empty.

    Each tweet yields a dict with ``url``, ``title`` (the first 40
    characters of the full text, followed by ``...`` when truncated),
    ``content`` (the full text sliced to ``display_text_range``, or the
    whole text when that range is absent), ``img_src`` (thumbnail URL of the
    first media item, or ``None``) and ``publishedDate`` (a timezone-aware
    ``datetime`` parsed from ``created_at``).

    Each user yields a dict with ``title``, ``content``, ``url`` and
    ``img_src``.

    Raises:
        KeyError: if ``globalObjects`` is missing (kept strict so an error
            payload is not silently reported as "no results"), or if a
            tweet/user lacks one of its mandatory fields.
    """
    results = []
    global_objects = loads(resp.text)['globalObjects']

    for tweet in (global_objects.get('tweets') or {}).values():
        text = tweet['full_text']
        # Fall back to the complete text when no display range is supplied.
        display = tweet.get('display_text_range') or (0, len(text))

        # 'extended_entities' / 'media' may be absent, null, or an empty
        # list; in all of those cases there is simply no thumbnail.
        media = (tweet.get('extended_entities') or {}).get('media') or [{}]
        img_src = media[0].get('media_url_https')
        if img_src:
            img_src += "?name=thumb"

        results.append(
            {
                'url': 'https://twitter.com/i/web/status/' + tweet['id_str'],
                'title': (text[:40] + '...') if len(text) > 40 else text,
                'content': text[display[0] : display[1]],
                'img_src': img_src,
                'publishedDate': datetime.strptime(tweet['created_at'], '%a %b %d %H:%M:%S %z %Y'),
            }
        )

    for user in (global_objects.get('users') or {}).values():
        results.append(
            {
                'title': user['name'],
                'content': user['description'],
                'url': 'https://twitter.com/' + user['screen_name'],
                'img_src': user['profile_image_url_https'],
            }
        )

    return results