mirror of
https://0xacab.org/johnxina/rat.git
synced 2024-12-23 13:09:08 +00:00
50 lines
1.3 KiB
Python
50 lines
1.3 KiB
Python
'''Extra APIs'''
|
|
|
|
import requests
|
|
import bs4
|
|
import re
|
|
|
|
from shared import *
|
|
|
|
# TODO: known bug, can't extract from super old editor images.
|
|
def extract_image_name(url):
|
|
match = re.search(r'/(\w+)\.jpg', url)
|
|
try:
|
|
return match.group(1) + '.jpg'
|
|
except:
|
|
return '404.jpg'
|
|
|
|
@cache.memoize(timeout=60)
|
|
def find_tieba_info(tname):
|
|
"""Get the tiebat avatar for the forum name.
|
|
|
|
:param tname: the name of the target forum.
|
|
:returns: the internal ID of the corresponding avatar.
|
|
|
|
"""
|
|
info = { 'name': tname }
|
|
|
|
res = requests.get('https://tieba.baidu.com/f',
|
|
params={'kw': tname},
|
|
allow_redirects=False)
|
|
|
|
# Baidu will bring us to the search page, so we ignore it.
|
|
if res.status_code == 302:
|
|
raise ValueError('您搜索的贴吧不存在')
|
|
|
|
soup = bs4.BeautifulSoup(res.text, 'html.parser')
|
|
|
|
elems = soup.select('#forum-card-head')
|
|
info['avatar'] = extract_image_name(elems[0]['src'])
|
|
|
|
footer = soup.select('.th_footer_l')[0]
|
|
stat_elems = footer.findAll('span', {'class': 'red_text'}, recursive=False)
|
|
stats = list(map(lambda x: int(x.text), stat_elems))
|
|
|
|
info |= { 'topic': stats[0], 'thread': stats[1], 'member': stats[2] }
|
|
|
|
slogan = soup.select('.card_slogan')[0]
|
|
info['desc'] = slogan.text
|
|
|
|
return info
|