Update getinfobox.py
This commit is contained in:
parent
fbc0a2d226
commit
f95b2b5a4d
1 changed file with 3 additions and 10 deletions
|
@ -13,13 +13,8 @@ from selenium.webdriver.common.desired_capabilities import DesiredCapabilities
|
||||||
|
|
||||||
from config import Config
|
from config import Config
|
||||||
|
|
||||||
config_path = os.path.abspath('./config/config.cfg')
|
|
||||||
|
|
||||||
try:
|
infobox_render = Config().config('infobox_render')
|
||||||
if config_path:
|
|
||||||
infobox_render = Config().config(config_path, 'infobox_render')
|
|
||||||
except:
|
|
||||||
infobox_render = None
|
|
||||||
|
|
||||||
|
|
||||||
async def get_infobox_pic(link, pagelink, headers):
|
async def get_infobox_pic(link, pagelink, headers):
|
||||||
|
@ -27,8 +22,6 @@ async def get_infobox_pic(link, pagelink, headers):
|
||||||
print('hello')
|
print('hello')
|
||||||
wlink = re.sub(r'api.php', '', link)
|
wlink = re.sub(r'api.php', '', link)
|
||||||
link = re.sub(r'(?:w/|)api.php', '', link)
|
link = re.sub(r'(?:w/|)api.php', '', link)
|
||||||
print(link)
|
|
||||||
print(pagelink)
|
|
||||||
try:
|
try:
|
||||||
async with aiohttp.ClientSession(headers=headers) as session:
|
async with aiohttp.ClientSession(headers=headers) as session:
|
||||||
async with session.get(pagelink, timeout=aiohttp.ClientTimeout(total=20)) as req:
|
async with session.get(pagelink, timeout=aiohttp.ClientTimeout(total=20)) as req:
|
||||||
|
@ -36,14 +29,13 @@ async def get_infobox_pic(link, pagelink, headers):
|
||||||
except:
|
except:
|
||||||
traceback.print_exc()
|
traceback.print_exc()
|
||||||
return False
|
return False
|
||||||
print(111)
|
|
||||||
soup = BeautifulSoup(html, 'html.parser')
|
soup = BeautifulSoup(html, 'html.parser')
|
||||||
pagename = uuid.uuid4()
|
pagename = uuid.uuid4()
|
||||||
url = os.path.abspath(f'./cache/{pagename}.html')
|
url = os.path.abspath(f'./cache/{pagename}.html')
|
||||||
if os.path.exists(url):
|
if os.path.exists(url):
|
||||||
os.remove(url)
|
os.remove(url)
|
||||||
print(222)
|
print(222)
|
||||||
find_infobox = soup.find(class_='notaninfobox') # 我
|
find_infobox = soup.find(class_='.notaninfobox') # 我
|
||||||
if find_infobox is None: # 找
|
if find_infobox is None: # 找
|
||||||
find_infobox = soup.find(class_='portable-infobox') # 找
|
find_infobox = soup.find(class_='portable-infobox') # 找
|
||||||
if find_infobox is None: # 找
|
if find_infobox is None: # 找
|
||||||
|
@ -60,6 +52,7 @@ async def get_infobox_pic(link, pagelink, headers):
|
||||||
find_infobox = soup.find(class_='wikitable songtable') # 找 (arcw)
|
find_infobox = soup.find(class_='wikitable songtable') # 找 (arcw)
|
||||||
if find_infobox is None: # 找
|
if find_infobox is None: # 找
|
||||||
return False # 找你妈,不找了<-咱还是回家吧
|
return False # 找你妈,不找了<-咱还是回家吧
|
||||||
|
print('Find infobox..')
|
||||||
|
|
||||||
if infobox_render is None:
|
if infobox_render is None:
|
||||||
open_file = open(url, 'a', encoding='utf-8')
|
open_file = open(url, 'a', encoding='utf-8')
|
||||||
|
|
Reference in a new issue