89 lines
No EOL
4 KiB
Python
89 lines
No EOL
4 KiB
Python
import json
|
||
import re
|
||
import requests
|
||
import urllib
|
||
import traceback
|
||
from interwikilist import iwlist,iwlink
|
||
async def wiki1(path1, pagename):
    """Look up ``pagename`` on the MediaWiki site at ``path1`` and build a reply.

    Args:
        path1: Base URL of the wiki.  ``'api.php'`` is concatenated to it
            directly, so it has to end with ``/`` already.
        pagename: Page title as supplied by the caller.  It may end with a
            ``#section`` suffix, or have the form ``prefix:title``.

    Returns:
        A reply string, one of:

        * an error message quoting the API's ``invalidreason`` when the
          title is flagged ``invalid``;
        * a "did you mean" suggestion taken from the wiki's search (or a
          plain not-found message) when the title is flagged ``missing``;
        * ``path1`` plus the percent-encoded ``pagename`` when the API
          reports page id ``-1`` with neither flag;
        * the page URL, an optional redirect note and the text returned by
          the extracts query when the page exists;
        * the result of ``wiki2`` when processing the response failed and
          ``pagename`` starts with a prefix contained in ``iwlist()``;
        * an error message otherwise.

    Raises:
        Whatever ``requests.get`` / ``json.loads`` raise for the first
        (metadata) request, which sits outside the ``try`` block.
    """
    # The file only has ``import urllib``; that alone does not load the
    # ``parse`` submodule, so import it explicitly instead of relying on
    # another package having done so.
    import urllib.parse

    # NOTE(review): requests.get is synchronous, so every HTTP call below
    # blocks the event loop this coroutine runs on until it completes.
    # NOTE(review): pagename is interpolated into the query strings
    # unescaped.  A '#' is (usefully) dropped as a URL fragment, but an '&'
    # in a title would split the query -- confirm before switching to
    # ``params=``.
    print(pagename)
    api_url = path1 + 'api.php'
    metaurl = api_url + '?action=query&format=json&prop=info&inprop=url&redirects&titles=' + pagename
    print(metaurl)
    metadata = json.loads(requests.get(metaurl, timeout=10).text)

    try:
        pages = metadata['query']['pages']
        page_id = sorted(pages.keys())[0]

        if int(page_id) == -1:
            stub = pages['-1']
            if 'invalid' in stub:
                reason = stub['invalidreason'].replace(
                    'The requested page title contains invalid characters:',
                    '请求的页面标题包含非法字符:')
                return '发生错误:“' + reason + '”。'
            if 'missing' not in stub:
                return '您要的' + pagename + ':' + path1 + urllib.parse.quote(pagename.encode('UTF-8'))

            # Page does not exist: ask the wiki's search for the closest
            # title, first via generator=search, then via list=search.
            try:
                try:
                    searchurl = api_url + '?action=query&generator=search&gsrsearch=' + pagename + '&gsrsort=just_match&gsrenablerewrites&prop=info&gsrlimit=1&format=json'
                    hits = json.loads(requests.get(searchurl, timeout=10).text)['query']['pages']
                    suggestion = hits[sorted(hits.keys())[0]]['title']
                except Exception:
                    searchurl = api_url + '?action=query&list=search&srsearch=' + pagename + '&srwhat=text&srlimit=1&srenablerewrites=&format=json'
                    found = json.loads(requests.get(searchurl, timeout=10).text)
                    suggestion = found['query']['search'][0]['title']
                return '找不到条目,您是否要找的是:' + suggestion + '?'
            except Exception:
                return '找不到条目。'

        page = pages[page_id]
        fullurl = page['fullurl']
        # Use the title reported by the API rather than scraping it out of
        # ``fullurl``: the URL layout differs between sites (article-path
        # prefix, index.php?title=..., subpages containing '/').
        title = page['title']

        # The extract is optional; any failure just leaves it empty.
        try:
            texturl = api_url + '?action=query&prop=extracts&exsentences=1&explaintext&exsectionformat=wiki&format=json&titles=' + urllib.parse.quote(title)
            extract = json.loads(requests.get(texturl, timeout=10).text)['query']['pages'][page_id]['extract']
        except Exception:
            extract = ''

        # Re-attach a trailing "#section" from the request to both the link
        # and the title that is compared against the request.
        link = fullurl
        resolved = title
        section = re.match(r'.*(\#.*)', pagename)
        if section:
            link += urllib.parse.quote(section.group(1).encode('UTF-8'))
            resolved += section.group(1)
        resolved = resolved.replace('_', ' ')

        if resolved == pagename:
            body = link + '\n' + extract
        else:
            body = '\n(重定向[' + pagename + ']至[' + resolved + '])\n' + link + '\n' + extract
        # Drop the trailing newline left behind by an empty extract.
        return '您要的' + pagename + ":" + re.sub('\n$', '', body)
    except Exception as err:
        # The response could not be processed as a page lookup; treat
        # ``pagename`` as "prefix:title" and retry through wiki2 if the
        # prefix is listed by iwlist().
        prefixed = re.match(r'(.*?):(.*)', pagename)
        if prefixed is None:
            # No prefix to try: report the error that actually occurred.
            traceback.print_exc()
            return '发生错误:' + str(err)
        try:
            prefix = prefixed.group(1)
            if prefix in iwlist():
                return await wiki2(prefix, prefixed.group(2))
            return '发生错误:内容非法。'
        except Exception as e:
            traceback.print_exc()
            return '发生错误:' + str(e)
|
||
|
||
|
||
async def wiki2(lang, str1):
    """Run a ``wiki1`` lookup for ``str1`` against the URL from ``iwlink(lang)``.

    The value returned by ``iwlink(lang)`` is passed to ``wiki1`` as its
    base URL.  If either call raises, the traceback is printed and the
    exception's message is returned as the reply instead.
    """
    try:
        base_url = iwlink(lang)
        reply = await wiki1(base_url, str1)
    except Exception as exc:
        traceback.print_exc()
        return str(exc)
    return reply