用百度的文字识别(OCR)API,可以识别广西公需科目“当代科学技术前沿知识”的文档《当代科学技术前沿知识读本》电子书(全文).pdf。这个文档可以在平台下载,下载后把文字识别出来,就方便搜索答案了。
自动考试视频
guagnxi视频.mp4
#考试代码
# Tick the known answers for every question on the exam page.
#
# Relies on names defined earlier in the script (not visible in this snippet):
#   cont    - iterable of parsed question nodes exposing `.text` and `.attrs['id']`
#   daan    - mapping: question text -> iterable of correct option texts
#   browser - presumably a Selenium WebDriver -- TODO confirm
# NOTE(review): the `find_element(s)_by_*` helpers were removed in Selenium 4.3;
# confirm the installed Selenium version still provides them.

# Raw string so the backslashes reach the regex engine unchanged; compiled once
# because the pattern does not vary between questions.
question_pattern = re.compile(r'\. (.+)\[\d分\]')

for node in cont:
    matched = question_pattern.search(node.text)
    if matched is None:
        # Node text is not of the form "<n>. <question>[<d>分]"; nothing to answer.
        continue
    question = matched.group(1)

    try:
        answers = daan[question]
    except KeyError:
        print('no answer on record for: ' + question)
        continue

    print(question)
    print(answers)
    print('\n')

    # Answering is deliberately best-effort: a failure on one question is
    # reported and the loop moves on instead of aborting the whole exam.
    try:
        container = browser.find_element_by_id(node.attrs['id'])
        option_texts = [
            title.text
            for title in container.find_elements_by_class_name('cTitle')
        ]
        inputs = container.find_elements_by_css_selector('input')
        for answer in answers:
            try:
                position = option_texts.index(answer)
            except ValueError:
                # This answer is not among the displayed options; keep going
                # so the remaining answers of the question are still ticked.
                print('option not found on page: ' + str(answer))
                continue
            inputs[position].click()
            time.sleep(0.5)  # short pause between clicks
            print(answer)
    except Exception as exc:
        print('failed to answer question: ' + question + ' (' + repr(exc) + ')')
from aip import AipOcr
def bai(na='1.jpg'):
    """Send one image file to Baidu OCR and print each recognized line.

    Args:
        na: Path of the image file to recognize. Defaults to ``'1.jpg'``.

    Returns:
        None. Recognized lines are printed. If the response has no
        ``'words_result'`` entry, the raw response is printed instead so the
        failure is visible without aborting a batch run.
    """
    # Fill in your own Baidu AI credentials: APPID, API key (AK), secret key (SK).
    APP_ID = ''
    API_KEY = ''
    SECRET_KEY = ''
    client = AipOcr(APP_ID, API_KEY, SECRET_KEY)

    # The context manager closes the file handle even if reading fails.
    with open(na, 'rb') as image_file:
        image = image_file.read()

    response = client.basicGeneral(image)
    try:
        recognized = response['words_result']
    except KeyError:
        print('OCR returned no words_result for ' + str(na) + ': ' + str(response))
        return

    for entry in recognized:
        print(entry['words'])
def file_name(file_dir):
    """Walk ``file_dir`` recursively and run ``bai`` on every non-Python file.

    Args:
        file_dir: Directory whose files (including those in subdirectories)
            are passed to ``bai``.

    Files whose name contains ``'.py'`` are skipped.
    """
    # Function-scope import: the visible part of the file never imports `os`.
    import os

    # os.walk yields (current directory path, its subdirectories, its files).
    for root, _dirs, files in os.walk(file_dir):
        for name in files:
            if '.py' in str(name):
                continue
            # Join with `root` so the file is found regardless of the current
            # working directory and when it lives in a subdirectory.
            bai(os.path.join(root, name))
识别出来的结果:下面是我识别出的一小半,完整的电子书答案共有 288 页图片。