mirror of
https://github.com/NaiboWang/EasySpider.git
synced 2025-04-20 10:05:00 +08:00
Version 0.3.0 Beta
This commit is contained in:
parent
76e6800cb8
commit
f76cd8dd88
@ -691,7 +691,7 @@ def getData(para, loopElement, isInLoop=True, parentPath="", index=0):
|
|||||||
text = pytesseract.image_to_string(image, lang='chi_sim+eng')
|
text = pytesseract.image_to_string(image, lang='chi_sim+eng')
|
||||||
content = text
|
content = text
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
content = "OCR失败"
|
content = "OCR Error"
|
||||||
print("To use OCR, You need to install Tesseract-OCR and add it to the environment variable PATH: https://tesseract-ocr.github.io/tessdoc/Installation.html")
|
print("To use OCR, You need to install Tesseract-OCR and add it to the environment variable PATH: https://tesseract-ocr.github.io/tessdoc/Installation.html")
|
||||||
print("要使用OCR识别功能,你需要安装Tesseract-OCR并将其添加到环境变量PATH中:https://blog.csdn.net/u010454030/article/details/80515501")
|
print("要使用OCR识别功能,你需要安装Tesseract-OCR并将其添加到环境变量PATH中:https://blog.csdn.net/u010454030/article/details/80515501")
|
||||||
elif p["contentType"] == 9:
|
elif p["contentType"] == 9:
|
||||||
|
@ -53,7 +53,7 @@ Bilibili/B站视频教程:
|
|||||||
|
|
||||||
[如何爬需要输入验证码的网站](https://www.bilibili.com/video/BV18c411K7FH)
|
[如何爬需要输入验证码的网站](https://www.bilibili.com/video/BV18c411K7FH)
|
||||||
|
|
||||||
[如何切换IP池和使用隧道IP - 打开详情页采集案](https://www.bilibili.com/video/BV1KT411t79n)
|
[如何切换IP池和使用隧道IP - 打开详情页采集案例](https://www.bilibili.com/video/BV1KT411t79n)
|
||||||
|
|
||||||
|
|
||||||
Refer to [Youtube Playlist](https://youtube.com/playlist?list=PL0kEFEkWrT7mt9MUlEBV2DTo1QsaanUTp) to see the video tutorials of EasySpider.
|
Refer to [Youtube Playlist](https://youtube.com/playlist?list=PL0kEFEkWrT7mt9MUlEBV2DTo1QsaanUTp) to see the video tutorials of EasySpider.
|
||||||
|
Loading…
x
Reference in New Issue
Block a user