The script should open a preview of amazon book, list all given pages ( images ), download it's content and print it.
import time import subprocess from selenium import webdriver from urllib.request import urlretrieve driver = webdriver.Firefox() driver.get("http://www.amazon.com/War-Peace-Leo-Nikolayevich-Tolstoy/dp/1427030200") time.sleep(2) driver.find_element_by_id("imgBlkFront").click() imageList = set() time.sleep(5) while "pointer" in driver.find_element_by_id("sitbReaderRightPageTurner").get_attribute("style"): driver.find_element_by_id("sitbReaderRightPageTurner").click() time.sleep(2) pages = driver.find_elements_by_xpath("//div[@class='pageImage']/div/img") for page in pages: image = page.get_attribute("src") imageList.add(image) driver.quit() for image in sorted(imageList): urlretrieve(image, "page.jpg") p = subprocess.Popen(["tesseract", "page.jpg", "page"], stdout=subprocess.PIPE, stderr=subprocess.PIPE) p.wait() f = open("page.txt", "r") print(f.read())but this is what I get
Error:Traceback (most recent call last):
File "C:\Python36\kodovi\bookpreview.py", line 26, in <module>
p = subprocess.Popen(["tesseract", "page.jpg", "page"], stdout=subprocess.PI
PE, stderr=subprocess.PIPE)
File "C:\Python36\lib\subprocess.py", line 709, in __init__
restore_signals, start_new_session)
File "C:\Python36\lib\subprocess.py", line 997, in _execute_child
startupinfo)
FileNotFoundError: [WinError 2] The system cannot find the file specified