The script should open a preview of amazon book, list all given pages ( images ), download it's content and print it.
import time
import subprocess
from selenium import webdriver
from urllib.request import urlretrieve
driver = webdriver.Firefox()
driver.get("http://www.amazon.com/War-Peace-Leo-Nikolayevich-Tolstoy/dp/1427030200")
time.sleep(2)
driver.find_element_by_id("imgBlkFront").click()
imageList = set()
time.sleep(5)
while "pointer" in driver.find_element_by_id("sitbReaderRightPageTurner").get_attribute("style"):
driver.find_element_by_id("sitbReaderRightPageTurner").click()
time.sleep(2)
pages = driver.find_elements_by_xpath("//div[@class='pageImage']/div/img")
for page in pages:
image = page.get_attribute("src")
imageList.add(image)
driver.quit()
for image in sorted(imageList):
urlretrieve(image, "page.jpg")
p = subprocess.Popen(["tesseract", "page.jpg", "page"], stdout=subprocess.PIPE, stderr=subprocess.PIPE)
p.wait()
f = open("page.txt", "r")
print(f.read())but this is what I getError:Traceback (most recent call last):
File "C:\Python36\kodovi\bookpreview.py", line 26, in <module>
p = subprocess.Popen(["tesseract", "page.jpg", "page"], stdout=subprocess.PI
PE, stderr=subprocess.PIPE)
File "C:\Python36\lib\subprocess.py", line 709, in __init__
restore_signals, start_new_session)
File "C:\Python36\lib\subprocess.py", line 997, in _execute_child
startupinfo)
FileNotFoundError: [WinError 2] The system cannot find the file specified
