Downloading images using src in python produces empty images

Question

My script is kind of working, but the files it saves are empty. Any ideas? Forgive me for all the unused imports at the top! I tried a lot of different things to do this. Here I'm pulling the img elements using Selenium. The SRCs are then iterated over in a loop and transformed into bytes so that they can be…

Accepted Answer

You forgot to use `requests` to get the data from the server:

```python
    response = requests.get(img_src)
    data = response.content

    with open(fullname, "wb") as f:
        f.write(data)
```

Minimal working example.

It works for me for the first few images. The other images may need a longer `sleep()`, or the page may need to be scrolled to the bottom so that JavaScript loads all the `src` attributes.

```python
import os
import time
import requests
from selenium import webdriver
from selenium.webdriver.firefox.options import Options
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.common.by import By

options = Options()
options.headless = True

driver = webdriver.Firefox(options=options)
driver.get("https://superrare.com/features/the-intersection-of-machine-and-artist")
time.sleep(2)

#the element with longest height on page
root = driver.find_element("xpath", '//div[@id="root"]')
total_height = root.size["height"] + 8000
print('total_height:', total_height)
time.sleep(2)
driver.set_window_size(1920, total_height)
time.sleep(2)

imgs = WebDriverWait(driver, 50).until(EC.presence_of_all_elements_located((By.XPATH, "//img")))
time.sleep(5)
print('len(imgs):', len(imgs))

download_folder = "/Users/rcastong/Desktop/imgs"

# it will create only if not exists
os.makedirs(download_folder, exist_ok=True)

for number, item in enumerate(imgs, 1):
    print('---', number, '---')
    img_src = item.get_attribute("src")
    print('from:', img_src)
    fullname = os.path.join(download_folder, os.path.basename(img_src))
    print('  to:', fullname)

    response = requests.get(img_src)
    data = response.content

    with open(fullname, "wb") as f:
        f.write(data)
```

Advertisement

Answer