abstruse goose downloader

2016-02-10 22:40:26 +01:00 · 2016-02-10 22:40:26 +01:00 · ee09097389
commit ee09097389
parent 45b211785f
1 changed files with 33 additions and 0 deletions
--- a/download_abstrusegoose.py
+++ b/download_abstrusegoose.py
@@ -0,0 +1,33 @@
 #!/usr/bin/env python2
 import requests
 from bs4 import BeautifulSoup
 # Inclusive range of comic numbers visited by run(); each number is
 # substituted into the comic page URL.
 FIRST_COMIC = 1
 LAST_COMIC = 575
 def download(img_url, i, timeout=30):
     """Download one comic image into the current working directory.

     The file is named with the comic number zero-padded to four digits,
     an underscore, and the last path segment of ``img_url``.

     Args:
         img_url: URL of the image to fetch.
         i: Comic number, used as the file-name prefix.
         timeout: Seconds to wait on the server before requests gives up,
             so a stalled connection cannot hang the whole run.

     A response with an error status is reported and skipped, so an HTML
     error page is never saved under an image file name.
     """
     img = requests.get(img_url, stream=True, timeout=timeout)
     try:
         if not img.ok:
             print("Skipped %s (HTTP %d)" % (img_url, img.status_code))
             return
         file_name = "%04d_%s" % (i, img_url.split("/")[-1])
         with open(file_name, "wb") as f:
             for chunk in img.iter_content(chunk_size=1024):
                 # Empty chunks can appear as keep-alive filler; skip them.
                 if chunk:
                     f.write(chunk)
         # Single-argument parenthesised form prints the same text under
         # both Python 2 and Python 3.
         print("Got %s" % file_name)
     finally:
         # A streamed response keeps its connection checked out until it is
         # fully consumed or explicitly closed.
         img.close()
 def run():
     """Download the image of every comic from FIRST_COMIC to LAST_COMIC.

     For each comic number the page ``http://abstrusegoose.com/<number>`` is
     fetched and parsed; the first ``<img>`` inside the first ``<section>``
     is taken as the comic image and handed to ``download``. Pages without
     a ``<section>``, without an ``<img>`` in it, or whose ``<img>`` has no
     usable ``src`` are skipped silently.
     """
     for i in range(FIRST_COMIC, LAST_COMIC + 1):
         # Timeout keeps a stalled server from hanging the run forever.
         p = requests.get("http://abstrusegoose.com/%d" % i, timeout=30)
         soup = BeautifulSoup(p.text, "html.parser")
         section = soup.find("section")
         if not section:
             continue
         img = section.find("img")
         if not img:
             continue
         # .get() yields None for a missing attribute, whereas img["src"]
         # would raise KeyError before the emptiness check could run.
         src = img.get("src")
         if src:
             download(src, i)
 # Start the download only when executed as a script, not when imported.
 if __name__ == "__main__":
    run()