0013 Done.

ddkangfu · ddkangfu · commit 2155c8f9ebd2 · 2015-01-05T22:19:43.000+08:00
diff --git a/ddkangfu/0013/0013.py b/ddkangfu/0013/0013.py
@@ -0,0 +1,56 @@
+# coding=utf-8
+
+import urllib2
+import urllib
+import os
+
+from bs4 import BeautifulSoup
+
+"""
+0013:用 Python 写一个爬图片的程序，爬 [这个链接里的日本妹子图片 :-)](http://tieba.baidu.com/p/2166231880)
+"""
+
+
+def get_img_src_list(url, img_class):
+    content = urllib2.urlopen(url).read()
+
+    soup = BeautifulSoup(content)
+    #print soup
+    src_list = []
+
+    for img in  soup.find_all('img', img_class):
+        src_list.append(img['src'])
+
+    return src_list   
+
+
+def download_img(src, download_path):
+    print 'Begin download image : %s ......' % src
+
+    file_name =  src.split("/")[-1]
+    dist = os.path.join(download_path, file_name)
+
+    urllib.urlretrieve(src, dist, None)
+
+    print 'Download image %s Done.' % src
+
+
+
+if __name__ == '__main__':
+    src_list = get_img_src_list('http://tieba.baidu.com/p/2166231880', 'BDE_Image')
+    
+    if src_list:
+        save_path = os.path.abspath("./downlaod")
+        if not os.path.exists(save_path):
+            os.mkdir(save_path)
+
+        print 'Start download %d images.....' % len(src_list)
+
+        for src in src_list:
+            download_img(src, save_path)
+
+        print 'Download %d images done.' % len(src_list)
+    else:
+        print 'No Imges found !!!'
+
+