From bdf89644b855d15fd9869666b4d6754476e4cd94 Mon Sep 17 00:00:00 2001
From: LiZheng
Date: Sat, 5 May 2018 09:45:36 +0800
Subject: [PATCH 1/2] add unsplash

---
 crawler/unsplash.py | 59 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 59 insertions(+)
 create mode 100644 crawler/unsplash.py

diff --git a/crawler/unsplash.py b/crawler/unsplash.py
new file mode 100644
index 000000000000..1c8cf21b7b03
--- /dev/null
+++ b/crawler/unsplash.py
@@ -0,0 +1,59 @@
+#-*-encoding:utf-8-*-
+import os, shutil
+import requests
+from bs4 import BeautifulSoup
+import json
+import threading
+
+Url = 'https://unsplash.com/'
+Start = 'https://unsplash.com/napi/feeds/home?after=95cc4cd0-4529-11e8-8080-8001050033a3'
+Pattern = 'https://unsplash.com/napi/feeds/home?after=xxx'
+Auth = {'Authorization':'Client-ID 72664f05b2aee9ed032f9f4084f0ab55aafe02704f8b7f8ef9e28acbec372d09'}
+Des = 'data'
+Pages = 50
+
+
+def GetJson(target):
+    req = requests.get(target, headers=Auth, verify=False)
+    if req.status_code == 200:
+        return req.json()
+    else:
+        print('response error: ', req.status_code)
+
+def SavePhoto(photo, regular_size=True):
+    target = photo['m_size']
+    if not regular_size:
+        target = photo['l_size']
+    req = requests.get(target, headers=Auth, verify=False)
+    file = os.path.join(Des, photo['name'])
+    file = file + '.jpg'
+    with open(file, 'wb') as f:
+        f.write(req.content)
+
+if __name__ == '__main__':
+    os.chdir(os.curdir)
+    if not os.path.exists(Des):
+        os.mkdir(Des)
+
+    js = GetJson(Start)
+    cur_page = 1
+    while cur_page < Pages:
+        print('saving page: ', cur_page)
+        after_value = js['next_page'].split('=')[1]
+        next_target = Pattern.replace('xxx', after_value)
+        photos = []
+        for photo in js['photos']:
+            pt = {}
+            pt['id'] = photo['id']
+            pt['m_size'] = photo['urls']['regular']
+            pt['l_size'] = photo['urls']['full']
+
+            pt['name'] = photo['id']
+            photos.append(pt)
+        threads = [threading.Thread(target=SavePhoto, args=(photo, )) for photo in photos]
+        for t in threads:
+            t.start()
+        # for t in threads:
+        #     t.join()
+        js = GetJson(next_target)
+        cur_page += 1

From 92b5af6a1ddc105754852cf48ff8b56dc1dfbbdb Mon Sep 17 00:00:00 2001
From: LiZheng
Date: Sat, 5 May 2018 09:52:32 +0800
Subject: [PATCH 2/2] revert

---
 crawler/unsplash.py | 59 ---------------------------------------------
 1 file changed, 59 deletions(-)
 delete mode 100644 crawler/unsplash.py

diff --git a/crawler/unsplash.py b/crawler/unsplash.py
deleted file mode 100644
index 1c8cf21b7b03..000000000000
--- a/crawler/unsplash.py
+++ /dev/null
@@ -1,59 +0,0 @@
-#-*-encoding:utf-8-*-
-import os, shutil
-import requests
-from bs4 import BeautifulSoup
-import json
-import threading
-
-Url = 'https://unsplash.com/'
-Start = 'https://unsplash.com/napi/feeds/home?after=95cc4cd0-4529-11e8-8080-8001050033a3'
-Pattern = 'https://unsplash.com/napi/feeds/home?after=xxx'
-Auth = {'Authorization':'Client-ID 72664f05b2aee9ed032f9f4084f0ab55aafe02704f8b7f8ef9e28acbec372d09'}
-Des = 'data'
-Pages = 50
-
-
-def GetJson(target):
-    req = requests.get(target, headers=Auth, verify=False)
-    if req.status_code == 200:
-        return req.json()
-    else:
-        print('response error: ', req.status_code)
-
-def SavePhoto(photo, regular_size=True):
-    target = photo['m_size']
-    if not regular_size:
-        target = photo['l_size']
-    req = requests.get(target, headers=Auth, verify=False)
-    file = os.path.join(Des, photo['name'])
-    file = file + '.jpg'
-    with open(file, 'wb') as f:
-        f.write(req.content)
-
-if __name__ == '__main__':
-    os.chdir(os.curdir)
-    if not os.path.exists(Des):
-        os.mkdir(Des)
-
-    js = GetJson(Start)
-    cur_page = 1
-    while cur_page < Pages:
-        print('saving page: ', cur_page)
-        after_value = js['next_page'].split('=')[1]
-        next_target = Pattern.replace('xxx', after_value)
-        photos = []
-        for photo in js['photos']:
-            pt = {}
-            pt['id'] = photo['id']
-            pt['m_size'] = photo['urls']['regular']
-            pt['l_size'] = photo['urls']['full']
-
-            pt['name'] = photo['id']
-            photos.append(pt)
-        threads = [threading.Thread(target=SavePhoto, args=(photo, )) for photo in photos]
-        for t in threads:
-            t.start()
-        # for t in threads:
-        #     t.join()
-        js = GetJson(next_target)
-        cur_page += 1
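For reference, here is a minimal sketch of the crawl loop the reverted script implemented: page through the napi home feed via the next_page cursor, then download each photo of a page on its own thread. It restores the commented-out t.join() so a page's downloads finish before the cursor advances, drops the unused imports (shutil, BeautifulSoup, json), and removes verify=False. The feed endpoint, the Client-ID header, and the response shape (next_page, photos[].id, photos[].urls) are all taken from the patch above and may have changed on Unsplash's side since 2018; the client ID and seed cursor below are placeholders, not working values.

    import os
    import threading
    import requests

    API = 'https://unsplash.com/napi/feeds/home'
    # Placeholders -- substitute real values, as in the patch above.
    AUTH = {'Authorization': 'Client-ID <your-client-id>'}
    START = API + '?after=<seed-cursor>'
    DEST = 'data'
    PAGES = 50


    def get_json(url):
        resp = requests.get(url, headers=AUTH, timeout=30)
        resp.raise_for_status()  # surface HTTP errors instead of returning None
        return resp.json()


    def save_photo(photo):
        # 'regular' is the medium size; the patch also exposed 'full'.
        resp = requests.get(photo['urls']['regular'], headers=AUTH, timeout=60)
        resp.raise_for_status()
        with open(os.path.join(DEST, photo['id'] + '.jpg'), 'wb') as f:
            f.write(resp.content)


    if __name__ == '__main__':
        os.makedirs(DEST, exist_ok=True)
        url = START
        for page in range(1, PAGES + 1):
            print('saving page:', page)
            js = get_json(url)
            threads = [threading.Thread(target=save_photo, args=(p,))
                       for p in js['photos']]
            for t in threads:
                t.start()
            for t in threads:
                t.join()  # wait for this page's downloads before paginating
            # 'next_page' carries the cursor for the following feed page.
            url = API + '?after=' + js['next_page'].split('=')[1]

Joining per page bounds the number of live threads to one page's worth of photos and guarantees the process never advances the cursor, or exits, while downloads are still in flight, which appears to be the intent behind the join the original left commented out.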