#!/usr/bin/env python
# -*- encoding: utf-8 -*-
"""
@File : get_face.py
@Time : 2019/05/16 05:44:10
@Author : Liuyuqi
@Version : 1.0
@Contact : liuyuqi.gov@msn.cn
@License : (C)Copyright 2019
@Desc : Fetch user avatars: export the avatar field of the User table to a
        text file (one URL per line), then download every URL in it.
"""
import os
import re
import sys
import urllib.request

# Project directory; the relative paths below are resolved against it.
SRC_DIR = "C:/Users/liuyuqi/Desktop/crawl_bilibili"
# Text file holding one avatar URL per line.
FACE_LIST = "data/bilibili_user_face.txt"
# NOTE(review): the list is read from "data/" but images are written one
# level up ("../data/face/"). Kept as in the original script -- confirm
# that this is the intended destination.
FACE_DIR = r"../data/face/"
# The original loop ran over range(1, 1000), i.e. at most 999 lines.
MAX_FACES = 999

# URLs with this prefix are reported as "noface" and never downloaded
# (presumably the site's default avatar -- confirm against the data).
_NO_FACE_RE = re.compile(r"http://static.*")


def download_faces(list_path, out_dir, limit=MAX_FACES):
    """Download the avatar URLs listed in *list_path* into *out_dir*.

    Each image is saved as ``<line number>.jpg``, where the line number is
    the 1-based position of the URL in the list file. Blank lines and
    "noface" lines still consume a number, so file names always map back
    to a line of the list.

    Args:
        list_path: Path of a text file with one URL per line.
        out_dir: Directory that receives the images; created if missing.
        limit: Maximum number of lines to process.

    Returns:
        The number of images downloaded successfully.
    """
    os.makedirs(out_dir, exist_ok=True)
    downloaded = 0
    with open(list_path) as face_list:
        # Iterating the file ends at EOF, so a short list no longer leads
        # to urlretrieve('') being called for the remaining iterations.
        for index, raw_line in enumerate(face_list, start=1):
            if index > limit:
                break
            # Drop the trailing newline; it must not become part of the URL.
            url = raw_line.strip()
            if not url:
                continue
            print(url)
            if _NO_FACE_RE.match(url):
                print('noface:' + str(index))
                continue
            path = os.path.join(out_dir, str(index) + ".jpg")
            try:
                # Download to the target location.
                urllib.request.urlretrieve(url, path)
            except (OSError, ValueError) as err:
                # URLError/HTTPError are OSError subclasses; ValueError is
                # raised for malformed URLs. One bad entry must not abort
                # the rest of the run.
                print('failed:' + str(index) + ' ' + str(err))
                continue
            downloaded += 1
            print('succeed:' + str(index))
    return downloaded


def main():
    """Run the download from the project directory, as the script always did."""
    os.chdir(SRC_DIR)
    sys.path.append(SRC_DIR)
    download_faces(FACE_LIST, FACE_DIR)


if __name__ == "__main__":
    main()