Skip to content

Commit

Permalink
增加异常处理(bug并未修复)
Browse files Browse the repository at this point in the history
  • Loading branch information
wjllp committed Jul 11, 2018
1 parent 8ac6b12 commit 3778a93
Show file tree
Hide file tree
Showing 2 changed files with 555 additions and 39 deletions.
26 changes: 18 additions & 8 deletions douyin.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@
session = requests.session()
#保存url的文件名
filename = "urls.txt"
c = 0
def start(userid,count):
#一次请求最多能获取到的url数
maxCount = 35
Expand All @@ -13,36 +14,45 @@ def start(userid,count):
#初始游标为0
max_cursor = 0
for i in range(0,page):
print ('此时count为:',count)
print ('当前游标为:',max_cursor)
#如果需获取的视频数大于最大能获取的数,则传入maxCount,并减小count的值
if (count > maxCount):
max_cursor = download(userid,maxCount,max_cursor)
count = count - maxCount
#最后count被减到小于maxCount的时候,传入count
else:
max_cursor = download(userid,count,max_cursor)
max_cursor = download(userid,count,max_cursor)

#参数:用户id,用于下载指定用户的收藏视频。count:下载数量。max_cursor:游标
def download(userid,count,max_cursor):
global c
url = 'https://www.douyin.com/aweme/v1/aweme/favorite/?user_id='+str(userid)+'&count='+str(count+1)+'&max_cursor='+str(max_cursor)+'&aid=1128'
#get请求,并保存响应报文
resp = session.get(url)
#解析http报文
soup = BeautifulSoup(resp.text, 'html.parser')
#解析json
#将字符串转为json
myjson = json.loads(str(soup))
#获取游标,用于解析下一页视频
max_cursor = myjson['max_cursor']
with open(filename,"a+") as f:
for i in range(0,count):
#解析json数据
video_url = myjson['aweme_list'][i]['video']['play_addr']['url_list'][0]
print (myjson['aweme_list'][i]['video']['play_addr']['url_list'][0])
#写入文件
f.write(video_url+"\n")
try:
#解析json数据
video_url = myjson['aweme_list'][i]['video']['play_addr']['url_list'][0]
#写入文件
f.write(video_url+"\n")
except:
print("json第",c,"次解析时解析出错...")
finally:
c = c + 1
print (video_url)

#关闭文件
f.close()
#返回游标
return max_cursor
if __name__ == '__main__':
#参数一:用户id,参数2:你想下载的视频个数
start(84064249580,100)
start(84064249580,500)
Loading

0 comments on commit 3778a93

Please sign in to comment.