# -*- coding: utf-8 -*-
import requests
from bs4 import BeautifulSoup
import json
import time
# http://www.dgtle.com/
# url = 'https://api.yii.dgtle.com/v2/index?token=&perpage=14&page=3&dateline=1530336360'
# Entry URL: first page of the index listing (14 entries per page, empty token).
url = 'https://api.yii.dgtle.com/v2/index?token=&perpage=14&page=1'
# Page counter shared with get_detail(), which declares it global and
# increments it once per fetched page.
page = 1
def get_detail(url):
    """Fetch one page of the index API, print its entries, then fetch the next.

    The response body is parsed as JSON. Its ``'list'`` entries are printed
    one per line as ``{'title', 'image', 'link'}`` dicts, and its
    ``'dateline'`` value is forwarded as the ``dateline`` query parameter of
    the next page request.

    The module-level ``page`` counter is incremented once per call; the
    function calls itself for the following page while ``page < 10``.

    Args:
        url: Full URL of the index API page to fetch.

    Raises:
        KeyError: If the response lacks ``'dateline'`` or ``'list'``, or an
            entry lacks ``'title'``, ``'pic'`` or the id its link needs.
    """
    global page
    wb_data = requests.get(url)
    json_data = json.loads(wb_data.text)
    dateline = json_data['dateline']
    page += 1
    for data in json_data['list']:
        need_data = {
            'title': data['title'],
            'image': data['pic'],
            'link': _build_link(data),
        }
        print(need_data)
    # NOTE(review): the original indentation was lost, so it is unclear
    # whether this pause ran per entry or per page; it is applied once per
    # page here, before any follow-up request.
    time.sleep(1)
    if page < 10:
        print(page)
        next_url = 'https://api.yii.dgtle.com/v2/index?token=&perpage=14&page={}&dateline={}'.format(page, dateline)
        print(next_url)
        get_detail(next_url)


def _build_link(data):
    """Return the public page URL for one index entry, chosen by its 'fid'."""
    fid = data.get('fid')
    if fid == '2':
        return 'http://www.dgtle.com/article-{}-1.html'.format(data['aid'])
    if fid == '160':
        return 'http://news.dgtle.com/thread-{}-1-1.html'.format(data['tid'])
    # The fallback used to be assigned to `url` instead of `link`, which left
    # `link` undefined (NameError) or stale from the previous entry.
    return 'unknow'
# Script entry point: start crawling from the first index page.
if __name__ == '__main__':
    get_detail(url)
'''
{'tid': '989406', 'typeid': '34', 'recommend_add': '7', 'replies': '65', 'author': '小淼-海', 'authorid': '76456', 'special': '', 'fid': '2', 'tviews': '281', 'aid': '24052', 'pic': 'http://s2.dgtle.com/portal/201807/02/125247iwss83sjq234z2p8.png?imageView2/2/w/960/q/100', 'url': '', 'title': '深夜俱乐部丨推荐一部最让你感触的社会现实类电影吧', 'summary': '社会现实类电影是电影品类中的利刃,它们用电影的方式披露现实社会中的一些问题,引发观影者的思考与共鸣。', 'id': '989406', 'dateline': '1530536460', 'height': '1170', 'width': '1770', 'catid': '7', 'type': '生活', 'comment_num': 71, 'views': '2603', 'avatar': 'http://www.dgtle.com/uc_server/avatar.php?uid=76456', 'date': '4 小时前', 'is_recommend': 0, 'class': 'article', 'line': 2}
http://www.dgtle.com/article-24052-1.html
{'tid': '987878', 'typeid': '5', 'recommend_add': '13', 'replies': '14', 'author': '长胖的西瓜', 'authorid': '426655', 'special': '', 'fid': '2', 'tviews': '869', 'aid': '24061', 'pic': 'http://s2.dgtle.com/portal/201807/02/171933xn6x1hczm28kd9t6.jpeg?imageView2/2/w/960/q/100', 'url': '', 'title': '有了这玩意儿,今年的世界杯好看多了', 'summary': '住在出租房里面,哪来电视这种能让我「看世界杯」的科幻玩意儿呢?于是我有了个买投影仪的念头。\r\n', 'id': '987878', 'dateline': '1530523178', 'height': '1171', 'width': '1770', 'catid': '5', 'type': '影音', 'comment_num': 20, 'views': '4889', 'avatar': 'http://www.dgtle.com/uc_server/avatar.php?uid=426655', 'date': '7 小时前', 'is_recommend': 0, 'class': 'article', 'line': 2}
http://www.dgtle.com/article-24061-1.html
{'tid': '989446', 'typeid': '390', 'recommend_add': '9', 'replies': '21', 'author': 'nyctimee', 'authorid': '287129', 'special': '', 'fid': '160', 'tviews': '4734', 'aid': '24056', 'pic': 'http://s2.dgtle.com/portal/201807/02/155800bkkakzjq979vqeje.jpg?imageView2/2/w/590/q/100', 'url': '', 'title': '坚果闹钟式无线充电座,让充电这件小事变得更优雅', 'summary': '这可能是目前为止颜值最高的一款无线充电座。', 'id': '989446', 'dateline': '1530518491', 'height': '2000', 'width': '1999', 'catid': '37', 'type': '产品', 'comment_num': 28, 'views': '1502', 'avatar': 'http://www.dgtle.com/uc_server/avatar.php?uid=287129', 'date': '9 小时前', 'is_recommend': 0, 'class': 'news', 'line': 1, 'cover_name': 'http://s2.dgtle.com/forum/201807/02/142840sujjosavjjcwj3hz.jpg?imageView2/2/w/500/q/100'}
http://news.dgtle.com/thread-989446-1-1.html
{'tid': '989536', 'typeid': '389', 'recommend_add': '6', 'replies': '11', 'author': 'egonHu', 'authorid': '913275', 'special': '', 'fid': '160', 'tviews': '1498', 'aid': '24055', 'pic': 'http://s2.dgtle.com/portal/201807/02/154017s8vsynvs8nofzzjs.jpg?imageView2/2/w/590/q/100', 'url': '', 'title': '斯皮尔伯格监制,《光环》改编美剧 2019 年开拍', 'summary': '早已传言纷纷的《光环》改编电视剧,如今终于尘埃落定。', 'id': '989536', 'dateline': '1530517223', 'height': '855', 'width': '855', 'catid': '37', 'type': '快讯', 'comment_num': 11, 'views': '1116', 'avatar': 'http://www.dgtle.com/uc_server/avatar.php?uid=913275', 'date': '9 小时前', 'is_recommend': 0, 'class': 'news', 'line': 1, 'cover_name': 'http://s2.dgtle.com/forum/201807/02/152244lmlwilhd77ihanyr.jpg?imageView2/2/w/500/q/100'}
http://news.dgtle.com/thread-989536-1-1.html
'''
# Ad-hoc probe: request the first index page once more and print the
# 'dateline' value from its JSON response (the same field get_detail()
# forwards as the `dateline` query parameter of the next page).
# NOTE(review): these statements appear to sit at module level, outside the
# `__main__` guard, so they would also run on import -- confirm.
url = 'https://api.yii.dgtle.com/v2/index?token=&perpage=14&page=1'
wb_data = requests.get(url)
json_data = json.loads(wb_data.text)
print(json_data['dateline'])