该楼层疑似违规已被系统折叠 隐藏此楼查看此楼

import requests

from lxml import etree

import pymongo

# Connection to the MongoDB server on the local machine (default port).
client = pymongo.MongoClient(host='localhost', port=27017)

# Database that holds the scraped data.
mydb = client.get_database('mydb')

# Collection that receives one document per timeline entry.
timeline = mydb.get_collection('timeline')

def get_time_info(url, page):
    """Crawl a Jianshu user timeline and store each entry in MongoDB.

    Starting at ``url``, every page is fetched and each ``<li>`` below the
    ``note-list`` list is inserted into the module-level ``timeline``
    collection as ``{'date': ..., 'type': ...}``. The next page is then
    requested, and crawling stops once a page yields at most one entry.

    Args:
        url: Timeline URL to start from. The user id is taken from the
            fifth ``/``-separated component of the URL, i.e. the path
            segment after ``/users/`` in ``http://host/users/<id>/timeline``.
        page: Page number of ``url``; the following request asks for
            ``page + 1``.

    Raises:
        IndexError: If ``url`` has fewer than five ``/``-separated parts,
            or the last entry id on a page contains no ``-``.
        requests.exceptions.RequestException: If a page cannot be fetched,
            including when the request times out.
    """
    # The user id is the same for every page, so extract it only once.
    user_id = url.split('/')[4]

    # Walk the pages in a loop instead of recursing: one stack frame per
    # page would hit the interpreter's recursion limit on long timelines.
    while True:
        # The original guard `if url.find('page='):` was true for every
        # timeline URL (str.find returns -1, which is truthy, when the
        # substring is absent), so the counter was always advanced.
        page += 1

        # A timeout keeps a stalled connection from blocking forever.
        html = requests.get(url, timeout=30)
        selector = etree.HTML(html.text)
        infos = selector.xpath('//ul[@class="note-list"]/li')

        for info in infos:
            dates = info.xpath('div/div/div/span/@data-datetime')
            kinds = info.xpath('div/div/div/span/@data-type')
            # Skip entries that lack either attribute rather than aborting
            # the whole crawl with an IndexError.
            if not dates or not kinds:
                continue
            timeline.insert_one({'date': dates[0], 'type': kinds[0]})

        # A page with zero or one entry marks the end of the timeline.
        if len(infos) <= 1:
            return

        id_infos = selector.xpath('//ul[@class="note-list"]/li/@id')
        if not id_infos:
            # Without an entry id there is no cursor for the next page.
            return

        # The part after the first '-' of the last entry's id is passed
        # as max_id to request the following page.
        max_id = id_infos[-1].split('-')[1]
        url = 'http://www.jianshu.com/users/%s/timeline?max_id=%s&page=%s' % (user_id, max_id, page)

if __name__ == '__main__':
    # Script entry point: crawl this user's timeline, starting at page 1.
    get_time_info(
        'http://www.jianshu.com/users/9104ebf5e177/timeline',
        1,
    )

Logo

魔乐社区(Modelers.cn)是一个中立、公益的人工智能社区,提供人工智能工具、模型、数据的托管、展示与应用协同服务,为人工智能开发者及爱好者搭建开放的学习交流平台。社区通过理事会方式运作,由全产业链共同建设、共同运营、共同享有,推动国产AI生态繁荣发展。

更多推荐