@pxaklbe 通过文件获取关键词是没问题的



我用关键词“一个”、日期 2017-02-26 进行了测试,设置如下:

keywords = ['一个']
start_time = datetime.datetime(year=2017, month=2, day=26, hour=0)
end_time = datetime.datetime(year=2017, month=2, day=27, hour=0)
is_split_by_hour = True


{"_id": "4079206164329661", "mblogid": "ExevSialf", "created_at": "2017-02-26 01:00:00", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "HUAWEI G9 青春版", "content": "hjsh//@小螃蟹喵:Forever Love KARRY //@王俊凯的凯喵战队:#王俊凯的小棉袄# &#王俊凯# 从《摩天轮的思念》《树读》到现在的《小棉袄》王俊凯的每一首歌都有自己独特的风格,唱功也是发挥到了极致,期待歌手王俊凯的下一个作品[鼓掌]@TFBOYS-王俊凯", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "5596052053", "avatar_hd": ",tva&Expires=1707849492&ssig=3JGlGSrFLI", "nick_name": "小螃蟹喵", "verified": true, "mbrank": 7, "mbtype": 12, "verified_type": 0}, "url": "", "retweet_id": "4007589602317195", "keyword": "一个", "crawl_time": 1707838692}
{"_id": "4079221258676363", "mblogid": "ExeUdAp7l", "created_at": "2017-02-26 02:00:00", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 1, "source": "weishoot", "content": "微摄(App)是一个分享图片就能直接赚钱的平台。这里给所有人带来了意想不到的惊喜!赶快用手机分享您的图片吧! ", "pic_urls": [""], "pic_num": 1, "isLongText": false, "is_retweet": false, "user": {"_id": "1730283472", "avatar_hd": ",tva&Expires=1707849492&ssig=%2B0UFeB1c6r", "nick_name": "何世红cfn", "verified": true, "mbrank": 4, "mbtype": 2, "verified_type": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838693}
{"_id": "4079251441479623", "mblogid": "ExfGU6cUT", "created_at": "2017-02-26 03:59:55", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "皮皮时光机", "content": "英国人曼吉特·辛格被认为拥有世界上最大的肺活量。1998年9月,他在42分钟内吹出了一个直径2.44米的大气球,其重量有1千克。 ", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": false, "user": {"_id": "5561059755", "avatar_hd": ",tva&Expires=1707849495&ssig=dOJgPAo%2BeJ", "nick_name": "风土情网", "verified": true, "mbrank": 0, "mbtype": 0, "verified_type": 2}, "url": "", "keyword": "一个", "crawl_time": 1707838695}
{"_id": "4079266549050925", "mblogid": "Exg5gBYyF", "created_at": "2017-02-26 04:59:57", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 1, "attitudes_count": 1, "source": "微博", "content": "同意,拍的挺好的。//@和顺安稳: http://叶泳湘,有“现代小龙女”、“当代宫二”之誉。。功夫如何不知道,但如能推广太极拳,培养太极人口,也挺好~//@安般太极拳: //@喝茶的太极猫: 陈式被大师金刚吹死了,现在杨式也被新秀开吹了。年轻女子没有一个有功夫的,只有会打扮和跳舞的", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "1594481374", "avatar_hd": ",tva&Expires=1707849496&ssig=YLKN1HAGtW", "nick_name": "安般太极拳", "verified": true, "mbrank": 2, "mbtype": 2, "verified_type": 0}, "video": ",video", "url": "", "retweet_id": "4078354791868311", "keyword": "一个", "crawl_time": 1707838696}
{"_id": "4079251441591651", "mblogid": "ExfGU6G3N", "created_at": "2017-02-26 03:59:55", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "皮皮时光机", "content": "【美胸金标准】丰满、匀称、柔韧而富有弹性;两侧乳房大小、形状、位置均对称一致,两乳间距离大于20厘米;乳房基底面直径在10-12厘米,从基底面至乳头的高度为5-6厘米;乳房挺拔,环差为17-20厘米;两个乳头与胸骨切迹成一个等边三角形。你是美胸吗? ", "pic_urls": [""], "pic_num": 1, "isLongText": false, "is_retweet": false, "user": {"_id": "3771186273", "avatar_hd": ",tva&Expires=1707849497&ssig=rrsO56A4PP", "nick_name": "御姐控的cinderella2", "verified": true, "mbrank": 0, "mbtype": 0, "verified_type": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838697}
{"_id": "4079326959727955", "mblogid": "ExhEHEOGv", "created_at": "2017-02-26 08:59:59", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "小米手机5", "content": "//@千玺周刊_Memory-of-Jackson:从前车🚗、马[草泥马]、邮件[礼物]都很慢,一个月[月亮]的流量☔只够等一个人[NO]。", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "3844080608", "avatar_hd": ",tva&Expires=1707849501&ssig=2VHdIZMrPp", "nick_name": "就问你我萌不萌呀", "verified": true, "mbrank": 1, "mbtype": 2, "verified_type": 0}, "url": "", "retweet_id": "4079164539223533", "keyword": "一个", "crawl_time": 1707838701}
{"_id": "4079357154410434", "mblogid": "Exirpivm2", "created_at": "2017-02-26 10:59:59", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 4, "attitudes_count": 1, "source": "", "content": "【投稿】 之前喜欢一个男生嘛 然后表白到现在大概快三个月了(现在想来应该也不是喜欢吧just一点点好感而被怂恿了)然后后来因为这个男生和我三观不合 平常无话可说都是我尬聊 对我的态度也很迷...他和别的女生暧昧啥的反正槽点很多的 于是我想通了放弃了 简直可喜可贺 中途因为他难过了好多次啊困惑了好久啊还投稿了好多次。 然后这个男生却和我说既然追了  然后放弃他这样可能让我名声不好??EXO ME? 谁爱倒贴谁倒贴吧老娘不玩了。而且说实话我长得挺不错但是他长得丑..被朋友一直骂说我瞎了我还能坚持着我也不知道当时怎么想。。真的好后悔之前为什么会看上这种人。希望小仙女们擦亮眼睛啊~不要太辛苦! 不过也明白了我也有错吧不该没弄清楚", "pic_urls": [], "pic_num": 0, "isLongText": true, "is_retweet": false, "user": {"_id": "6007173471", "avatar_hd": ",tva&Expires=1707849503&ssig=IlFJYSe6c9", "nick_name": "说给可爱的你", "verified": true, "mbrank": 6, "mbtype": 2, "verified_type": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838705}
{"_id": "4079402457673592", "mblogid": "ExjCtwcfC", "created_at": "2017-02-26 14:00:00", "geo": null, "ip_location": null, "reposts_count": 3, "comments_count": 0, "attitudes_count": 0, "source": "Android", "content": "#冯绍峰# #冯绍峰吴居蓝# #冯绍峰那片星空那片海# 每个表情都透着一个字 帅[舔屏]", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "1694857804", "avatar_hd": ",tva&Expires=1707849507&ssig=A7QdeX19jv", "nick_name": "我峰美如画", "verified": false, "mbrank": 7, "mbtype": 2}, "url": "", "retweet_id": "4079384837496640", "keyword": "一个", "crawl_time": 1707838707}
{"_id": "4079432656619837", "mblogid": "ExkpbrM7z", "created_at": "2017-02-26 15:59:59", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 1, "source": "微博", "content": "//@Kingkill33: //@_大大小咩:拉低中奖率 //@百里蝎尾狮:截止到今晚十二点瞎基霸随机抽一个100软妹币和摸鱼儿[doge]", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "2672145682", "avatar_hd": ",tva&Expires=1707849508&ssig=nAj%2BHN5Dy7", "nick_name": "Egoso", "verified": true, "mbrank": 5, "mbtype": 2, "verified_type": 0}, "url": "", "retweet_id": "4079176438346631", "keyword": "一个", "crawl_time": 1707838708}
{"_id": "4079432656989113", "mblogid": "ExkpbtkbD", "created_at": "2017-02-26 16:00:00", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "iPhone 7", "content": "卧槽 想起我两个高中化学老师😱😱😱😱😱😱 //@北美吐槽君://@隐浮斋子: 同右[笑cry]//@Lamb_babi:[摊手]我认识一个化学博士 几乎不长头发 也没有指纹…", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "1635758035", "avatar_hd": ",tva&Expires=1707849509&ssig=n2xqxZsAgg", "nick_name": "Nomi_Ryu", "verified": true, "mbrank": 0, "mbtype": 0, "verified_type": 0}, "url": "", "retweet_id": "4079342742435038", "keyword": "一个", "crawl_time": 1707838709}
{"_id": "4079251433089402", "mblogid": "ExfGTcXH4", "created_at": "2017-02-26 03:59:53", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 1, "attitudes_count": 1, "source": "🦁iPhone 6s Plus", "content": "我以前打死抽不出古笼火最后拼了一个 今天连着抽两个全是古笼火 这是不是bug ", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": false, "user": {"_id": "1567106610", "avatar_hd": ",tva&Expires=1707849519&ssig=8%2B6uOfbHAM", "nick_name": "猫警官", "verified": false, "mbrank": 7, "mbtype": 12}, "url": "", "keyword": "一个", "crawl_time": 1707838720}
{"_id": "4079357155184899", "mblogid": "ExirplKPp", "created_at": "2017-02-26 10:59:59", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "微博", "content": "//@Maslow得不到需要: #日常一稳#//@繁柏:#传销理论#//@白水攻玉:21天以上的重复会形成习惯;90天的重复会形成稳定的习惯,任何一个想法重复验证21次,就会变成习惯性想法。所以,一个观念如果被别人或者自己验证了21次以上,它一定已经变成了你的信念。 #以上,是我赧于自己依旧真情实感的甩锅#", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "2244663813", "avatar_hd": ",tva&Expires=1707849523&ssig=eRoFAA1hZi", "nick_name": "dian5200", "verified": true, "mbrank": 7, "mbtype": 12, "verified_type": 0}, "url": "", "retweet_id": "4079227038733267", "keyword": "一个", "crawl_time": 1707838723}
{"_id": "4079206155411695", "mblogid": "ExevRmHPp", "created_at": "2017-02-26 00:59:58", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 2, "source": "微博视频号", "content": "#健康美食专属#【日本整脊大师教大家“睡前花3分钟做一个动作”】这个优质睡眠减脂法结果惊人,大家可以试试!转给睡眠不好的童鞋! ![话筒] ", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": false, "user": {"_id": "3988622116", "avatar_hd": ",tva&Expires=1707849525&ssig=1DGKaC9Mrm", "nick_name": "寻香美食", "verified": true, "mbrank": 7, "mbtype": 2, "verified_type": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838725}
{"_id": "4079402448978818", "mblogid": "ExjCsBFNE", "created_at": "2017-02-26 13:59:58", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "OPPO R9", "content": "59//@唯易wJ:做你最坚强的底气//@红色炒黄色975:我一直在期待,期待每一个你//@易烊千玺战斗鹤:#北鼻放开那个易烊千玺让我来##一心一意,易烊千玺##我想听你说#期待着小哥哥的福利 北鼻。。。幸福的等待[鲜花][鲜花][鲜花]@TFBOYS-易烊千玺 #你说-易烊千玺[音乐]#", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "5505474944", "avatar_hd": ",tva&Expires=1707849528&ssig=HB48uVJnb9", "nick_name": "唯易wJ", "verified": true, "mbrank": 7, "mbtype": 12, "verified_type": 0}, "url": "", "retweet_id": "4077028422614598", "keyword": "一个", "crawl_time": 1707838728}
{"_id": "4079432647823212", "mblogid": "ExkpawPaQ", "created_at": "2017-02-26 15:59:58", "geo": null, "ip_location": null, "reposts_count": 9, "comments_count": 9, "attitudes_count": 1, "source": "iPhone 6", "content": "#洛阳生活# 【二月二龙抬头一起来拔头彩】八三哥的御用理发师来(洗剪吹.造型.头发护理.蜡染等等)送2017新年第一波福利,二月二龙抬头**人的吉祥习俗,在这一天剪头寓意全年一切顺利!啥也不说,先上福利现在转发微博 @ 一个你想让TA新年抬头的人,并说出【角度造型】的位置,1.二月二当天剪头剪一送一,2.持本条微博二月二当天冲100元送100元,在加送一次剪头,3.还有机会获得100元任意消费现金卡,有3个名额呢[嘻嘻]坐标:南昌路与丽川路口向西20米(丹尼斯北隔壁)以下真实拍摄未经加工!", "pic_urls": ["", "", "", "", "", "", "", "", ""], "pic_num": 9, "isLongText": true, "is_retweet": false, "user": {"_id": "1747263521", "avatar_hd": ",tva&Expires=1707849530&ssig=%2BcvisFjexq", "nick_name": "一米八三Mr", "verified": true, "mbrank": 7, "mbtype": 2, "verified_type": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838731}
{"_id": "4079508154284339", "mblogid": "ExmmXhYyf", "created_at": "2017-02-26 21:00:00", "geo": null, "ip_location": null, "reposts_count": 1, "comments_count": 0, "attitudes_count": 1, "source": "药哥的Android", "content": "我家大阪城全特么枪爹[摊手]一个都没掉 我不会啥玩意没有就毕业吧[摊手][摊手][摊手] ", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": false, "user": {"_id": "2116120665", "avatar_hd": ",tva&Expires=1707849532&ssig=LblD8OIFlk", "nick_name": "Cantus龄澜_", "verified": true, "mbrank": 7, "mbtype": 2, "verified_type": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838732}
{"_id": "4079538353056258", "mblogid": "Exn9FcP4u", "created_at": "2017-02-26 23:00:00", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "微博", "content": "等等病了,爸爸平均一个小时要问800次,要不要去医院,而妈妈呢,就一直强调,问过医生了,说没事,就让他自愈吧?喝水,喝小米汤就好,相比之下我觉得我不像个亲妈 ", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": false, "user": {"_id": "6043349284", "avatar_hd": ",tva&Expires=1707849535&ssig=SfPw%2FK2U2h", "nick_name": "VPN造型-波比", "verified": false, "mbrank": 0, "mbtype": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838735}
{"_id": "4079206151405243", "mblogid": "ExevR5Tzd", "created_at": "2017-02-26 00:59:57", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "OPPO R9", "content": "凤九与帝君的爱情就是再说,爱一个值得爱的人,明知无缘无分也要拼尽全力要和你在一起,就算三生石上没有你我的名字!#凤九断尾##三生三世十里桃花电视剧#  ", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": false, "user": {"_id": "3506662794", "avatar_hd": ",tva&Expires=1707849538&ssig=6J2LK5NhAm", "nick_name": "多阅DooYea", "verified": true, "mbrank": 0, "mbtype": 0, "verified_type": 2}, "url": "", "keyword": "一个", "crawl_time": 1707838738}
{"_id": "4079432643780585", "mblogid": "ExkpafRvb", "created_at": "2017-02-26 15:59:57", "geo": null, "ip_location": null, "reposts_count": 1, "comments_count": 3, "attitudes_count": 1, "source": "微博", "content": "很炫的机车,更炫的改装车,漂亮的老婆~就一个字:小编很羡慕~#长沙婚纱照# #长沙摄影工作室# #长沙情侣照# ", "pic_urls": ["", "", "", ""], "pic_num": 4, "isLongText": false, "is_retweet": false, "user": {"_id": "5619759506", "avatar_hd": ",tva&Expires=1707849540&ssig=hm2CzUS0Xb", "nick_name": "长沙V格摄婚纱摄影", "verified": true, "mbrank": 7, "mbtype": 2, "verified_type": 2}, "url": "", "keyword": "一个", "crawl_time": 1707838740}
{"_id": "4079206147533843", "mblogid": "ExevQvBTB", "created_at": "2017-02-26 00:59:56", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 0, "source": "HUAWEI G9 青春版", "content": "//@小螃蟹喵:Forever Love KARRY //@王俊凯的凯喵战队:#王俊凯的小棉袄# &#王俊凯# 从《摩天轮的思念》《树读》到现在的《小棉袄》王俊凯的每一首歌都有自己独特的风格,唱功也是发挥到了极致,期待歌手王俊凯的下一个作品[鼓掌]@TFBOYS-王俊凯", "pic_urls": [], "pic_num": 0, "isLongText": false, "is_retweet": true, "user": {"_id": "5596052053", "avatar_hd": ",tva&Expires=1707849542&ssig=dYB6yngJr0", "nick_name": "小螃蟹喵", "verified": true, "mbrank": 7, "mbtype": 12, "verified_type": 0}, "url": "", "retweet_id": "4007589602317195", "keyword": "一个", "crawl_time": 1707838742}
{"_id": "4079206138619088", "mblogid": "ExevPAady", "created_at": "2017-02-26 00:59:54", "geo": null, "ip_location": null, "reposts_count": 0, "comments_count": 0, "attitudes_count": 1, "source": "皮皮时光机", "content": "这一切悲剧随生命终结的时候,萧红才31岁,而我们每一个人31岁时,还在犯着多少愚蠢的错误。即使在今天,**的女儿们仍然背负着重重历史债务。自由从来不容易,不是一个姿态,一个手势,自由是永恒的克服重力,挣扎着向上飞行。——郭玉洁《众声》 ", "pic_urls": [""], "pic_num": 1, "isLongText": false, "is_retweet": false, "user": {"_id": "5278229399", "avatar_hd": ",tva&Expires=1707849544&ssig=SoKeL7ux1P", "nick_name": "语录颂", "verified": true, "mbrank": 1, "mbtype": 2, "verified_type": 0}, "url": "", "keyword": "一个", "crawl_time": 1707838744}

