From cd135b97b4b355befceb846af2f2f30879cfe5bf Mon Sep 17 00:00:00 2001 From: LeLe <251192913@qq.com> Date: Sat, 19 Oct 2019 16:54:11 +0800 Subject: [PATCH] =?UTF-8?q?=E9=92=88=E5=AF=B9=E5=BE=AE=E4=BF=A1=E8=BF=94?= =?UTF-8?q?=E5=9B=9E=E6=A0=BC=E5=BC=8F=E5=8F=98=E5=8C=96=E4=BF=AE=E6=94=B9?= =?UTF-8?q?app=5Fmsg=5Fext=5Finfo?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- start.py | 23 ++++++++++++----------- 1 file changed, 12 insertions(+), 11 deletions(-) diff --git a/start.py b/start.py index 353d0f3..1286fa7 100644 --- a/start.py +++ b/start.py @@ -128,26 +128,27 @@ def GetArticleList(jsondir): for item in list: #一个item里可能有多篇文章 artidx = 1 #请注意这里的编号只是为了保存html方便,并不对应于真实的文章发文位置(比如头条、次条、3条) comm_msg_info = item["comm_msg_info"] - app_msg_ext_info = item["app_msg_ext_info"] + pubstamp = comm_msg_info["datetime"] pubdate = Timestamp2Datetime(pubstamp) if comm_msg_info["type"] == 49: #49为普通图文类型,还有其他类型,暂不考虑 + app_msg_ext_info = item["app_msg_ext_info"] url = app_msg_ext_info["content_url"] #文章链接 idx = artidx title = app_msg_ext_info["title"] art = Article(url,pubdate,idx,title) ArtList.append(art) print(len(ArtList),pubdate, idx, title) - if app_msg_ext_info["is_multi"] == 1: # 一次发多篇 - artidx += 1 - multi_app_msg_item_list = app_msg_ext_info["multi_app_msg_item_list"] - for subArt in multi_app_msg_item_list: - url =subArt["content_url"] - idx =artidx - title = subArt["title"] - art = Article(url,pubdate,idx,title) - ArtList.append(art) - print(len(ArtList),pubdate, idx, title) + if app_msg_ext_info["is_multi"] == 1: # 一次发多篇 + artidx += 1 + multi_app_msg_item_list = app_msg_ext_info["multi_app_msg_item_list"] + for subArt in multi_app_msg_item_list: + url =subArt["content_url"] + idx =artidx + title = subArt["title"] + art = Article(url,pubdate,idx,title) + ArtList.append(art) + print(len(ArtList),pubdate, idx, title) return ArtList def DownHtmlMain(jsonDir,saveHtmlDir):