juanboy

Merge remote-tracking branch 'origin/main'

@@ -52,7 +52,7 @@ def run_script(): @@ -52,7 +52,7 @@ def run_script():
52 52
53 if __name__ == '__main__': 53 if __name__ == '__main__':
54 scheduler = BackgroundScheduler(timezone=utc) 54 scheduler = BackgroundScheduler(timezone=utc)
55 - scheduler.add_job(run_script, 'interval', minutes=1) 55 + scheduler.add_job(run_script, 'interval', hours=5)
56 scheduler.start() 56 scheduler.start()
57 57
58 try: 58 try:
@@ -2,7 +2,7 @@ import os @@ -2,7 +2,7 @@ import os
2 from sqlalchemy import create_engine 2 from sqlalchemy import create_engine
3 import pandas as pd 3 import pandas as pd
4 from spiderDataPackage.settings import articleAddr,commentsAddr 4 from spiderDataPackage.settings import articleAddr,commentsAddr
5 -from model.topicDefine import * 5 +# from ..model.topicDefine import *
6 6
7 engine = create_engine('mysql+pymysql://XiaoXueQi:XiaoXueQi@47.92.235.6/Weibo_PublicOpinion_AnalysisSystem?charset=utf8mb4') 7 engine = create_engine('mysql+pymysql://XiaoXueQi:XiaoXueQi@47.92.235.6/Weibo_PublicOpinion_AnalysisSystem?charset=utf8mb4')
8 8
@@ -29,7 +29,7 @@ def saveData(): @@ -29,7 +29,7 @@ def saveData():
29 29
30 os.remove(articleAddr) 30 os.remove(articleAddr)
31 os.remove(commentsAddr) 31 os.remove(commentsAddr)
32 - update_data() 32 + # update_data()
33 33
34 if __name__ == '__main__': 34 if __name__ == '__main__':
35 saveData() 35 saveData()
@@ -9,7 +9,7 @@ def spiderData(): @@ -9,7 +9,7 @@ def spiderData():
9 print('正在爬取导航栏数据') 9 print('正在爬取导航栏数据')
10 spiderNav() 10 spiderNav()
11 print('正在爬取文章数据') 11 print('正在爬取文章数据')
12 - spiderContent(1,1) 12 + spiderContent(9,1)
13 print('正在爬取文章评论数据') 13 print('正在爬取文章评论数据')
14 spiderComments() 14 spiderComments()
15 15
@@ -90,7 +90,7 @@ def readJson(response,type): @@ -90,7 +90,7 @@ def readJson(response,type):
90 isVip 90 isVip
91 ]) 91 ])
92 92
93 -def start(typeNum=1,pageNum=1): 93 +def start(typeNum=14,pageNum=3):
94 articleUrl = 'https://weibo.com/ajax/feed/hottimeline' 94 articleUrl = 'https://weibo.com/ajax/feed/hottimeline'
95 init() 95 init()
96 typeList = getTypeList() 96 typeList = getTypeList()

1.04 MB | W: | H:

750 KB | W: | H:

  • 2-up
  • Swipe
  • Onion skin
@@ -112,7 +112,7 @@ @@ -112,7 +112,7 @@
112 </a> 112 </a>
113 </li> 113 </li>
114 <li class="px-3 pt-3 pb-2"> 114 <li class="px-3 pt-3 pb-2">
115 - <span class="text-uppercase small font-weight-bold">词云图</span> 115 + <span class="text-uppercase small font-weight-bold">机器学习预测</span>
116 </li> 116 </li>
117 <li class=" sidebar-layout"> 117 <li class=" sidebar-layout">
118 <a href="/page/articleCloud" class="svg-icon"> 118 <a href="/page/articleCloud" class="svg-icon">