Showing 8 changed files with 6 additions and 6 deletions
| @@ -52,7 +52,7 @@ def run_script(): | @@ -52,7 +52,7 @@ def run_script(): | ||
| 52 | 52 | ||
| 53 | if __name__ == '__main__': | 53 | if __name__ == '__main__': |
| 54 | scheduler = BackgroundScheduler(timezone=utc) | 54 | scheduler = BackgroundScheduler(timezone=utc) |
| 55 | - scheduler.add_job(run_script, 'interval', minutes=1) | 55 | + scheduler.add_job(run_script, 'interval', hours=5) |
| 56 | scheduler.start() | 56 | scheduler.start() |
| 57 | 57 | ||
| 58 | try: | 58 | try: |
model/__init__.py
0 → 100644
spider/__init__.py
0 → 100644
| @@ -2,7 +2,7 @@ import os | @@ -2,7 +2,7 @@ import os | ||
| 2 | from sqlalchemy import create_engine | 2 | from sqlalchemy import create_engine |
| 3 | import pandas as pd | 3 | import pandas as pd |
| 4 | from spiderDataPackage.settings import articleAddr,commentsAddr | 4 | from spiderDataPackage.settings import articleAddr,commentsAddr |
| 5 | -from model.topicDefine import * | 5 | +# from ..model.topicDefine import * |
| 6 | 6 | ||
| 7 | engine = create_engine('mysql+pymysql://XiaoXueQi:XiaoXueQi@47.92.235.6/Weibo_PublicOpinion_AnalysisSystem?charset=utf8mb4') | 7 | engine = create_engine('mysql+pymysql://XiaoXueQi:XiaoXueQi@47.92.235.6/Weibo_PublicOpinion_AnalysisSystem?charset=utf8mb4') |
| 8 | 8 | ||
| @@ -29,7 +29,7 @@ def saveData(): | @@ -29,7 +29,7 @@ def saveData(): | ||
| 29 | 29 | ||
| 30 | os.remove(articleAddr) | 30 | os.remove(articleAddr) |
| 31 | os.remove(commentsAddr) | 31 | os.remove(commentsAddr) |
| 32 | - update_data() | 32 | + # update_data() |
| 33 | 33 | ||
| 34 | if __name__ == '__main__': | 34 | if __name__ == '__main__': |
| 35 | saveData() | 35 | saveData() |
| @@ -9,7 +9,7 @@ def spiderData(): | @@ -9,7 +9,7 @@ def spiderData(): | ||
| 9 | print('正在爬取导航栏数据') | 9 | print('正在爬取导航栏数据') |
| 10 | spiderNav() | 10 | spiderNav() |
| 11 | print('正在爬取文章数据') | 11 | print('正在爬取文章数据') |
| 12 | - spiderContent(1,1) | 12 | + spiderContent(9,1) |
| 13 | print('正在爬取文章评论数据') | 13 | print('正在爬取文章评论数据') |
| 14 | spiderComments() | 14 | spiderComments() |
| 15 | 15 |
| @@ -90,7 +90,7 @@ def readJson(response,type): | @@ -90,7 +90,7 @@ def readJson(response,type): | ||
| 90 | isVip | 90 | isVip |
| 91 | ]) | 91 | ]) |
| 92 | 92 | ||
| 93 | -def start(typeNum=1,pageNum=1): | 93 | +def start(typeNum=14,pageNum=3): |
| 94 | articleUrl = 'https://weibo.com/ajax/feed/hottimeline' | 94 | articleUrl = 'https://weibo.com/ajax/feed/hottimeline' |
| 95 | init() | 95 | init() |
| 96 | typeList = getTypeList() | 96 | typeList = getTypeList() |
| @@ -112,7 +112,7 @@ | @@ -112,7 +112,7 @@ | ||
| 112 | </a> | 112 | </a> |
| 113 | </li> | 113 | </li> |
| 114 | <li class="px-3 pt-3 pb-2"> | 114 | <li class="px-3 pt-3 pb-2"> |
| 115 | - <span class="text-uppercase small font-weight-bold">词云图</span> | 115 | + <span class="text-uppercase small font-weight-bold">机器学习预测</span> |
| 116 | </li> | 116 | </li> |
| 117 | <li class=" sidebar-layout"> | 117 | <li class=" sidebar-layout"> |
| 118 | <a href="/page/articleCloud" class="svg-icon"> | 118 | <a href="/page/articleCloud" class="svg-icon"> |
-
Please register or login to post a comment