juanboy

爬虫结束自动打标注

@@ -69,13 +69,11 @@ def getTopicCreatedAtandpredictData(topic):# 统计特定话题的评论在每 @@ -69,13 +69,11 @@ def getTopicCreatedAtandpredictData(topic):# 统计特定话题的评论在每
69 else: 69 else:
70 createdAt[i[1]] = 1 70 createdAt[i[1]] = 1
71 createdAt = {k: createdAt[k] for k in sorted(createdAt, key=lambda date: datetime.datetime.strptime(date, "%Y-%m-%d"))} 71 createdAt = {k: createdAt[k] for k in sorted(createdAt, key=lambda date: datetime.datetime.strptime(date, "%Y-%m-%d"))}
72 - print(createdAt)  
73 createdAt.update(predict_future_values(createdAt)) 72 createdAt.update(predict_future_values(createdAt))
74 - print(createdAt)  
75 sorted_data = {k: createdAt[k] for k in sorted(createdAt, key=lambda date: datetime.datetime.strptime(date, "%Y-%m-%d"))} 73 sorted_data = {k: createdAt[k] for k in sorted(createdAt, key=lambda date: datetime.datetime.strptime(date, "%Y-%m-%d"))}
76 - return topic,sorted_data  
77 - # return topic,list(createdAt.keys()),list(createdAt.values())  
78 - # return topic, createdAt.items() 74 + result_list = [0] * (len(sorted_data) - 5) + [1] * 5
  75 + return topic,sorted_data,result_list
  76 + # return topic,list(createdAt.keys()),list(createdAt.values()),result_list
79 77
80 def writeTopicsToCSV(topics, file_name): 78 def writeTopicsToCSV(topics, file_name):
81 # 检查文件是否存在,如果存在则附加写入,否则新建一个 79 # 检查文件是否存在,如果存在则附加写入,否则新建一个