Commit 48c53bef authored by liyang

feat:1.编写自由时报爬虫脚本

2.编写数据量统计脚本
parent f0e81304
......@@ -156,7 +156,7 @@ def reptile(browser=None, search_word=""):
script_close(browser)
else:
# 爬取数据为空
log.info("未爬取到数据")
log.info("no reptile data")
# 删除目录
delete_directory(local_path)
script_close(browser)
......
......@@ -127,7 +127,7 @@ def parse_ltn_time_string(time_str):
number = int(time_str.split("小時")[0])
time_delta = datetime.timedelta(hours=number)
return int((datetime.datetime.now() + time_delta).timestamp())
else:
elif "月" in time_str and "日" in time_str:
try:
datetime_str = time_str.replace("月", " ").replace("日", "")
month, day = map(int, datetime_str.split())
......@@ -136,6 +136,9 @@ def parse_ltn_time_string(time_str):
return int(datetime_obj.timestamp())
except ValueError:
return None
else:
# print(time_str)
return datetime.datetime.strptime(time_str, '%Y/%m/%d')
# 转换 youtube 的时间
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment