# PyBot/GotoSend/M_4hou.py
# -*- coding: utf-8 -*-
2024-12-03 17:33:37 +08:00
import json
import sqlite3
import os
from datetime import datetime, timedelta
def create_database():
    """Create ``./db/4hou.db`` and its ``articles`` table if they are missing.

    The ``./db`` directory is created first because ``sqlite3.connect`` cannot
    create missing parent directories. The table is created with
    ``IF NOT EXISTS``, so calling this function repeatedly is harmless.
    """
    os.makedirs('./db', exist_ok=True)
    conn = sqlite3.connect('./db/4hou.db')
    try:
        # ``with conn`` commits on success and rolls back on error, but it
        # does not close the connection; the ``finally`` clause does that.
        with conn:
            conn.execute('''CREATE TABLE IF NOT EXISTS articles (
                id INTEGER PRIMARY KEY AUTOINCREMENT,
                title TEXT,
                link TEXT,
                description TEXT,
                pubDate DATETIME,
                author TEXT
            )''')
    finally:
        conn.close()
def insert_data(data):
    """Insert article entries into the ``articles`` table of ``./db/4hou.db``.

    Args:
        data: Iterable of dicts providing the keys ``title``, ``link``,
            ``description``, ``pubDate`` and ``author``.

    A ``pubDate`` in the form ``Tue, 03 Dec 2024 17:33:37 +0800`` is converted
    to the machine's local time and stored as ``YYYY-MM-DD HH:MM:SS``. Local
    time is used because the time-window query in this file compares against
    a naive ``datetime.now()``; simply dropping the UTC offset would shift
    articles whose feed offset differs from the local one. Any value that
    cannot be parsed (including ``None``) is stored unchanged.

    Raises:
        KeyError: If an entry lacks one of the required keys.
        sqlite3.Error: If the insert fails; nothing is committed in that case.
    """
    rows = []
    for entry in data:
        raw_pub_date = entry['pubDate']
        try:
            parsed = datetime.strptime(raw_pub_date, '%a, %d %b %Y %H:%M:%S %z')
        except (ValueError, TypeError):
            # Unparseable or non-string value: keep it exactly as received.
            stored_pub_date = raw_pub_date
        else:
            # astimezone() with no argument converts to the local timezone.
            stored_pub_date = parsed.astimezone().strftime('%Y-%m-%d %H:%M:%S')
        rows.append((
            entry['title'],
            entry['link'],
            entry['description'],
            stored_pub_date,
            entry['author'],
        ))

    conn = sqlite3.connect('./db/4hou.db')
    try:
        # Commit on success, roll back on error; always close afterwards.
        with conn:
            conn.executemany('''
                INSERT INTO articles (title, link, description, pubDate, author)
                VALUES (?, ?, ?, ?, ?)
            ''', rows)
    finally:
        conn.close()
def get_4hou_json():
    """Load ``./JSON/4hou.json`` and return its items as numbered entries.

    Returns:
        A list of dicts with the keys ``id`` (1-based position in the file),
        ``title``, ``link``, ``description``, ``pubDate`` and ``author``.
        Fields missing from an item default to the empty string.

    Raises:
        FileNotFoundError: If the JSON file does not exist.
        ValueError: If the top-level JSON value is not a list.
    """
    json_path = './JSON/4hou.json'
    if not os.path.exists(json_path):
        raise FileNotFoundError("4hou.json文件不存在请检查程序是否运行正常")

    with open(json_path, 'r', encoding='utf-8') as handle:
        items = json.load(handle)

    # The file is expected to hold a list of JSON objects.
    if not isinstance(items, list):
        raise ValueError("JSON文件格式错误请检查common.py是否异常")

    # Copy only the fields of interest, prefixed with a running number.
    wanted_fields = ("title", "link", "description", "pubDate", "author")
    return [
        {"id": number, **{field: item.get(field, "") for field in wanted_fields}}
        for number, item in enumerate(items, start=1)
    ]
2024-12-04 17:21:26 +08:00
def select_articles(e_hour):
    """Return the articles whose ``pubDate`` lies within the last ``e_hour`` hours.

    Args:
        e_hour: Length of the look-back window in hours, counted back from
            the current local time.

    Returns:
        A list of row tuples from the ``articles`` table of ``./db/4hou.db``
        (all columns, as returned by ``SELECT *``).
    """
    time_format = '%Y-%m-%d %H:%M:%S'
    end_time = datetime.now()
    start_time = end_time - timedelta(hours=e_hour)

    conn = sqlite3.connect('./db/4hou.db')
    try:
        # pubDate is stored as 'YYYY-MM-DD HH:MM:SS' text, so the BETWEEN
        # comparison on equally formatted strings orders chronologically.
        cursor = conn.execute('''
            SELECT * FROM articles
            WHERE pubDate BETWEEN ? AND ?
        ''', (start_time.strftime(time_format), end_time.strftime(time_format)))
        return cursor.fetchall()
    finally:
        # Close the connection even when the query raises.
        conn.close()
def clear_table():
    """Delete every row from the ``articles`` table of ``./db/4hou.db``.

    The table itself is kept; only its contents are removed.
    """
    conn = sqlite3.connect('./db/4hou.db')
    try:
        # Commit on success, roll back on error; the connection is closed
        # in ``finally`` so it is released even if the DELETE fails.
        with conn:
            conn.execute('DELETE FROM articles')
    finally:
        conn.close()
2024-12-10 11:49:15 +08:00
def record_md(result, filename="./history/sec_news.md"):
    """Prepend ``result`` to the Markdown history file.

    Args:
        result: Text to place at the very beginning of the file.
        filename: Path of the history file. The file and its parent
            directory are created when they do not exist yet.
    """
    # Opening the file for writing fails if its directory is missing, so
    # make sure the directory exists first.
    parent_dir = os.path.dirname(filename)
    if parent_dir:
        os.makedirs(parent_dir, exist_ok=True)

    try:
        with open(filename, 'r', encoding='utf-8') as file:
            existing_content = file.read()
    except FileNotFoundError:
        # First run: there is no history to keep.
        existing_content = ""

    # Newest content goes first, followed by everything recorded earlier.
    with open(filename, 'w', encoding='utf-8') as file:
        file.write(result + existing_content)
2024-12-03 17:33:37 +08:00
def get_filtered_articles(entries):
    """Format article rows as plain text and record them as Markdown.

    Args:
        entries: Iterable of row sequences; index 1 is used as the title,
            2 as the link, 4 as the publication time and 5 as the author.

    Returns:
        The plain-text rendering of all entries, each followed by a
        40-dash separator line. The Markdown rendering of the same entries
        is passed to ``record_md`` once, after all entries are formatted.
    """
    # Separator that sets one article apart from the next.
    divider = "\n" + "-" * 40 + "\n"
    text_chunks = []
    markdown_chunks = []

    for row in entries:
        title, link, pub_date, author = row[1], row[2], row[4], row[5]
        text_chunks.append(
            f"作者:{author}\n文章:{title}\n"
            f"链接:{link}\n上传时间:{pub_date}\n"
            + divider
        )
        markdown_chunks.append(
            f"#### 文章:{title}\n"
            f"**作者**{author}\n"
            f"**链接**{link}\n"
            f"**上传时间**{pub_date}\n"
            + divider
        )

    record_md("".join(markdown_chunks))
    return "".join(text_chunks)
2024-12-04 17:21:26 +08:00
def Src_4hou(e_hour):
    """Reload the 4hou articles into the database and report the recent ones.

    Args:
        e_hour: Look-back window in hours, forwarded to ``select_articles``.

    Returns:
        The formatted text produced by ``get_filtered_articles`` for the
        articles inside the window, or ``""`` when there are none.
    """
    # Create the database and its table only when the file is absent.
    database_missing = not os.path.exists('./db/4hou.db')
    if database_missing:
        create_database()

    # Start from an empty table, then load the current JSON snapshot.
    clear_table()
    insert_data(get_4hou_json())

    # Keep only the articles published inside the requested window.
    recent_articles = select_articles(e_hour)
    if not recent_articles:
        return ""
    return get_filtered_articles(recent_articles)
if __name__ == "__main__":
    # Manual run: report the articles from the last four hours.
    output = Src_4hou(4)
    if output == "":
        # Nothing to report, so skip sending.
        print("-" * 40)
        print("嘶吼数据为空,跳过执行。")
    else:
        print(output)
2024-12-03 17:33:37 +08:00