PyBot/GotoSend/freebuf.py

163 lines
5.0 KiB
Python
Raw Normal View History

2024-12-06 16:32:34 +08:00
# -*- coding: utf-8 -*-
2024-12-05 00:03:51 +08:00
import json
import sqlite3
import os
from datetime import datetime, timedelta
def create_database():
    """Create ``./db/freebuf.db`` and its ``articles`` table if they are missing.

    The table has the columns ``id`` (autoincrement primary key), ``title``,
    ``link``, ``description``, ``pubDate`` and ``category``. Calling this
    function again when the table already exists is a no-op.
    """
    # sqlite3.connect() creates the database file but not its parent
    # directory, so make sure ./db exists first.
    os.makedirs('./db', exist_ok=True)
    conn = sqlite3.connect('./db/freebuf.db')
    try:
        cursor = conn.cursor()
        cursor.execute('''CREATE TABLE IF NOT EXISTS articles (
            id INTEGER PRIMARY KEY AUTOINCREMENT,
            title TEXT,
            link TEXT,
            description TEXT,
            pubDate DATETIME,
            category TEXT
        )''')
        conn.commit()
    finally:
        # Release the connection even when the DDL statement fails.
        conn.close()
def _normalize_pub_date(raw_pub_date):
    """Return *raw_pub_date* as ``YYYY-MM-DD HH:MM:SS``, or unchanged if unparsable."""
    try:
        parsed = datetime.strptime(raw_pub_date, '%a, %d %b %Y %H:%M:%S %z')
    except ValueError:
        # Keep the original string when it is not in the expected format.
        return raw_pub_date
    # NOTE: the UTC offset is parsed but not written out, so the stored value
    # is the wall-clock time exactly as it appears in the input string.
    return parsed.strftime('%Y-%m-%d %H:%M:%S')


def insert_data(data):
    """Insert article entries into the ``articles`` table of ``./db/freebuf.db``.

    Args:
        data: Iterable of dicts with the keys ``title``, ``link``,
            ``description``, ``pubDate`` and ``category``. ``pubDate`` values
            in the form ``'Wed, 04 Dec 2024 16:00:00 +0800'`` are stored as
            ``'2024-12-04 16:00:00'``; anything else is stored verbatim.

    Raises:
        KeyError: If an entry lacks one of the required keys.
    """
    # Build every row before touching the database so that a malformed entry
    # fails fast without leaving an open connection behind.
    rows = [
        (
            entry['title'],
            entry['link'],
            entry['description'],
            _normalize_pub_date(entry['pubDate']),
            entry['category'],
        )
        for entry in data
    ]

    conn = sqlite3.connect('./db/freebuf.db')
    try:
        cursor = conn.cursor()
        cursor.executemany('''
            INSERT INTO articles (title, link, description, pubDate, category)
            VALUES (?, ?, ?, ?, ?)
        ''', rows)
        conn.commit()
    finally:
        # Always release the connection, even if the insert fails.
        conn.close()
def get_freebuf_json():
    """Load ``./JSON/freebuf.json`` and return its articles as numbered dicts.

    Returns:
        A list of dicts with the keys ``id`` (1-based position in the file),
        ``title``, ``link``, ``description``, ``pubDate`` and ``category``.
        Fields missing from an item default to an empty string.

    Raises:
        FileNotFoundError: If the JSON file does not exist.
        ValueError: If the top-level JSON value is not a list.
    """
    json_path = './JSON/freebuf.json'
    wanted_fields = ("title", "link", "description", "pubDate", "category")

    # Fail early with an explicit message when the file is absent.
    if not os.path.exists(json_path):
        raise FileNotFoundError("freebuf.json文件不存在请检查程序是否运行正常")

    with open(json_path, 'r', encoding='utf-8') as handle:
        payload = json.load(handle)

    # The file is expected to hold a list of JSON objects.
    if not isinstance(payload, list):
        raise ValueError("JSON文件格式错误请检查爬取程序是否异常")

    # Keep only the wanted fields and number the entries starting at 1.
    return [
        {"id": position, **{field: item.get(field, "") for field in wanted_fields}}
        for position, item in enumerate(payload, start=1)
    ]
def select_articles(e_hour):
    """Return the articles whose ``pubDate`` lies within the last *e_hour* hours.

    The window is ``[now - e_hour hours, now]`` (both ends inclusive), where
    ``now`` is the naive local time from ``datetime.now()``. Bounds are passed
    to SQLite as ``YYYY-MM-DD HH:MM:SS`` strings.

    Args:
        e_hour: Size of the look-back window in hours.

    Returns:
        A list of row tuples ``(id, title, link, description, pubDate,
        category)`` from the ``articles`` table of ``./db/freebuf.db``.
    """
    time_format = '%Y-%m-%d %H:%M:%S'
    end_time = datetime.now()
    start_time = end_time - timedelta(hours=e_hour)

    conn = sqlite3.connect('./db/freebuf.db')
    try:
        cursor = conn.cursor()
        cursor.execute('''
            SELECT * FROM articles
            WHERE pubDate BETWEEN ? AND ?
        ''', (start_time.strftime(time_format), end_time.strftime(time_format)))
        return cursor.fetchall()
    finally:
        # Close the connection even if the query raises.
        conn.close()
def clear_table():
    """Delete every row from the ``articles`` table of ``./db/freebuf.db``."""
    conn = sqlite3.connect('./db/freebuf.db')
    try:
        cursor = conn.cursor()
        cursor.execute('DELETE FROM articles')
        conn.commit()
    finally:
        # Close the connection even if the DELETE fails (e.g. missing table).
        conn.close()
2024-12-10 11:49:15 +08:00
def record_md(result, filename="./history/sec_news.md"):
    """Prepend *result* to the Markdown history file *filename*.

    The file is rewritten as ``result`` followed by its previous content. If
    the file does not exist yet it is created, together with its parent
    directory.

    Args:
        result: Text to place at the beginning of the file.
        filename: Path of the history file (UTF-8 encoded).
    """
    # Read whatever is already there; a missing file simply means no history.
    try:
        with open(filename, 'r', encoding='utf-8') as file:
            existing_content = file.read()
    except FileNotFoundError:
        existing_content = ""

    # open(..., 'w') does not create missing directories, so do it explicitly.
    parent_dir = os.path.dirname(filename)
    if parent_dir:
        os.makedirs(parent_dir, exist_ok=True)

    # Newest content goes first.
    with open(filename, 'w', encoding='utf-8') as file:
        file.write(result + existing_content)
2024-12-10 11:49:15 +08:00
2024-12-18 11:56:11 +08:00
def get_filtered_articles(entries, Is_short):
    """Format article rows for sending and append them to the Markdown history.

    Each row is read positionally: index 1 is the title, 2 the link, 4 the
    publication time and 5 the category.

    Args:
        entries: Iterable of article rows (indexable sequences).
        Is_short: ``False`` produces the long format (with category and a
            40-dash separator); ``True`` produces the short format (no
            category, 3-dash separator). Any other value leaves the returned
            text empty while the history record is still written.

    Returns:
        The formatted text for all entries, concatenated.
    """
    message_parts = []
    history_parts = []

    for row in entries:
        title, link, uploaded, category = row[1], row[2], row[4], row[5]

        if Is_short == False:
            message_parts.append(f"文章:[{title}]({link})\n类型:{category}\n")
            message_parts.append(f"上传时间:{uploaded}\n")
            # Separator line between articles.
            message_parts.append("\n" + "-" * 40 + "\n")
        elif Is_short == True:
            message_parts.append(f"文章:[{title}]({link})\n")
            message_parts.append(f"上传时间:{uploaded}\n")
            # Shorter separator for the compact format.
            message_parts.append("\n" + "-" * 3 + "\n")

        # The history record always uses the full Markdown layout.
        history_parts.append(f"#### 文章:[{title}]({link})\n")
        history_parts.append(f"**类型**:{category}\n")
        history_parts.append(f"**上传时间**:{uploaded}\n")
        history_parts.append("\n" + "-" * 40 + "\n")

    record_md("".join(history_parts))
    return "".join(message_parts)
2024-12-18 11:56:11 +08:00
def Src_freebuf(e_hour, Is_short):
    """Rebuild the article table from the JSON dump and format recent articles.

    Steps: create the database if ``./db/freebuf.db`` is missing, empty the
    ``articles`` table, reload it from the JSON file, then select the articles
    published within the last *e_hour* hours.

    Args:
        e_hour: Look-back window in hours, passed to ``select_articles``.
        Is_short: Output format flag, passed to ``get_filtered_articles``.

    Returns:
        The formatted text when at least one article matches, otherwise
        ``False``.
    """
    database_missing = not os.path.exists('./db/freebuf.db')
    if database_missing:
        # First run: create the database file and the table.
        create_database()

    # Start from an empty table so only the current JSON content is stored.
    clear_table()
    insert_data(get_freebuf_json())

    recent_rows = select_articles(e_hour)
    if not recent_rows:
        return False
    return get_filtered_articles(recent_rows, Is_short)
2024-12-05 00:03:51 +08:00
if __name__ == "__main__":
    # Manual run: long-format output for articles from the last 4 hours.
    output = Src_freebuf(4, False)
    if output is False:
        # Nothing matched; report it and skip further processing.
        print("-" * 40)
        print("Freebuf数据为空跳过执行。")
    else:
        print(output)