TradingAgents/tradingagents/dataflows/akshare_news.py

50 lines
1.9 KiB
Python

# tradingagents/dataflows/akshare_news.py
import akshare as ak
from datetime import datetime
import pandas as pd
def get_news_akshare(
ticker: str,
start_date: str,
end_date: str,
) -> str:
"""
使用 AkShare 获取 A 股特定股票的新闻 (东方财富数据源)
"""
# 1. A股代码清洗: yfinance 习惯用 '600519.SS', akshare 通常只需要 '600519'
clean_ticker = ticker.split('.')[0]
if not clean_ticker.isdigit():
return f"Invalid A-share ticker format: {ticker}"
try:
# 获取个股新闻 (东方财富接口)
news_df = ak.stock_news_em(symbol=clean_ticker)
if news_df.empty:
return f"No news found for {ticker}"
# 将发布时间转换为 datetime 进行过滤
news_df['发布时间'] = pd.to_datetime(news_df['发布时间'])
start_dt = datetime.strptime(start_date, "%Y-%m-%d")
end_dt = datetime.strptime(end_date, "%Y-%m-%d")
# 过滤日期区间
mask = (news_df['发布时间'] >= start_dt) & (news_df['发布时间'] <= end_dt)
filtered_news = news_df.loc[mask]
if filtered_news.empty:
return f"No news found for {ticker} between {start_date} and {end_date}"
# 格式化输出为大模型易读的 Markdown 格式
news_str = ""
# 限制返回条数,避免 token 溢出
for _, row in filtered_news.head(20).iterrows():
pub_time = row['发布时间'].strftime('%Y-%m-%d %H:%M:%S')
news_str += f"### {row['新闻标题']} (时间: {pub_time})\n"
news_str += f"{row['新闻内容']}\n"
news_str += f"来源: {row['文章来源']} | Link: {row['新闻链接']}\n\n"
return f"## {ticker} A股新闻, 从 {start_date}{end_date}:\n\n{news_str}"
except Exception as e:
return f"Error fetching A-share news for {ticker} via AkShare: {str(e)}"