233 lines
9.2 KiB
Python
233 lines
9.2 KiB
Python
"""
|
||
该代码用于更新日 K 数据
|
||
"""
|
||
from futu import *
|
||
from pymysql import Error
|
||
from MySQLHelper import MySQLHelper # MySQLHelper类保存为单独文件
|
||
from datetime import datetime
|
||
import logging
|
||
from typing import Optional, List, Dict, Union, Tuple
|
||
import time
|
||
|
||
def get_market_data(market: Market) -> List[str]:
|
||
"""
|
||
从Futu API获取指定市场的股票代码列表
|
||
|
||
Args:
|
||
market (Market): 市场枚举值,如 Market.SH, Market.SZ
|
||
|
||
Returns:
|
||
List[str]: 股票代码列表
|
||
"""
|
||
quote_ctx = OpenQuoteContext(host='127.0.0.1', port=11111)
|
||
try:
|
||
ret, data = quote_ctx.get_stock_basicinfo(market, SecurityType.STOCK)
|
||
if ret == RET_OK:
|
||
# 提取code列并转换为列表
|
||
codes = data['code'].astype(str).tolist()
|
||
logging.info(f"获取到 {market} 市场 {len(codes)} 个股票代码")
|
||
return codes
|
||
else:
|
||
logging.error(f"获取股票代码失败: {data}")
|
||
return []
|
||
except Exception as e:
|
||
logging.error(f"获取股票代码时发生异常: {str(e)}")
|
||
return []
|
||
finally:
|
||
quote_ctx.close()
|
||
|
||
def preprocess_quote_data(df: pd.DataFrame) -> List[Dict]:
|
||
"""
|
||
预处理行情数据,转换为适合数据库存储的格式
|
||
|
||
Args:
|
||
df (pd.DataFrame): 原始行情数据DataFrame
|
||
|
||
Returns:
|
||
List[Dict]: 处理后的数据列表
|
||
"""
|
||
processed_data = []
|
||
for _, row in df.iterrows():
|
||
try:
|
||
# 提取市场标识
|
||
market = row['code'].split('.')[0] if '.' in row['code'] else 'UNKNOWN'
|
||
|
||
# 转换时间格式
|
||
trade_time = datetime.strptime(row['time_key'], '%Y-%m-%d %H:%M:%S')
|
||
|
||
item = {
|
||
'stock_code': row['code'],
|
||
'stock_name': row['name'],
|
||
'trade_date': trade_time,
|
||
'open_price': float(row['open']),
|
||
'close_price': float(row['close']),
|
||
'high_price': float(row['high']),
|
||
'low_price': float(row['low']),
|
||
'pe_ratio': float(row['pe_ratio']) if pd.notna(row['pe_ratio']) else None,
|
||
'turnover_rate': float(row['turnover_rate']) if pd.notna(row['turnover_rate']) else None,
|
||
'volume': int(row['volume']) if pd.notna(row['volume']) else None,
|
||
'turnover': float(row['turnover']) if pd.notna(row['turnover']) else None,
|
||
'change_rate': float(row['change_rate']) if pd.notna(row['change_rate']) else None,
|
||
'last_close': float(row['last_close']) if pd.notna(row['last_close']) else None,
|
||
'market': market
|
||
}
|
||
processed_data.append(item)
|
||
except Exception as e:
|
||
logging.warning(f"处理行情数据时跳过异常行 {row.get('code', '未知')}: {str(e)}")
|
||
continue
|
||
|
||
return processed_data
|
||
|
||
def save_quotes_to_db(db_config: dict, quote_data: pd.DataFrame, table_name: str = 'stock_quotes') -> bool:
|
||
"""
|
||
将行情数据保存到数据库
|
||
|
||
Args:
|
||
db_config (dict): 数据库配置
|
||
quote_data (pd.DataFrame): 行情数据DataFrame
|
||
table_name (str): 目标表名(默认为'stock_quotes')
|
||
|
||
Returns:
|
||
bool: 是否成功保存
|
||
"""
|
||
# 预处理数据
|
||
processed_data = preprocess_quote_data(quote_data)
|
||
if not processed_data:
|
||
logging.error("没有有效数据需要保存")
|
||
return False
|
||
|
||
# 动态生成SQL插入语句
|
||
insert_sql = f"""
|
||
INSERT INTO {table_name} (
|
||
stock_code, stock_name, trade_date, open_price, close_price, high_price, low_price,
|
||
pe_ratio, turnover_rate, volume, turnover, change_rate, last_close, market
|
||
) VALUES (
|
||
%(stock_code)s, %(stock_name)s, %(trade_date)s, %(open_price)s, %(close_price)s, %(high_price)s, %(low_price)s,
|
||
%(pe_ratio)s, %(turnover_rate)s, %(volume)s, %(turnover)s, %(change_rate)s, %(last_close)s, %(market)s
|
||
)
|
||
ON DUPLICATE KEY UPDATE
|
||
stock_name = VALUES(stock_name),
|
||
open_price = VALUES(open_price),
|
||
close_price = VALUES(close_price),
|
||
high_price = VALUES(high_price),
|
||
low_price = VALUES(low_price),
|
||
pe_ratio = VALUES(pe_ratio),
|
||
turnover_rate = VALUES(turnover_rate),
|
||
volume = VALUES(volume),
|
||
turnover = VALUES(turnover),
|
||
change_rate = VALUES(change_rate),
|
||
last_close = VALUES(last_close)
|
||
"""
|
||
|
||
try:
|
||
with MySQLHelper(**db_config) as db:
|
||
# 检查表是否存在,不存在则创建
|
||
if not db.table_exists(table_name):
|
||
create_table_sql = f"""
|
||
CREATE TABLE IF NOT EXISTS {table_name} (
|
||
id INT AUTO_INCREMENT PRIMARY KEY,
|
||
stock_code VARCHAR(20) NOT NULL COMMENT '股票代码',
|
||
stock_name VARCHAR(50) COMMENT '股票名称',
|
||
trade_date DATETIME NOT NULL COMMENT '交易日期时间',
|
||
open_price DECIMAL(10, 3) COMMENT '开盘价',
|
||
close_price DECIMAL(10, 3) COMMENT '收盘价',
|
||
high_price DECIMAL(10, 3) COMMENT '最高价',
|
||
low_price DECIMAL(10, 3) COMMENT '最低价',
|
||
pe_ratio DECIMAL(10, 3) COMMENT '市盈率',
|
||
turnover_rate DECIMAL(10, 6) COMMENT '换手率(%)',
|
||
volume BIGINT COMMENT '成交量(股)',
|
||
turnover DECIMAL(20, 2) COMMENT '成交额(元)',
|
||
change_rate DECIMAL(10, 6) COMMENT '涨跌幅(%)',
|
||
last_close DECIMAL(10, 3) COMMENT '昨收价',
|
||
market VARCHAR(10) COMMENT '市场标识',
|
||
create_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP COMMENT '创建时间',
|
||
|
||
UNIQUE KEY uk_code_date (stock_code, trade_date),
|
||
KEY idx_trade_date (trade_date),
|
||
KEY idx_stock_code (stock_code)
|
||
) ENGINE=InnoDB DEFAULT CHARSET=utf8mb4 COMMENT='股票行情数据表'
|
||
"""
|
||
db.execute_update(create_table_sql)
|
||
logging.info(f"创建了新表: {table_name}")
|
||
|
||
affected_rows = db.execute_many(insert_sql, processed_data)
|
||
logging.info(f"成功插入/更新 {affected_rows} 条行情记录到表 {table_name}")
|
||
return True
|
||
except Exception as e:
|
||
logging.error(f"保存行情数据到表 {table_name} 失败: {str(e)}")
|
||
return False
|
||
|
||
def read_missing_codes_basic(file_path='missing_tables.txt'):
|
||
"""基础读取方法 - 按行读取所有内容"""
|
||
try:
|
||
with open(file_path, 'r', encoding='utf-8') as f:
|
||
lines = f.readlines()
|
||
# 去除每行末尾的换行符,并过滤空行
|
||
codes = [line.strip() for line in lines if line.strip()]
|
||
return codes
|
||
except FileNotFoundError:
|
||
print(f"文件 {file_path} 不存在")
|
||
return []
|
||
except Exception as e:
|
||
print(f"读取文件失败: {str(e)}")
|
||
return []
|
||
|
||
if __name__ == "__main__":
|
||
# 配置日志
|
||
logging.basicConfig(
|
||
level=logging.INFO,
|
||
format='%(asctime)s - %(levelname)s - %(message)s',
|
||
handlers=[
|
||
logging.FileHandler('Debug.log', encoding='utf-8'), # 关键在这里
|
||
logging.StreamHandler()
|
||
]
|
||
)
|
||
|
||
# 数据库配置
|
||
db_config = {
|
||
'host': 'localhost',
|
||
'user': 'root',
|
||
'password': 'bzskmysql',
|
||
'database': 'klinedata_1d_hk'
|
||
}
|
||
|
||
|
||
# market_data = get_market_data(Market.HK) # 获取香港市场数据,后面需要改成按照筛选来获取
|
||
|
||
market_data = read_missing_codes_basic()
|
||
|
||
nCount = 0 # 记录账号获取多少只股票的数据
|
||
for code in market_data:
|
||
|
||
# nCount = nCount + 1
|
||
# if nCount < 450:
|
||
# continue
|
||
|
||
quote_ctx = OpenQuoteContext(host='127.0.0.1', port=11111)
|
||
# ret, data, page_req_key = quote_ctx.request_history_kline(code, start='2024-09-01', end='2025-08-20', max_count=100, session=Session.ALL) # 每页5个,请求第一页 session 字段紧美股有用
|
||
ret, data, page_req_key = quote_ctx.request_history_kline(code, start='2024-10-01', end='2025-08-20', max_count=100) # 每页5个,请求第一页
|
||
# 保存数据到自定义表
|
||
custom_table_name = 'hk_' + code[3:] # 自定义表名
|
||
|
||
if ret == RET_OK:
|
||
success = save_quotes_to_db(db_config, data, table_name=custom_table_name)
|
||
else:
|
||
print('error:', data)
|
||
|
||
while page_req_key != None: # 请求后面的所有结果
|
||
# print('*************************************')
|
||
ret, data, page_req_key = quote_ctx.request_history_kline(code, start='2024-10-01', end='2025-08-20', max_count=100, page_req_key=page_req_key) # 请求翻页后的数据
|
||
if ret == RET_OK:
|
||
success = save_quotes_to_db(db_config, data, table_name=custom_table_name)
|
||
else:
|
||
print('error:', data)
|
||
|
||
time.sleep(1)
|
||
|
||
|
||
# if nCount == 2000:
|
||
# break
|
||
quote_ctx.close() # 结束后记得关闭当条连接,防止连接条数用尽
|
||
|
||
|