# 选取5大行业各6只代表性股票
industry_stock_mapping = { # 行业-股票映射字典
'银行': ['601398.XSHG', '601288.XSHG', '600036.XSHG', '601818.XSHG', '600000.XSHG', '601166.XSHG'], # 工商银行、农业银行、招商银行等
'电子': ['002415.XSHE', '603986.XSHG', '600703.XSHG', '002049.XSHE', '300750.XSHE', '688008.XSHG'], # 海康威视等电子企业
'食品饮料': ['600519.XSHG', '000858.XSHE', '603369.XSHG', '002304.XSHE', '000568.XSHE', '600887.XSHG'], # 贵州茅台等食品企业
'非银金融': ['601318.XSHG', '600030.XSHG', '601688.XSHG', '600837.XSHG', '000776.XSHE', '601211.XSHG'], # 中国平安等金融企业
'房地产': ['000002.XSHE', '001979.XSHE', '600048.XSHG', '000069.XSHE', '600383.XSHG', '600340.XSHG'] # 万科A等房地产企业
} # 5行业 × 6只 = 30只股票
all_selected_stock_codes = [] # 存放所有选中股票代码
for stock_list in industry_stock_mapping.values(): # 展开所有行业的股票
all_selected_stock_codes.extend(stock_list) # 追加到总列表
# 读取后复权股价数据
path_price = os.path.join(DATA_DIR, 'stock/stock_price_post_adjusted.h5') # 股价文件路径
stock_price_data = pd.read_hdf(path_price).reset_index() # 读取并重置索引