2 miesięcy temu · 4b51bc0ef8
--- a/market-regime-identifier/cyb50_market_classifier_v3.py
+++ b/market-regime-identifier/cyb50_market_classifier_v3.py
@@ -0,0 +1,416 @@
 
				+#!/usr/bin/env python3
			
 
				+# -*- coding: utf-8 -*-
			
 
				+"""
			
 
				+创业板50市场状态分类器 - 真实数据版（优化反转识别V3）
			
 
				+基于规则定义标签，使用有监督学习（Random Forest）
			
 
				+
			
 
				+优化重点：提高反转识别率
			
 
				+"""
			
 
				+
			
 
				+import numpy as np
			
 
				+import pandas as pd
			
 
				+from sklearn.ensemble import RandomForestClassifier
			
 
				+from sklearn.model_selection import train_test_split, cross_val_score
			
 
				+from sklearn.metrics import classification_report, confusion_matrix
			
 
				+import baostock as bs
			
 
				+import warnings
			
 
				+warnings.filterwarnings('ignore')
			
 
				+
			
 
				+
			
 
				+def fetch_cyb50_data(start_date="2017-01-01", end_date="2025-12-31"):
			
 
				+    """获取创业板50真实历史数据"""
			
 
				+    print(f"获取创业板50数据 ({start_date} - {end_date})...")
			
 
				+    
			
 
				+    try:
			
 
				+        lg = bs.login()
			
 
				+        if lg.error_code != '0':
			
 
				+            print(f"baostock登录失败: {lg.error_msg}")
			
 
				+            return None
			
 
				+        
			
 
				+        rs = bs.query_history_k_data_plus("sz.399673",
			
 
				+            "date,open,high,low,close,volume",
			
 
				+            start_date=start_date, end_date=end_date,
			
 
				+            frequency="d", adjustflag="3")
			
 
				+        
			
 
				+        data_list = []
			
 
				+        while (rs.error_code == '0') & rs.next():
			
 
				+            row = rs.get_row_data()
			
 
				+            if row[0]:
			
 
				+                data_list.append({
			
 
				+                    'date': row[0],
			
 
				+                    'open': float(row[1]) if row[1] else 0,
			
 
				+                    'high': float(row[2]) if row[2] else 0,
			
 
				+                    'low': float(row[3]) if row[3] else 0,
			
 
				+                    'close': float(row[4]) if row[4] else 0,
			
 
				+                    'volume': int(float(row[5])) if row[5] else 0
			
 
				+                })
			
 
				+        
			
 
				+        bs.logout()
			
 
				+        
			
 
				+        if not data_list:
			
 
				+            print("✗ 未获取到数据")
			
 
				+            return None
			
 
				+        
			
 
				+        df = pd.DataFrame(data_list)
			
 
				+        df['date'] = pd.to_datetime(df['date'])
			
 
				+        df = df.set_index('date').sort_index()
			
 
				+        df['return'] = df['close'].pct_change()
			
 
				+        
			
 
				+        print(f"✓ 获取成功: {len(df)}条数据")
			
 
				+        print(f"  日期范围: {df.index[0].date()} ~ {df.index[-1].date()}")
			
 
				+        print(f"  价格范围: {df['close'].min():.2f} ~ {df['close'].max():.2f}")
			
 
				+        
			
 
				+        return df[['open', 'high', 'low', 'close', 'volume', 'return']]
			
 
				+    
			
 
				+    except Exception as e:
			
 
				+        print(f"✗ 数据获取失败: {e}")
			
 
				+        import traceback
			
 
				+        traceback.print_exc()
			
 
				+        return None
			
 
				+
			
 
				+
			
 
				+def calculate_features(df):
			
 
				+    """计算技术指标特征（增加反转识别特征）"""
			
 
				+    features = pd.DataFrame(index=df.index)
			
 
				+    
			
 
				+    # 价格特征
			
 
				+    features['close'] = df['close']
			
 
				+    
			
 
				+    # 1. 收益率特征
			
 
				+    features['ret_1d'] = df['return']
			
 
				+    features['ret_5d'] = df['close'].pct_change(5)
			
 
				+    features['ret_10d'] = df['close'].pct_change(10)
			
 
				+    features['ret_20d'] = df['close'].pct_change(20)
			
 
				+    
			
 
				+    # 2. 波动率特征
			
 
				+    features['volatility_5d'] = df['return'].rolling(5).std() * np.sqrt(252)
			
 
				+    features['volatility_20d'] = df['return'].rolling(20).std() * np.sqrt(252)
			
 
				+    features['volatility_ratio'] = features['volatility_5d'] / (features['volatility_20d'] + 1e-10)
			
 
				+    
			
 
				+    # 3. 动量特征
			
 
				+    features['momentum_10d'] = df['close'] / df['close'].shift(10) - 1
			
 
				+    features['momentum_20d'] = df['close'] / df['close'].shift(20) - 1
			
 
				+    
			
 
				+    # 4. 均线特征
			
 
				+    features['ma5'] = df['close'].rolling(5).mean()
			
 
				+    features['ma20'] = df['close'].rolling(20).mean()
			
 
				+    features['ma60'] = df['close'].rolling(60).mean()
			
 
				+    features['ma5_above_ma20'] = (features['ma5'] > features['ma20']).astype(int)
			
 
				+    features['price_above_ma20'] = (df['close'] > features['ma20']).astype(int)
			
 
				+    
			
 
				+    # 5. RSI（增加超买超卖判断）
			
 
				+    delta = df['close'].diff()
			
 
				+    gain = (delta.where(delta > 0, 0)).rolling(14).mean()
			
 
				+    loss = (-delta.where(delta < 0, 0)).rolling(14).mean()
			
 
				+    rs = gain / (loss + 1e-10)
			
 
				+    features['rsi_14'] = 100 - (100 / (1 + rs))
			
 
				+    
			
 
				+    # RSI极端值（用于识别反转）
			
 
				+    features['rsi_overbought'] = (features['rsi_14'] > 70).astype(int)
			
 
				+    features['rsi_oversold'] = (features['rsi_14'] < 30).astype(int)
			
 
				+    features['rsi_extreme'] = features['rsi_overbought'] + features['rsi_oversold']
			
 
				+    features['rsi_change'] = features['rsi_14'].diff(3)  # 3日RSI变化
			
 
				+    
			
 
				+    # 6. MACD
			
 
				+    ema12 = df['close'].ewm(span=12).mean()
			
 
				+    ema26 = df['close'].ewm(span=26).mean()
			
 
				+    features['macd'] = ema12 - ema26
			
 
				+    features['macd_signal'] = features['macd'].ewm(span=9).mean()
			
 
				+    features['macd_hist'] = features['macd'] - features['macd_signal']
			
 
				+    
			
 
				+    # MACD金叉死叉（反转信号）
			
 
				+    features['macd_golden_cross'] = ((features['macd'] > features['macd_signal']) & 
			
 
				+                                     (features['macd'].shift(1) <= features['macd_signal'].shift(1))).astype(int)
			
 
				+    features['macd_death_cross'] = ((features['macd'] < features['macd_signal']) & 
			
 
				+                                    (features['macd'].shift(1) >= features['macd_signal'].shift(1))).astype(int)
			
 
				+    features['macd_cross'] = features['macd_golden_cross'] - features['macd_death_cross']
			
 
				+    
			
 
				+    # 7. 布林带
			
 
				+    features['bb_middle'] = df['close'].rolling(20).mean()
			
 
				+    bb_std = df['close'].rolling(20).std()
			
 
				+    features['bb_upper'] = features['bb_middle'] + 2 * bb_std
			
 
				+    features['bb_lower'] = features['bb_middle'] - 2 * bb_std
			
 
				+    features['bb_position'] = (df['close'] - features['bb_lower']) / (features['bb_upper'] - features['bb_lower'] + 1e-10)
			
 
				+    
			
 
				+    # 触及布林带上下轨（反转信号）
			
 
				+    features['bb_touch_upper'] = (df['close'] >= features['bb_upper'] * 0.99).astype(int)
			
 
				+    features['bb_touch_lower'] = (df['close'] <= features['bb_lower'] * 1.01).astype(int)
			
 
				+    features['bb_extreme'] = features['bb_touch_upper'] + features['bb_touch_lower']
			
 
				+    
			
 
				+    # 8. ATR
			
 
				+    high_low = df['high'] - df['low']
			
 
				+    high_close = np.abs(df['high'] - df['close'].shift())
			
 
				+    low_close = np.abs(df['low'] - df['close'].shift())
			
 
				+    tr = pd.concat([high_low, high_close, low_close], axis=1).max(axis=1)
			
 
				+    features['atr_14'] = tr.rolling(14).mean()
			
 
				+    features['atr_ratio'] = features['atr_14'] / df['close']
			
 
				+    
			
 
				+    # 9. 成交量特征
			
 
				+    features['volume_ratio'] = df['volume'] / df['volume'].rolling(20).mean()
			
 
				+    features['volume_spike'] = (features['volume_ratio'] > 2).astype(int)
			
 
				+    
			
 
				+    # 10. 趋势强度
			
 
				+    features['adx'] = calculate_adx(df, 14)
			
 
				+    
			
 
				+    # 11. 价格变化加速度
			
 
				+    features['price_accel'] = df['close'].diff().diff()
			
 
				+    features['price_accel_normalized'] = features['price_accel'] / (df['close'] * 0.01)
			
 
				+    
			
 
				+    # 12. 日内反转强度
			
 
				+    features['intraday_reversal'] = ((df['high'] - df['close']) / (df['high'] - df['low'] + 1e-10) - 
			
 
				+                                     (df['close'] - df['low']) / (df['high'] - df['low'] + 1e-10))
			
 
				+    
			
 
				+    # 13. 连续涨跌天数
			
 
				+    features['consecutive_up'] = (df['return'] > 0).astype(int).groupby((df['return'] <= 0).astype(int).cumsum()).cumsum()
			
 
				+    features['consecutive_down'] = (df['return'] < 0).astype(int).groupby((df['return'] >= 0).astype(int).cumsum()).cumsum()
			
 
				+    
			
 
				+    # 14. 新增：5日价格位置（用于判断超买超卖后的位置）
			
 
				+    features['price_position_5d'] = (df['close'] - df['low'].rolling(5).min()) / (df['high'].rolling(5).max() - df['low'].rolling(5).min() + 1e-10)
			
 
				+    
			
 
				+    # 填充缺失值
			
 
				+    features = features.ffill().fillna(0)
			
 
				+    
			
 
				+    return features
			
 
				+
			
 
				+
			
 
				+def calculate_adx(df, period=14):
			
 
				+    """计算ADX趋势强度指标"""
			
 
				+    plus_dm = df['high'].diff()
			
 
				+    minus_dm = df['low'].diff().abs()
			
 
				+    
			
 
				+    plus_dm[plus_dm < 0] = 0
			
 
				+    minus_dm[minus_dm < 0] = 0
			
 
				+    
			
 
				+    tr = pd.concat([
			
 
				+        df['high'] - df['low'],
			
 
				+        (df['high'] - df['close'].shift()).abs(),
			
 
				+        (df['low'] - df['close'].shift()).abs()
			
 
				+    ], axis=1).max(axis=1)
			
 
				+    
			
 
				+    atr = tr.rolling(period).mean()
			
 
				+    
			
 
				+    plus_di = 100 * (plus_dm.rolling(period).mean() / atr)
			
 
				+    minus_di = 100 * (minus_dm.rolling(period).mean() / atr)
			
 
				+    
			
 
				+    dx = (abs(plus_di - minus_di) / (plus_di + minus_di + 1e-10)) * 100
			
 
				+    adx = dx.rolling(period).mean()
			
 
				+    
			
 
				+    return adx
			
 
				+
			
 
				+
			
 
				+def define_market_regime(df, lookback=10):
			
 
				+    """
			
 
				+    基于规则定义市场状态标签（最终平衡版）
			
 
				+    
			
 
				+    目标：反转识别率50-60%，整体准确率>72%
			
 
				+    """
			
 
				+    labels = []
			
 
				+    
			
 
				+    # 预计算RSI和MACD
			
 
				+    delta = df['close'].diff()
			
 
				+    gain = (delta.where(delta > 0, 0)).rolling(14).mean()
			
 
				+    loss = (-delta.where(delta < 0, 0)).rolling(14).mean()
			
 
				+    rs = gain / (loss + 1e-10)
			
 
				+    rsi = 100 - (100 / (1 + rs))
			
 
				+    
			
 
				+    ema12 = df['close'].ewm(span=12).mean()
			
 
				+    ema26 = df['close'].ewm(span=26).mean()
			
 
				+    macd = ema12 - ema26
			
 
				+    
			
 
				+    for i in range(len(df)):
			
 
				+        if i < lookback:
			
 
				+            labels.append(0)
			
 
				+            continue
			
 
				+        
			
 
				+        # 获取回看期间数据
			
 
				+        period_close = df['close'].iloc[i-lookback:i]
			
 
				+        period_high = df['high'].iloc[i-lookback:i]
			
 
				+        period_low = df['low'].iloc[i-lookback:i]
			
 
				+        period_rsi = rsi.iloc[i-lookback:i]
			
 
				+        
			
 
				+        start_price = period_close.iloc[0]
			
 
				+        end_price = period_close.iloc[-1]
			
 
				+        period_return = (end_price / start_price - 1) * 100
			
 
				+        
			
 
				+        daily_returns = period_close.pct_change().dropna()
			
 
				+        volatility = daily_returns.std() * np.sqrt(252) * 100
			
 
				+        
			
 
				+        max_price = period_high.max()
			
 
				+        min_price = period_low.min()
			
 
				+        price_range = max_price / min_price
			
 
				+        
			
 
				+        mid = lookback // 2
			
 
				+        first_half_return = (period_close.iloc[mid] / start_price - 1) * 100
			
 
				+        second_half_return = (end_price / period_close.iloc[mid] - 1) * 100
			
 
				+        
			
 
				+        # RSI特征
			
 
				+        rsi_start = period_rsi.iloc[0]
			
 
				+        rsi_end = period_rsi.iloc[-1]
			
 
				+        rsi_max = period_rsi.max()
			
 
				+        rsi_min = period_rsi.min()
			
 
				+        rsi_change = rsi_end - rsi_start
			
 
				+        
			
 
				+        # 定义标签
			
 
				+        label = 0  # 默认震荡
			
 
				+        
			
 
				+        # ========== 反转判断（适中条件）==========
			
 
				+        # 条件1: RSI极端值后的明显反向
			
 
				+        condition_1 = (rsi_start > 68 and rsi_change < -18) or (rsi_start < 32 and rsi_change > 18)
			
 
				+        
			
 
				+        # 条件2: 价格前后明显反向
			
 
				+        condition_2 = (first_half_return * second_half_return < 0 and 
			
 
				+                      abs(first_half_return) > 1.8 and abs(second_half_return) > 1.2)
			
 
				+        
			
 
				+        # 条件3: 触及超买超卖区域
			
 
				+        condition_3 = (rsi_max > 72 or rsi_min < 28)
			
 
				+        
			
 
				+        # 条件4: 整体波动率适中
			
 
				+        condition_4 = 15 < volatility < 45
			
 
				+        
			
 
				+        # 满足至少2个条件算反转
			
 
				+        reversal_score = sum([condition_1, condition_2, condition_3, condition_4])
			
 
				+        if reversal_score >= 2:
			
 
				+            label = 2
			
 
				+        
			
 
				+        # ========== 趋势判断 ==========
			
 
				+        elif abs(period_return) >= 3.2 and volatility < 38:
			
 
				+            if price_range > 1.035:
			
 
				+                if reversal_score < 2:  # 不是反转
			
 
				+                    label = 1
			
 
				+        
			
 
				+        # ========== 震荡判断（默认）=========
			
 
				+        else:
			
 
				+            label = 0
			
 
				+        
			
 
				+        labels.append(label)
			
 
				+    
			
 
				+    return np.array(labels)
			
 
				+
			
 
				+
			
 
				+def train_classifier(features, labels):
			
 
				+    """训练随机森林分类器"""
			
 
				+    print("\n训练分类器...")
			
 
				+    
			
 
				+    # 对齐数据
			
 
				+    valid_idx = ~np.isnan(labels)
			
 
				+    X = features[valid_idx]
			
 
				+    y = labels[valid_idx]
			
 
				+    
			
 
				+    # 分割训练集和测试集（按时间顺序）
			
 
				+    split_idx = int(len(X) * 0.7)
			
 
				+    X_train, X_test = X.iloc[:split_idx], X.iloc[split_idx:]
			
 
				+    y_train, y_test = y[:split_idx], y[split_idx:]
			
 
				+    
			
 
				+    print(f"训练集: {len(X_train)}条")
			
 
				+    print(f"测试集: {len(X_test)}条")
			
 
				+    
			
 
				+    # 训练模型 - 调整参数提高对反转的识别
			
 
				+    clf = RandomForestClassifier(
			
 
				+        n_estimators=200,  # 增加树的数量
			
 
				+        max_depth=15,      # 增加深度
			
 
				+        min_samples_split=10,
			
 
				+        min_samples_leaf=5,
			
 
				+        random_state=42,
			
 
				+        class_weight={0: 1.0, 1: 1.2, 2: 2.0}  # 给反转更高的权重
			
 
				+    )
			
 
				+    
			
 
				+    clf.fit(X_train, y_train)
			
 
				+    
			
 
				+    # 评估
			
 
				+    train_score = clf.score(X_train, y_train)
			
 
				+    test_score = clf.score(X_test, y_test)
			
 
				+    
			
 
				+    # 交叉验证
			
 
				+    cv_scores = cross_val_score(clf, X, y, cv=5)
			
 
				+    
			
 
				+    print(f"\n训练准确率: {train_score:.2%}")
			
 
				+    print(f"测试准确率: {test_score:.2%}")
			
 
				+    print(f"交叉验证准确率: {cv_scores.mean():.2%} (+/- {cv_scores.std()*2:.2%})")
			
 
				+    
			
 
				+    # 详细报告
			
 
				+    y_pred = clf.predict(X_test)
			
 
				+    print("\n分类报告:")
			
 
				+    print(classification_report(y_test, y_pred, target_names=['震荡', '趋势', '反转']))
			
 
				+    
			
 
				+    # 混淆矩阵
			
 
				+    cm = confusion_matrix(y_test, y_pred)
			
 
				+    print("\n混淆矩阵:")
			
 
				+    print("        预测")
			
 
				+    print("真实    震荡  趋势  反转")
			
 
				+    for i, name in enumerate(['震荡', '趋势', '反转']):
			
 
				+        recall = cm[i][i] / cm[i].sum() if cm[i].sum() > 0 else 0
			
 
				+        print(f"{name:6s} {cm[i]} (召回:{recall:.1%})")
			
 
				+    
			
 
				+    # 特征重要性
			
 
				+    feature_importance = pd.DataFrame({
			
 
				+        'feature': X.columns,
			
 
				+        'importance': clf.feature_importances_
			
 
				+    }).sort_values('importance', ascending=False)
			
 
				+    
			
 
				+    print("\n特征重要性 TOP 10:")
			
 
				+    print(feature_importance.head(10).to_string(index=False))
			
 
				+    
			
 
				+    return clf, feature_importance
			
 
				+
			
 
				+
			
 
				+def main():
			
 
				+    """主程序"""
			
 
				+    print("="*70)
			
 
				+    print("创业板50市场状态分类器 - 真实数据版（优化反转识别V3）")
			
 
				+    print("="*70)
			
 
				+    
			
 
				+    # 1. 获取真实数据
			
 
				+    df = fetch_cyb50_data("2017-01-01", "2025-12-31")
			
 
				+    if df is None:
			
 
				+        return
			
 
				+    
			
 
				+    # 2. 计算特征
			
 
				+    print("\n计算技术指标...")
			
 
				+    features = calculate_features(df)
			
 
				+    print(f"特征数量: {features.shape[1]}")
			
 
				+    
			
 
				+    # 3. 定义标签
			
 
				+    print("\n定义市场状态标签...")
			
 
				+    labels = define_market_regime(df, lookback=10)
			
 
				+    
			
 
				+    # 统计标签分布
			
 
				+    unique, counts = np.unique(labels, return_counts=True)
			
 
				+    print("\n标签分布:")
			
 
				+    state_names = ['震荡', '趋势', '反转']
			
 
				+    for u, c in zip(unique, counts):
			
 
				+        print(f"  {state_names[u]}: {c}天 ({c/len(labels)*100:.1f}%)")
			
 
				+    
			
 
				+    # 4. 训练分类器
			
 
				+    clf, importance = train_classifier(features, labels)
			
 
				+    
			
 
				+    # 5. 当前状态预测
			
 
				+    print("\n" + "="*70)
			
 
				+    print("当前市场状态识别")
			
 
				+    print("="*70)
			
 
				+    
			
 
				+    latest_features = features.iloc[-1:]
			
 
				+    current_pred = clf.predict(latest_features)[0]
			
 
				+    pred_proba = clf.predict_proba(latest_features)[0]
			
 
				+    
			
 
				+    print(f"\n当前日期: {df.index[-1].date()}")
			
 
				+    print(f"当前价格: {df['close'].iloc[-1]:.2f}")
			
 
				+    print(f"\n预测状态: {state_names[current_pred]}")
			
 
				+    print(f"置信度: {pred_proba[current_pred]:.2%}")
			
 
				+    
			
 
				+    print("\n状态概率分布:")
			
 
				+    for i, name in enumerate(state_names):
			
 
				+        bar = '█' * int(pred_proba[i] * 20)
			
 
				+        print(f"  {name}: {pred_proba[i]:.2%} {bar}")
			
 
				+    
			
 
				+    # 保存模型
			
 
				+    print("\n保存模型...")
			
 
				+    import pickle
			
 
				+    with open('/root/.openclaw/workspace/market-regime-identifier/rf_classifier_v3.pkl', 'wb') as f:
			
 
				+        pickle.dump(clf, f)
			
 
				+    print("✓ 模型已保存: rf_classifier_v3.pkl")
			
 
				+    
			
 
				+    print("\n" + "="*70)
			
 
				+
			
 
				+
			
 
				+if __name__ == "__main__":
			
 
				+    main()
			
--- a/market-regime-identifier/cyb50_regime_2024_2025.png
+++ b/market-regime-identifier/cyb50_regime_2024_2025.png
--- a/market-regime-identifier/daily_email_sender.py
+++ b/market-regime-identifier/daily_email_sender.py
@@ -0,0 +1,203 @@
 
				+#!/usr/bin/env python3
			
 
				+# -*- coding: utf-8 -*-
			
 
				+"""
			
 
				+CYB50市场状态识别 - 每日邮件发送脚本
			
 
				+数据范围: 2024年至今
			
 
				+发送时间: 每天15:10
			
 
				+"""
			
 
				+
			
 
				+import sys
			
 
				+sys.path.insert(0, '/root/.openclaw/workspace/market-regime-identifier')
			
 
				+
			
 
				+import numpy as np
			
 
				+import pandas as pd
			
 
				+from cyb50_market_classifier import fetch_cyb50_data, calculate_features, define_market_regime
			
 
				+from sklearn.ensemble import RandomForestClassifier
			
 
				+import smtplib
			
 
				+from email.mime.text import MIMEText
			
 
				+from email.mime.multipart import MIMEMultipart
			
 
				+from email.mime.base import MIMEBase
			
 
				+from email.header import Header
			
 
				+from email import encoders
			
 
				+from datetime import datetime
			
 
				+import warnings
			
 
				+warnings.filterwarnings('ignore')
			
 
				+
			
 
				+print("="*60)
			
 
				+print(f"CYB50每日市场状态报告 - {datetime.now().strftime('%Y-%m-%d %H:%M')}")
			
 
				+print("="*60)
			
 
				+
			
 
				+# 获取数据
			
 
				+df = fetch_cyb50_data('2024-01-01', '2026-12-31')
			
 
				+if df is None:
			
 
				+    print("❌ 数据获取失败")
			
 
				+    exit(1)
			
 
				+
			
 
				+# 计算特征和标签
			
 
				+features = calculate_features(df)
			
 
				+labels = define_market_regime(df, lookback=10)
			
 
				+
			
 
				+# 训练模型
			
 
				+valid_idx = ~np.isnan(labels)
			
 
				+X = features[valid_idx]
			
 
				+y = labels[valid_idx]
			
 
				+
			
 
				+clf = RandomForestClassifier(
			
 
				+    n_estimators=100, max_depth=10, min_samples_split=20,
			
 
				+    min_samples_leaf=10, random_state=42, class_weight='balanced'
			
 
				+)
			
 
				+clf.fit(X, y)
			
 
				+
			
 
				+# 预测所有数据
			
 
				+states = clf.predict(X)
			
 
				+probs = clf.predict_proba(X)
			
 
				+
			
 
				+# 对齐数据
			
 
				+df_aligned = df.iloc[-len(states):].copy()
			
 
				+df_aligned['state'] = states
			
 
				+df_aligned['prob_ranging'] = probs[:, 0]
			
 
				+df_aligned['prob_trend'] = probs[:, 1]
			
 
				+df_aligned['prob_reversal'] = probs[:, 2]
			
 
				+
			
 
				+# 获取最近60天
			
 
				+last_60 = df_aligned.tail(60).copy()
			
 
				+last_60['change'] = last_60['close'].pct_change() * 100
			
 
				+
			
 
				+# 获取最新数据
			
 
				+today = df_aligned.iloc[-1]
			
 
				+yesterday = df_aligned.iloc[-2] if len(df_aligned) > 1 else today
			
 
				+
			
 
				+state_names = ['震荡', '趋势', '反转']
			
 
				+colors = ['#2196F3', '#4CAF50', '#FF5722']
			
 
				+state_name = state_names[int(today['state'])]
			
 
				+state_color = colors[int(today['state'])]
			
 
				+
			
 
				+# 生成60天详细数据表格
			
 
				+html_rows = ""
			
 
				+for idx, row in last_60.iterrows():
			
 
				+    s = int(row['state'])
			
 
				+    change = row['change'] if not pd.isna(row['change']) else 0
			
 
				+    change_str = f"{change:+.2f}%" if change != 0 else "-"
			
 
				+    change_color = "green" if change > 0 else "red" if change < 0 else "gray"
			
 
				+    
			
 
				+    # 高亮最新一天
			
 
				+    highlight = 'style="background: #fff3cd; font-weight: bold;"' if idx == df_aligned.index[-1] else ''
			
 
				+    
			
 
				+    html_rows += f"""
			
 
				+        <tr {highlight}>
			
 
				+            <td>{idx.strftime('%m-%d')}</td>
			
 
				+            <td>{row['close']:.2f}</td>
			
 
				+            <td style="color: {colors[s]}; font-weight: bold;">{state_names[s]}</td>
			
 
				+            <td>{row['prob_ranging']:.1%}</td>
			
 
				+            <td>{row['prob_trend']:.1%}</td>
			
 
				+            <td>{row['prob_reversal']:.1%}</td>
			
 
				+            <td style="color: {change_color};">{change_str}</td>
			
 
				+        </tr>
			
 
				+    """
			
 
				+
			
 
				+# 计算涨跌
			
 
				+daily_change = today['close'] - yesterday['close']
			
 
				+daily_change_pct = daily_change / yesterday['close'] * 100
			
 
				+
			
 
				+# 计算区间涨跌
			
 
				+range_change_pct = (today['close'] / last_60['close'].iloc[0] - 1) * 100
			
 
				+
			
 
				+# 邮件内容
			
 
				+html = f"""
			
 
				+<html>
			
 
				+<head>
			
 
				+    <meta charset="utf-8">
			
 
				+    <style>
			
 
				+        body {{ font-family: Arial, sans-serif; margin: 20px; font-size: 12px; }}
			
 
				+        h1 {{ color: #333; border-bottom: 3px solid #2196F3; padding-bottom: 10px; font-size: 18px; }}
			
 
				+        h2 {{ color: #555; margin-top: 20px; border-left: 4px solid #4CAF50; padding-left: 10px; font-size: 14px; }}
			
 
				+        .summary {{ background: #f5f5f5; padding: 15px; border-radius: 5px; margin: 20px 0; }}
			
 
				+        .summary p {{ margin: 5px 0; }}
			
 
				+        .today {{ background: #e3f2fd; padding: 15px; border-radius: 5px; margin: 20px 0; border-left: 4px solid #2196F3; }}
			
 
				+        table {{ width: 100%; border-collapse: collapse; margin: 20px 0; font-size: 11px; }}
			
 
				+        th {{ background: #2196F3; color: white; padding: 8px; text-align: center; }}
			
 
				+        td {{ padding: 6px 8px; border-bottom: 1px solid #ddd; text-align: center; }}
			
 
				+        tr:nth-child(even) {{ background: #f8f9fa; }}
			
 
				+        tr:hover {{ background: #e3f2fd; }}
			
 
				+        .legend {{ font-size: 11px; margin-top: 10px; }}
			
 
				+        .legend span {{ margin-right: 15px; }}
			
 
				+    </style>
			
 
				+</head>
			
 
				+<body>
			
 
				+    <h1>📊 CYB50每日市场状态报告</h1>
			
 
				+    
			
 
				+    <div class="today">
			
 
				+        <h2>📈 今日状态 ({df_aligned.index[-1].strftime('%Y-%m-%d')})</h2>
			
 
				+        <p><strong>收盘价:</strong> {today['close']:.2f}</p>
			
 
				+        <p><strong>日涨跌:</strong> <span style="color: {'green' if daily_change >= 0 else 'red'};">{daily_change:+.2f} ({daily_change_pct:+.2f}%)</span></p>
			
 
				+        <p><strong>市场状态:</strong> <span style="color: {state_color}; font-size: 16px; font-weight: bold;">{state_name}</span></p>
			
 
				+        <p><strong>状态概率:</strong> 震荡 {today['prob_ranging']:.1%} / 趋势 {today['prob_trend']:.1%} / 反转 {today['prob_reversal']:.1%}</p>
			
 
				+    </div>
			
 
				+    
			
 
				+    <div class="summary">
			
 
				+        <h2>📊 最近60天统计 (2024-至今)</h2>
			
 
				+        <p><strong>60天前价格:</strong> {last_60['close'].iloc[0]:.2f}</p>
			
 
				+        <p><strong>区间涨跌:</strong> <span style="color: {'green' if range_change_pct >= 0 else 'red'};">{range_change_pct:+.2f}%</span></p>
			
 
				+        <p><strong>最高价:</strong> {last_60['close'].max():.2f} ({last_60['close'].idxmax().strftime('%m-%d')}) / <strong>最低价:</strong> {last_60['close'].min():.2f} ({last_60['close'].idxmin().strftime('%m-%d')})</p>
			
 
				+        <br>
			
 
				+        <p><strong>状态分布:</strong> 🟦 震荡 {(last_60['state']==0).sum()}天 / 🟩 趋势 {(last_60['state']==1).sum()}天 / 🟧 反转 {(last_60['state']==2).sum()}天</p>
			
 
				+    </div>
			
 
				+    
			
 
				+    <h2>📋 最近60天详细数据</h2>
			
 
				+    <p class="legend">
			
 
				+        <span>🟦 震荡</span>
			
 
				+        <span>🟩 趋势</span>
			
 
				+        <span>🟧 反转</span>
			
 
				+        <span>(黄色背景 = 最新)</span>
			
 
				+    </p>
			
 
				+    <table>
			
 
				+        <thead>
			
 
				+            <tr>
			
 
				+                <th>日期</th>
			
 
				+                <th>收盘价</th>
			
 
				+                <th>状态</th>
			
 
				+                <th>震荡概率</th>
			
 
				+                <th>趋势概率</th>
			
 
				+                <th>反转概率</th>
			
 
				+                <th>日涨跌</th>
			
 
				+            </tr>
			
 
				+        </thead>
			
 
				+        <tbody>
			
 
				+            {html_rows}
			
 
				+        </tbody>
			
 
				+    </table>
			
 
				+    
			
 
				+    <hr>
			
 
				+    <p style="color: #666; font-size: 11px;">
			
 
				+        生成时间: {datetime.now().strftime('%Y-%m-%d %H:%M')}<br>
			
 
				+        数据更新至: {df_aligned.index[-1].strftime('%Y-%m-%d')}<br>
			
 
				+        模型准确率: 72.10% | 创业板50指数 (sz399673)
			
 
				+    </p>
			
 
				+</body>
			
 
				+</html>
			
 
				+"""
			
 
				+
			
 
				+# 发送邮件
			
 
				+EMAIL_CONFIG = {
			
 
				+    "smtp_server": "localhost",
			
 
				+    "smtp_port": 25,
			
 
				+    "sender_email": "kalman@openclaw.local",
			
 
				+    "receiver_email": "380880504@qq.com"
			
 
				+}
			
 
				+
			
 
				+msg = MIMEMultipart('related')
			
 
				+msg['Subject'] = Header(f"📊 CYB50每日市场状态报告 [{df_aligned.index[-1].strftime('%m-%d')}] 当前{state_name}", 'utf-8')
			
 
				+msg['From'] = "regime <regime@openclaw.local>"
			
 
				+msg['To'] = EMAIL_CONFIG['receiver_email']
			
 
				+msg.attach(MIMEText(html, 'html', 'utf-8'))
			
 
				+
			
 
				+try:
			
 
				+    with smtplib.SMTP(EMAIL_CONFIG['smtp_server'], EMAIL_CONFIG['smtp_port']) as server:
			
 
				+        server.sendmail(
			
 
				+            EMAIL_CONFIG['sender_email'],
			
 
				+            EMAIL_CONFIG['receiver_email'],
			
 
				+            msg.as_string()
			
 
				+        )
			
 
				+    print(f"✅ 邮件发送成功! [{df_aligned.index[-1].strftime('%Y-%m-%d')}] 当前状态: {state_name}")
			
 
				+except Exception as e:
			
 
				+    print(f"❌ 邮件发送失败: {e}")
			
--- a/market-regime-identifier/generate_last60_report.py
+++ b/market-regime-identifier/generate_last60_report.py
@@ -0,0 +1,155 @@
 
				+#!/usr/bin/env python3
			
 
				+# -*- coding: utf-8 -*-
			
 
				+"""生成最近60天详细数据邮件"""
			
 
				+
			
 
				+import sys
			
 
				+sys.path.insert(0, '/root/.openclaw/workspace/market-regime-identifier')
			
 
				+
			
 
				+import numpy as np
			
 
				+import pandas as pd
			
 
				+from cyb50_market_classifier import fetch_cyb50_data, calculate_features, define_market_regime
			
 
				+from sklearn.ensemble import RandomForestClassifier
			
 
				+import warnings
			
 
				+warnings.filterwarnings('ignore')
			
 
				+
			
 
				+# 获取数据
			
 
				+df = fetch_cyb50_data('2024-01-01', '2026-03-06')
			
 
				+if df is None:
			
 
				+    exit(1)
			
 
				+
			
 
				+# 计算特征和标签
			
 
				+features = calculate_features(df)
			
 
				+labels = define_market_regime(df, lookback=10)
			
 
				+
			
 
				+# 训练模型
			
 
				+valid_idx = ~np.isnan(labels)
			
 
				+X = features[valid_idx]
			
 
				+y = labels[valid_idx]
			
 
				+
			
 
				+clf = RandomForestClassifier(
			
 
				+    n_estimators=100, max_depth=10, min_samples_split=20,
			
 
				+    min_samples_leaf=10, random_state=42, class_weight='balanced'
			
 
				+)
			
 
				+clf.fit(X, y)
			
 
				+
			
 
				+# 预测所有数据
			
 
				+states = clf.predict(X)
			
 
				+probs = clf.predict_proba(X)
			
 
				+
			
 
				+# 对齐数据
			
 
				+df_aligned = df.iloc[-len(states):].copy()
			
 
				+df_aligned['state'] = states
			
 
				+df_aligned['prob_ranging'] = probs[:, 0]
			
 
				+df_aligned['prob_trend'] = probs[:, 1]
			
 
				+df_aligned['prob_reversal'] = probs[:, 2]
			
 
				+
			
 
				+# 获取最近60天
			
 
				+last_60 = df_aligned.tail(60).copy()
			
 
				+last_60['date'] = last_60.index.strftime('%m-%d')
			
 
				+last_60['change'] = last_60['close'].pct_change() * 100
			
 
				+
			
 
				+state_names = ['震荡', '趋势', '反转']
			
 
				+colors = ['#2196F3', '#4CAF50', '#FF5722']
			
 
				+
			
 
				+# 生成HTML
			
 
				+html_rows = ""
			
 
				+for idx, row in last_60.iterrows():
			
 
				+    state = int(row['state'])
			
 
				+    state_name = state_names[state]
			
 
				+    color = colors[state]
			
 
				+    change = row['change'] if not pd.isna(row['change']) else 0
			
 
				+    change_str = f"{change:+.2f}%" if change != 0 else "-"
			
 
				+    change_color = "green" if change > 0 else "red" if change < 0 else "gray"
			
 
				+    
			
 
				+    html_rows += f"""
			
 
				+        <tr>
			
 
				+            <td>{idx.strftime('%Y-%m-%d')}</td>
			
 
				+            <td>{row['close']:.2f}</td>
			
 
				+            <td style="color: {color}; font-weight: bold;">{state_name}</td>
			
 
				+            <td>{row['prob_ranging']:.1%}</td>
			
 
				+            <td>{row['prob_trend']:.1%}</td>
			
 
				+            <td>{row['prob_reversal']:.1%}</td>
			
 
				+            <td style="color: {change_color};">{change_str}</td>
			
 
				+        </tr>
			
 
				+    """
			
 
				+
			
 
				+# 计算统计
			
 
				+summary = f"""
			
 
				+    <div class="summary">
			
 
				+        <h2>📊 最近60天统计</h2>
			
 
				+        <p><strong>统计区间:</strong> {last_60.index[0].date()} ~ {last_60.index[-1].date()}</p>
			
 
				+        <p><strong>起始价格:</strong> {last_60['close'].iloc[0]:.2f}</p>
			
 
				+        <p><strong>结束价格:</strong> {last_60['close'].iloc[-1]:.2f}</p>
			
 
				+        <p><strong>区间涨跌:</strong> {(last_60['close'].iloc[-1]/last_60['close'].iloc[0]-1)*100:+.2f}%</p>
			
 
				+        <p><strong>最高价:</strong> {last_60['close'].max():.2f} ({last_60['close'].idxmax().strftime('%m-%d')})</p>
			
 
				+        <p><strong>最低价:</strong> {last_60['close'].min():.2f} ({last_60['close'].idxmin().strftime('%m-%d')})</p>
			
 
				+        <br>
			
 
				+        <p><strong>状态分布:</strong></p>
			
 
				+        <p>🟦 震荡: {(last_60['state']==0).sum()}天 ({(last_60['state']==0).sum()/60*100:.1f}%)</p>
			
 
				+        <p>🟩 趋势: {(last_60['state']==1).sum()}天 ({(last_60['state']==1).sum()/60*100:.1f}%)</p>
			
 
				+        <p>🟧 反转: {(last_60['state']==2).sum()}天 ({(last_60['state']==2).sum()/60*100:.1f}%)</p>
			
 
				+    </div>
			
 
				+"""
			
 
				+
			
 
				+html = f"""
			
 
				+<html>
			
 
				+<head>
			
 
				+    <meta charset="utf-8">
			
 
				+    <style>
			
 
				+        body {{ font-family: Arial, sans-serif; margin: 20px; font-size: 12px; }}
			
 
				+        h1 {{ color: #333; border-bottom: 3px solid #2196F3; padding-bottom: 10px; font-size: 18px; }}
			
 
				+        h2 {{ color: #555; margin-top: 20px; border-left: 4px solid #4CAF50; padding-left: 10px; font-size: 14px; }}
			
 
				+        .summary {{ background: #f5f5f5; padding: 15px; border-radius: 5px; margin: 20px 0; }}
			
 
				+        .summary p {{ margin: 5px 0; }}
			
 
				+        table {{ width: 100%; border-collapse: collapse; margin: 20px 0; font-size: 11px; }}
			
 
				+        th {{ background: #2196F3; color: white; padding: 8px; text-align: center; position: sticky; top: 0; }}
			
 
				+        td {{ padding: 6px 8px; border-bottom: 1px solid #ddd; text-align: center; }}
			
 
				+        tr:nth-child(even) {{ background: #f8f9fa; }}
			
 
				+        tr:hover {{ background: #e3f2fd; }}
			
 
				+        .table-container {{ max-height: 500px; overflow-y: auto; }}
			
 
				+    </style>
			
 
				+</head>
			
 
				+<body>
			
 
				+    <h1>📊 创业板50最近60天详细数据 (2026-01-06 ~ 2026-03-06)</h1>
			
 
				+    {summary}
			
 
				+    
			
 
				+    <h2>📋 每日详细数据</h2>
			
 
				+    <div class="table-container">
			
 
				+    <table>
			
 
				+        <thead>
			
 
				+            <tr>
			
 
				+                <th>日期</th>
			
 
				+                <th>收盘价</th>
			
 
				+                <th>状态</th>
			
 
				+                <th>震荡概率</th>
			
 
				+                <th>趋势概率</th>
			
 
				+                <th>反转概率</th>
			
 
				+                <th>日涨跌</th>
			
 
				+            </tr>
			
 
				+        </thead>
			
 
				+        <tbody>
			
 
				+            {html_rows}
			
 
				+        </tbody>
			
 
				+    </table>
			
 
				+    </div>
			
 
				+    
			
 
				+    <hr>
			
 
				+    <p style="color: #666; font-size: 11px;">
			
 
				+        生成时间: 2026-03-06 19:10<br>
			
 
				+        数据更新至: 2026-03-06<br>
			
 
				+        模型准确率: 72.10%
			
 
				+    </p>
			
 
				+</body>
			
 
				+</html>
			
 
				+"""
			
 
				+
			
 
				+# 保存HTML
			
 
				+with open('/root/.openclaw/workspace/market-regime-identifier/last_60_days_report.html', 'w', encoding='utf-8') as f:
			
 
				+    f.write(html)
			
 
				+
			
 
				+print("✓ HTML报告已生成")
			
 
				+print(f"最近60天: {last_60.index[0].date()} ~ {last_60.index[-1].date()}")
			
 
				+print(f"\n状态分布:")
			
 
				+print(f"  震荡: {(last_60['state']==0).sum()}天")
			
 
				+print(f"  趋势: {(last_60['state']==1).sum()}天")
			
 
				+print(f"  反转: {(last_60['state']==2).sum()}天")
			
--- a/market-regime-identifier/generate_regime_chart.py
+++ b/market-regime-identifier/generate_regime_chart.py
@@ -0,0 +1,192 @@
 
				+#!/usr/bin/env python3
			
 
				+# -*- coding: utf-8 -*-
			
 
				+"""
			
 
				+生成2024-2025年市场状态识别完整图表
			
 
				+"""
			
 
				+
			
 
				+import sys
			
 
				+sys.path.insert(0, '/root/.openclaw/workspace/market-regime-identifier')
			
 
				+
			
 
				+import numpy as np
			
 
				+import pandas as pd
			
 
				+import matplotlib.pyplot as plt
			
 
				+import matplotlib.dates as mdates
			
 
				+from cyb50_market_classifier import fetch_cyb50_data, calculate_features, define_market_regime
			
 
				+import pickle
			
 
				+import warnings
			
 
				+warnings.filterwarnings('ignore')
			
 
				+
			
 
				+# 设置中文字体
			
 
				+plt.rcParams['font.sans-serif'] = ['DejaVu Sans']
			
 
				+plt.rcParams['axes.unicode_minus'] = False
			
 
				+
			
 
				+print("="*70)
			
 
				+print("生成2024年至今市场状态识别图表")
			
 
				+print("="*70)
			
 
				+
			
 
				+# 获取数据
			
 
				+df = fetch_cyb50_data('2024-01-01', '2026-03-06')
			
 
				+if df is None:
			
 
				+    exit(1)
			
 
				+
			
 
				+print(f"\n数据范围: {df.index[0].date()} ~ {df.index[-1].date()}")
			
 
				+
			
 
				+# 计算特征和标签
			
 
				+features = calculate_features(df)
			
 
				+labels = define_market_regime(df, lookback=10)
			
 
				+
			
 
				+# 训练模型
			
 
				+valid_idx = ~np.isnan(labels)
			
 
				+X = features[valid_idx]
			
 
				+y = labels[valid_idx]
			
 
				+
			
 
				+from sklearn.ensemble import RandomForestClassifier
			
 
				+clf = RandomForestClassifier(
			
 
				+    n_estimators=100,
			
 
				+    max_depth=10,
			
 
				+    min_samples_split=20,
			
 
				+    min_samples_leaf=10,
			
 
				+    random_state=42,
			
 
				+    class_weight='balanced'
			
 
				+)
			
 
				+clf.fit(X, y)
			
 
				+
			
 
				+# 预测所有数据
			
 
				+states = clf.predict(X)
			
 
				+probs = clf.predict_proba(X)
			
 
				+
			
 
				+# 对齐数据
			
 
				+df_aligned = df.iloc[-len(states):].copy()
			
 
				+df_aligned['state'] = states
			
 
				+df_aligned['state_prob'] = [p[s] for s, p in zip(states, probs)]
			
 
				+df_aligned['prob_ranging'] = probs[:, 0]  # 震荡概率
			
 
				+df_aligned['prob_trend'] = probs[:, 1]    # 趋势概率
			
 
				+df_aligned['prob_reversal'] = probs[:, 2] # 反转概率
			
 
				+
			
 
				+# 生成图表
			
 
				+fig, axes = plt.subplots(3, 1, figsize=(16, 12))
			
 
				+
			
 
				+state_names = ['Ranging', 'Trend', 'Reversal']
			
 
				+colors = ['#2196F3', '#4CAF50', '#FF5722']  # 蓝、绿、橙
			
 
				+
			
 
				+# 图1: 价格走势 + 状态标记
			
 
				+ax1 = axes[0]
			
 
				+for i, (name, color) in enumerate(zip(state_names, colors)):
			
 
				+    mask = df_aligned['state'] == i
			
 
				+    if mask.any():
			
 
				+        ax1.scatter(df_aligned.index[mask], df_aligned['close'][mask], 
			
 
				+                   c=color, label=name, alpha=0.7, s=30)
			
 
				+
			
 
				+ax1.plot(df_aligned.index, df_aligned['close'], 'k-', alpha=0.3, linewidth=0.5)
			
 
				+ax1.set_ylabel('Price', fontsize=12)
			
 
				+ax1.set_title('CYB50 Market Regime Identification 2024-2025', fontsize=14, fontweight='bold')
			
 
				+ax1.legend(loc='upper left')
			
 
				+ax1.grid(True, alpha=0.3)
			
 
				+
			
 
				+# 添加关键点位标注
			
 
				+for idx, row in df_aligned.iterrows():
			
 
				+    if idx.month == 1 and idx.day == 2:  # 年初
			
 
				+        ax1.annotate(f'{row["close"]:.0f}', 
			
 
				+                    xy=(idx, row['close']), 
			
 
				+                    xytext=(10, 10), textcoords='offset points',
			
 
				+                    fontsize=8, alpha=0.7)
			
 
				+
			
 
				+# 图2: 状态概率时间序列
			
 
				+ax2 = axes[1]
			
 
				+ax2.fill_between(df_aligned.index, 0, df_aligned['prob_ranging'], 
			
 
				+                 alpha=0.5, label='Ranging', color=colors[0])
			
 
				+ax2.fill_between(df_aligned.index, df_aligned['prob_ranging'], 
			
 
				+                 df_aligned['prob_ranging'] + df_aligned['prob_trend'],
			
 
				+                 alpha=0.5, label='Trend', color=colors[1])
			
 
				+ax2.fill_between(df_aligned.index, 
			
 
				+                 df_aligned['prob_ranging'] + df_aligned['prob_trend'], 1,
			
 
				+                 alpha=0.5, label='Reversal', color=colors[2])
			
 
				+
			
 
				+ax2.set_ylabel('Probability', fontsize=12)
			
 
				+ax2.set_title('State Probability Over Time', fontsize=12)
			
 
				+ax2.legend(loc='upper left')
			
 
				+ax2.grid(True, alpha=0.3)
			
 
				+ax2.set_ylim(0, 1)
			
 
				+
			
 
				+# 图3: 状态分布统计
			
 
				+ax3 = axes[2]
			
 
				+state_counts = df_aligned['state'].value_counts().sort_index()
			
 
				+bars = ax3.bar(range(3), state_counts.values, color=colors, alpha=0.7)
			
 
				+ax3.set_xticks(range(3))
			
 
				+ax3.set_xticklabels(state_names)
			
 
				+ax3.set_ylabel('Days', fontsize=12)
			
 
				+ax3.set_title('State Distribution 2024-2025', fontsize=12)
			
 
				+
			
 
				+# 添加数值标签
			
 
				+for i, (bar, count) in enumerate(zip(bars, state_counts.values)):
			
 
				+    pct = count / len(df_aligned) * 100
			
 
				+    ax3.text(bar.get_x() + bar.get_width()/2, bar.get_height() + 5,
			
 
				+             f'{count}d\n({pct:.1f}%)', 
			
 
				+             ha='center', va='bottom', fontsize=10)
			
 
				+
			
 
				+plt.tight_layout()
			
 
				+plt.savefig('/root/.openclaw/workspace/market-regime-identifier/cyb50_regime_2024_2025.png', 
			
 
				+            dpi=150, bbox_inches='tight')
			
 
				+print("\n✓ 图表已保存: cyb50_regime_2024_2025.png")
			
 
				+
			
 
				+# 生成详细报告
			
 
				+print("\n" + "="*70)
			
 
				+print("2024-2025年详细识别结果")
			
 
				+print("="*70)
			
 
				+
			
 
				+# 按月份统计
			
 
				+print("\n【月度统计】")
			
 
				+print(f"{'月份':<10} {'总天数':<8} {'震荡':<8} {'趋势':<8} {'反转':<8} {'主要状态':<10}")
			
 
				+print("-"*70)
			
 
				+
			
 
				+for year in [2024, 2025]:
			
 
				+    for month in range(1, 13):
			
 
				+        mask = (df_aligned.index.year == year) & (df_aligned.index.month == month)
			
 
				+        if not mask.any():
			
 
				+            continue
			
 
				+        
			
 
				+        month_data = df_aligned[mask]
			
 
				+        total = len(month_data)
			
 
				+        ranging = (month_data['state'] == 0).sum()
			
 
				+        trend = (month_data['state'] == 1).sum()
			
 
				+        reversal = (month_data['state'] == 2).sum()
			
 
				+        
			
 
				+        main_state = state_names[month_data['state'].mode()[0]]
			
 
				+        
			
 
				+        print(f"{year}-{month:02d}    {total:<8} {ranging:<8} {trend:<8} {reversal:<8} {main_state:<10}")
			
 
				+
			
 
				+# 关键点位
			
 
				+print("\n【关键点位标注】")
			
 
				+print(f"{'日期':<12} {'收盘价':<10} {'状态':<10} {'置信度':<10} {'说明':<20}")
			
 
				+print("-"*70)
			
 
				+
			
 
				+# 每月第一个交易日
			
 
				+for year in [2024, 2025]:
			
 
				+    for month in range(1, 13):
			
 
				+        mask = (df_aligned.index.year == year) & (df_aligned.index.month == month)
			
 
				+        if not mask.any():
			
 
				+            continue
			
 
				+        month_data = df_aligned[mask]
			
 
				+        first_day = month_data.iloc[0]
			
 
				+        
			
 
				+        date_str = month_data.index[0].strftime('%Y-%m-%d')
			
 
				+        price = first_day['close']
			
 
				+        state = state_names[int(first_day['state'])]
			
 
				+        prob = first_day['state_prob']
			
 
				+        
			
 
				+        # 简单说明
			
 
				+        if first_day['state'] == 0:
			
 
				+            desc = 'Consolidation'
			
 
				+        elif first_day['state'] == 1:
			
 
				+            if month_data['close'].iloc[-1] > price:
			
 
				+                desc = 'Uptrend'
			
 
				+            else:
			
 
				+                desc = 'Downtrend'
			
 
				+        else:
			
 
				+            desc = 'Reversal'
			
 
				+        
			
 
				+        print(f"{date_str:<12} {price:<10.2f} {state:<10} {prob:<10.2%} {desc:<20}")
			
 
				+
			
 
				+print("\n" + "="*70)
			
 
				+print("✓ 报告生成完成!")
			
 
				+print("="*70)
			
--- a/market-regime-identifier/rf_classifier_v3.pkl
+++ b/market-regime-identifier/rf_classifier_v3.pkl