test on original data

2025-05-26 14:55:03 +08:00
parent 3e94387dcb
commit b1f80099fe
1 changed files with 56 additions and 48 deletions
--- a/test_metatrend_comparison.py
+++ b/test_metatrend_comparison.py
@@ -28,6 +28,7 @@ from cycles.strategies.default_strategy import DefaultStrategy
 from cycles.IncStrategies.indicators.supertrend import SupertrendState, SupertrendCollection
 from cycles.Analysis.supertrend import Supertrends
 from cycles.backtest import Backtest
+from cycles.utils.storage import Storage

 # Configure logging
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
@@ -44,6 +45,7 @@ class MetaTrendComparisonTest:
        self.test_data = None
        self.original_results = None
        self.incremental_results = None
+        self.storage = Storage(logging=logger)
        
        # Supertrend parameters from original implementation
        self.supertrend_params = [
@@ -52,34 +54,44 @@ class MetaTrendComparisonTest:
            {"period": 11, "multiplier": 2.0}
        ]
    
-    def load_test_data(self, symbol: str = "BTCUSDT", limit: int = 500) -> pd.DataFrame:
+    def load_test_data(self, symbol: str = "BTCUSD", start_date: str = "2022-01-01", end_date: str = "2023-01-01", limit: int = None) -> pd.DataFrame:
        """
-        Load test data for comparison.
+        Load test data for comparison using the Storage class.
        
        Args:
-            symbol: Trading symbol to load
-            limit: Number of data points to load
+            symbol: Trading symbol to load (used for filename)
+            start_date: Start date in YYYY-MM-DD format
+            end_date: End date in YYYY-MM-DD format
+            limit: Optional limit on number of data points (applied after date filtering)
            
        Returns:
            DataFrame with OHLCV data
        """
-        logger.info(f"Loading test data for {symbol} (limit: {limit})")
+        logger.info(f"Loading test data for {symbol} from {start_date} to {end_date}")
        
        try:
-            # Try to load from existing data files
-            data_file = f"data/{symbol}_1m.csv"
-            if os.path.exists(data_file):
-                df = pd.read_csv(data_file)
-                df['timestamp'] = pd.to_datetime(df['timestamp'])
-                df.set_index('timestamp', inplace=True)
-                df = df.tail(limit)
-                logger.info(f"Loaded {len(df)} data points from {data_file}")
-            else:
-                # Generate synthetic data for testing if no real data available
-                logger.warning(f"No data file found at {data_file}, generating synthetic data")
-                df = self._generate_synthetic_data(limit)
+            # Use the Storage class to load data with date filtering
+            filename = "btcusd_1-min_data.csv"
            
-            # Ensure required columns
+            # Convert date strings to pandas datetime
+            start_dt = pd.to_datetime(start_date)
+            end_dt = pd.to_datetime(end_date)
+            
+            # Load data using Storage class
+            df = self.storage.load_data(filename, start_dt, end_dt)
+            
+            if df.empty:
+                raise ValueError(f"No data found for the specified date range: {start_date} to {end_date}")
+            
+            logger.info(f"Loaded {len(df)} data points from {start_date} to {end_date}")
+            logger.info(f"Date range in data: {df.index.min()} to {df.index.max()}")
+            
+            # Apply limit if specified
+            if limit is not None and len(df) > limit:
+                df = df.tail(limit)
+                logger.info(f"Limited data to last {limit} points")
+            
+            # Ensure required columns (Storage class should handle column name conversion)
            required_cols = ['open', 'high', 'low', 'close', 'volume']
            for col in required_cols:
                if col not in df.columns:
@@ -92,12 +104,20 @@ class MetaTrendComparisonTest:
            df_with_timestamp = df.reset_index()
            
            self.test_data = df_with_timestamp
+            logger.info(f"Test data prepared: {len(df_with_timestamp)} rows")
+            logger.info(f"Columns: {list(df_with_timestamp.columns)}")
+            logger.info(f"Sample data:\n{df_with_timestamp.head()}")
+            
            return df_with_timestamp
            
        except Exception as e:
            logger.error(f"Failed to load test data: {e}")
-            # Fallback to synthetic data
-            df = self._generate_synthetic_data(limit)
+            import traceback
+            traceback.print_exc()
+            
+            # Fallback to synthetic data if real data loading fails
+            logger.warning("Falling back to synthetic data generation")
+            df = self._generate_synthetic_data(limit or 1000)
            df_with_timestamp = df.reset_index()
            self.test_data = df_with_timestamp
            return df_with_timestamp
@@ -681,13 +701,15 @@ class MetaTrendComparisonTest:
        
        return timeline_df
    
-    def run_full_test(self, symbol: str = "BTCUSDT", limit: int = 500) -> bool:
+    def run_full_test(self, symbol: str = "BTCUSD", start_date: str = "2022-01-01", end_date: str = "2023-01-01", limit: int = None) -> bool:
        """
        Run the complete comparison test.
        
        Args:
            symbol: Trading symbol to test
-            limit: Number of data points to test
+            start_date: Start date in YYYY-MM-DD format
+            end_date: End date in YYYY-MM-DD format
+            limit: Optional limit on number of data points (applied after date filtering)
            
        Returns:
            True if all tests pass, False otherwise
@@ -698,7 +720,7 @@ class MetaTrendComparisonTest:
        
        try:
            # Load test data
-            self.load_test_data(symbol, limit)
+            self.load_test_data(symbol, start_date, end_date, limit)
            logger.info(f"Test data loaded: {len(self.test_data)} points")
            
            # Test original strategy
@@ -760,35 +782,21 @@ def main():
    """Run the MetaTrend comparison test."""
    test = MetaTrendComparisonTest()
    
-    # Run test with different data sizes
-    test_cases = [
-        ("BTCUSDT", 200),   # Small test
-        ("BTCUSDT", 500),   # Medium test
-        ("BTCUSDT", 1000),  # Large test
-    ]
+    # Run test with real BTCUSD data from 2022-01-01 to 2023-01-01
+    logger.info(f"\n{'='*80}")
+    logger.info(f"RUNNING METATREND COMPARISON TEST")
+    logger.info(f"Using real BTCUSD data from 2022-01-01 to 2023-01-01")
+    logger.info(f"{'='*80}")
    
-    all_passed = True
+    # Test with the full year of data (no limit)
+    passed = test.run_full_test("BTCUSD", "2022-01-01", "2023-01-01", limit=None)
    
-    for symbol, limit in test_cases:
-        logger.info(f"\n{'='*80}")
-        logger.info(f"RUNNING TEST CASE: {symbol} with {limit} data points")
-        logger.info(f"{'='*80}")
-        
-        passed = test.run_full_test(symbol, limit)
-        all_passed = all_passed and passed
-        
-        if not passed:
-            logger.error(f"Test case {symbol}:{limit} FAILED")
-            break
-        else:
-            logger.info(f"Test case {symbol}:{limit} PASSED")
-    
-    if all_passed:
-        logger.info("\n🎉 ALL TEST CASES PASSED!")
+    if passed:
+        logger.info("\n🎉 TEST PASSED! Incremental indicators match original strategy.")
    else:
-        logger.error("\n❌ SOME TEST CASES FAILED!")
+        logger.error("\n❌ TEST FAILED! Incremental indicators do not match original strategy.")
    
-    return all_passed
+    return passed


 if __name__ == "__main__":