├── services
    ├── __init__.py
    ├── __pycache__
    │   ├── __init__.cpython-313.pyc
    │   └── strategy_evolution_service.cpython-313.pyc
    ├── utils
    │   ├── __init__.py
    │   ├── circuit_breaker_monitor.py
    │   ├── exchange_interface.py
    │   ├── circuit_breaker.py
    │   ├── metrics.py
    │   └── monitoring.py
    ├── social_monitor_service.py
    └── genetic_algorithm.py
├── monitoring
    ├── grafana
    │   └── provisioning
    │   │   ├── datasources
    │   │       └── prometheus.yml
    │   │   └── dashboards
    │   │       └── dashboard.yml
    ├── logstash.conf
    ├── prometheus.yml
    └── alert_rules.yml
├── backtesting
    ├── __init__.py
    ├── README.md
    ├── social_data_provider.py
    └── backtest_engine.py
├── Dockerfile
├── requirements.txt
├── .env-sample
├── run_ai_model_services.py
├── tests
    ├── test_backtesting.py
    ├── test_strategy_evolution.py
    └── run_tests.py
├── trading_strategy.md
├── CHANGELOG.md
├── run_backtest.py
├── PRODUCTION_READINESS.md
├── docker-compose.yml
└── STRATEGY_EVOLUTION.md


/services/__init__.py:
--------------------------------------------------------------------------------
1 | # This file makes the services directory a Python package
2 | 


--------------------------------------------------------------------------------
/services/__pycache__/__init__.cpython-313.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zd87pl/ai-crypto-trader/HEAD/services/__pycache__/__init__.cpython-313.pyc


--------------------------------------------------------------------------------
/services/__pycache__/strategy_evolution_service.cpython-313.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zd87pl/ai-crypto-trader/HEAD/services/__pycache__/strategy_evolution_service.cpython-313.pyc


--------------------------------------------------------------------------------
/services/utils/__init__.py:
--------------------------------------------------------------------------------
1 | # Market Regime Detection Utils Package
2 | from services.utils.market_regime_detector import MarketRegimeDetector
3 | from services.utils.market_regime_data_collector import MarketRegimeDataCollector


--------------------------------------------------------------------------------
/monitoring/grafana/provisioning/datasources/prometheus.yml:
--------------------------------------------------------------------------------
1 | apiVersion: 1
2 | 
3 | datasources:
4 |   - name: Prometheus
5 |     type: prometheus
6 |     access: proxy
7 |     url: http://prometheus:9090
8 |     isDefault: true
9 |     editable: false


--------------------------------------------------------------------------------
/monitoring/grafana/provisioning/dashboards/dashboard.yml:
--------------------------------------------------------------------------------
 1 | apiVersion: 1
 2 | 
 3 | providers:
 4 |   - name: 'Default'
 5 |     orgId: 1
 6 |     folder: ''
 7 |     type: file
 8 |     disableDeletion: false
 9 |     editable: true
10 |     options:
11 |       path: /etc/grafana/provisioning/dashboards


--------------------------------------------------------------------------------
/backtesting/__init__.py:
--------------------------------------------------------------------------------
 1 | # Backtesting Framework
 2 | # Implements BACK-01/02/09: Backtesting environment with historical data
 3 | 
 4 | from .backtest_engine import BacktestEngine
 5 | from .data_manager import HistoricalDataManager
 6 | from .strategy_tester import StrategyTester
 7 | from .social_data_provider import SocialDataProvider
 8 | from .result_analyzer import ResultAnalyzer
 9 | 
10 | __all__ = [
11 |     'BacktestEngine',
12 |     'HistoricalDataManager',
13 |     'StrategyTester',
14 |     'SocialDataProvider',
15 |     'ResultAnalyzer',
16 | ]


--------------------------------------------------------------------------------
/monitoring/logstash.conf:
--------------------------------------------------------------------------------
 1 | input {
 2 |   file {
 3 |     path => "/app/logs/*.log"
 4 |     start_position => "beginning"
 5 |     sincedb_path => "/dev/null"
 6 |     codec => "json"
 7 |   }
 8 | }
 9 | 
10 | filter {
11 |   json {
12 |     source => "message"
13 |   }
14 |   date {
15 |     match => [ "timestamp", "yyyy-MM-dd HH:mm:ss,SSS" ]
16 |   }
17 |   grok {
18 |     match => { "message" => "\[%{WORD:service}\]" }
19 |   }
20 | }
21 | 
22 | output {
23 |   elasticsearch {
24 |     hosts => ["elasticsearch:9200"]
25 |     index => "crypto-trader-%{+YYYY.MM.dd}"
26 |   }
27 | }


--------------------------------------------------------------------------------
/Dockerfile:
--------------------------------------------------------------------------------
 1 | FROM python:3.9-slim
 2 | 
 3 | WORKDIR /app
 4 | 
 5 | # Install system dependencies including netcat
 6 | RUN apt-get update && \
 7 |     apt-get install -y --no-install-recommends \
 8 |     build-essential \
 9 |     netcat-traditional \
10 |     && rm -rf /var/lib/apt/lists/*
11 | 
12 | # Copy requirements first to leverage Docker cache
13 | COPY requirements.txt .
14 | RUN pip install --no-cache-dir -r requirements.txt
15 | 
16 | # Copy project files
17 | COPY . .
18 | 
19 | # Set environment variables
20 | ENV PYTHONUNBUFFERED=1
21 | 
22 | CMD ["python3", "run_trader.py"]
23 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
 1 | python-binance==1.0.16
 2 | pandas>=1.3.0
 3 | numpy>=1.21.0
 4 | scikit-learn>=0.24.2
 5 | ta>=0.7.0
 6 | websockets==10.4
 7 | openai>=1.0.0
 8 | redis>=5.0.0
 9 | aioredis>=2.0.0
10 | asyncio>=3.4.3
11 | python-dotenv>=1.0.0
12 | requests>=2.31.0
13 | aiohttp>=3.9.0
14 | ujson>=5.8.0
15 | flask>=2.0.0
16 | dash>=2.14.0
17 | plotly>=5.18.0
18 | dash-bootstrap-components>=1.5.0
19 | dash-fontawesome>=0.0.1
20 | 
21 | # Monitoring and Observability
22 | prometheus-client>=0.17.0
23 | structlog>=23.1.0
24 | python-json-logger>=2.0.7
25 | pythonjsonlogger>=0.1.0
26 | elasticapm>=6.16.0
27 | 
28 | # Security and Performance
29 | PyJWT>=2.8.0
30 | cryptography>=41.0.0
31 | redis[hiredis]>=5.0.0
32 | aiofiles>=23.2.0
33 | 
34 | # Backtesting Framework
35 | matplotlib>=3.5.0
36 | seaborn>=0.11.0
37 | pytest>=7.0.0
38 | networkx>=3.0.0
39 | 
40 | # Neural Networks and Deep Learning
41 | tensorflow>=2.10.0
42 | keras>=2.10.0
43 | tensorflow-probability>=0.18.0
44 | scikit-optimize>=0.9.0
45 | optuna>=3.0.0
46 | shap>=0.41.0
47 | 


--------------------------------------------------------------------------------
/monitoring/prometheus.yml:
--------------------------------------------------------------------------------
 1 | global:
 2 |   scrape_interval: 15s
 3 |   evaluation_interval: 15s
 4 |   scrape_timeout: 10s
 5 | 
 6 | rule_files:
 7 |   - "alert_rules.yml"
 8 | 
 9 | alerting:
10 |   alertmanagers:
11 |     - static_configs:
12 |         - targets: []
13 |       scheme: http
14 |       timeout: 10s
15 | 
16 | scrape_configs:
17 |   - job_name: "prometheus"
18 |     static_configs:
19 |       - targets: ["localhost:9090"]
20 | 
21 |   - job_name: "market-monitor"
22 |     static_configs:
23 |       - targets: ["market-monitor:8001"]
24 |     metrics_path: /metrics
25 |     scrape_interval: 15s
26 |     scrape_timeout: 10s
27 | 
28 |   - job_name: "social-monitor"
29 |     static_configs:
30 |       - targets: ["social-monitor:${SOCIAL_MONITOR_PORT}"]
31 |     metrics_path: /metrics
32 | 
33 |   - job_name: "ai-analyzer"
34 |     static_configs:
35 |       - targets: ["ai-analyzer:${AI_ANALYZER_PORT}"]
36 |     metrics_path: /metrics
37 | 
38 |   - job_name: "trade-executor"
39 |     static_configs:
40 |       - targets: ["trade-executor:${TRADE_EXECUTOR_PORT}"]
41 |     metrics_path: /metrics
42 | 
43 |   - job_name: "strategy-evolution"
44 |     static_configs:
45 |       - targets: ["strategy-evolution:${STRATEGY_EVOLUTION_PORT}"]
46 |     metrics_path: /metrics
47 | 
48 |   - job_name: "dashboard"
49 |     static_configs:
50 |       - targets: ["dashboard:8050"]
51 |     metrics_path: /metrics
52 | 
53 |   - job_name: "redis"
54 |     static_configs:
55 |       - targets: ["redis:6379"]
56 |     metrics_path: /metrics
57 | 
58 |   - job_name: "node-exporter"
59 |     static_configs:
60 |       - targets: ["node-exporter:9100"]
61 | 


--------------------------------------------------------------------------------
/.env-sample:
--------------------------------------------------------------------------------
 1 | # Binance API credentials
 2 | BINANCE_API_KEY=your_binance_api_key_here
 3 | BINANCE_API_SECRET=your_binance_api_secret_here
 4 | 
 5 | # OpenAI API credentials
 6 | OPENAI_API_KEY=your_openai_api_key_here
 7 | OPENAI_MODEL=gpt-4
 8 | 
 9 | # LunarCrush API credentials
10 | LUNARCRUSH_API_KEY=your_lunarcrush_api_key_here
11 | 
12 | # Cloudflare credentials
13 | CLOUDFLARE_API_TOKEN=your_cloudflare_api_token_here
14 | CLOUDFLARE_ACCOUNT_ID=your_cloudflare_account_id_here
15 | CLOUDFLARE_ZONE_ID=your_cloudflare_zone_id_here
16 | 
17 | # Service ports
18 | MARKET_MONITOR_PORT=8001
19 | TRADE_EXECUTOR_PORT=8002
20 | AI_ANALYZER_PORT=8003
21 | STRATEGY_EVOLUTION_PORT=8004
22 | SOCIAL_MONITOR_PORT=8005
23 | MODEL_REGISTRY_PORT=8006
24 | AI_EXPLAINABILITY_PORT=8007
25 | PORTFOLIO_RISK_PORT=8008
26 | 
27 | # Redis configuration
28 | REDIS_HOST=redis
29 | REDIS_PORT=6379
30 | REDIS_PASSWORD=
31 | 
32 | # Dashboard configuration
33 | DASHBOARD_PORT=8050
34 | DASHBOARD_THEME=CYBORG  # Available themes: CYBORG, DARKLY, SUPERHERO
35 | DASHBOARD_REFRESH_INTERVAL=5000  # milliseconds
36 | 
37 | # Trading pairs to monitor
38 | TRADING_PAIRS=BTCUSDC,ETHUSDC,SOLUSDC,BNBUSDC,AVAXUSDC
39 | 
40 | # Strategy Evolution Configuration
41 | STRATEGY_BACKTEST_DAYS=30
42 | STRATEGY_MIN_PROFIT_THRESHOLD=2.0
43 | STRATEGY_MAX_DRAWDOWN=10.0
44 | STRATEGY_MIN_TRADES=100
45 | STRATEGY_EVOLUTION_INTERVAL=24  # hours
46 | 
47 | # Risk management settings
48 | MAX_TRADE_AMOUNT_USDC=100
49 | PORTFOLIO_RISK_LEVEL=MEDIUM  # LOW, MEDIUM, HIGH
50 | STOP_LOSS_PERCENTAGE=5
51 | TAKE_PROFIT_PERCENTAGE=15
52 | 
53 | # Worker Configuration
54 | WORKER_MEMORY_LIMIT=128  # MB
55 | WORKER_CPU_LIMIT=10  # ms
56 | WORKER_TIMEOUT=10000  # ms
57 | WORKER_MAX_REQUESTS=1000
58 | 
59 | # Notification settings (optional)
60 | ENABLE_TELEGRAM_NOTIFICATIONS=false
61 | TELEGRAM_BOT_TOKEN=
62 | TELEGRAM_CHAT_ID=
63 | ENABLE_EMAIL_NOTIFICATIONS=false
64 | EMAIL_SMTP_SERVER=
65 | EMAIL_SMTP_PORT=
66 | EMAIL_USERNAME=
67 | EMAIL_PASSWORD=
68 | EMAIL_RECIPIENT=
69 | 


--------------------------------------------------------------------------------
/run_ai_model_services.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python3
  2 | import os
  3 | import sys
  4 | import asyncio
  5 | import argparse
  6 | import logging as logger
  7 | from typing import Dict, List
  8 | from datetime import datetime
  9 | 
 10 | # Configure logging
 11 | logger.basicConfig(
 12 |     level=logger.INFO,
 13 |     format='%(asctime)s - %(levelname)s - %(message)s',
 14 |     handlers=[
 15 |         logger.FileHandler(f'logs/ai_model_services_{datetime.now().strftime("%Y%m%d_%H%M%S")}.log'),
 16 |         logger.StreamHandler(sys.stdout)
 17 |     ]
 18 | )
 19 | 
 20 | # Import services
 21 | try:
 22 |     from services.model_registry_service import ModelRegistryService
 23 |     from services.ai_explainability_service import AIExplainabilityService
 24 | except ImportError as e:
 25 |     logger.error(f"Error importing services: {str(e)}")
 26 |     logger.error("Make sure you're running from the project root directory")
 27 |     sys.exit(1)
 28 | 
 29 | async def run_services(args):
 30 |     """Run the AI model services"""
 31 |     services = []
 32 |     tasks = []
 33 | 
 34 |     try:
 35 |         # Start model registry if requested
 36 |         if args.model_registry:
 37 |             logger.info("Starting Model Registry Service...")
 38 |             model_registry = ModelRegistryService()
 39 |             services.append(model_registry)
 40 |             tasks.append(asyncio.create_task(model_registry.run()))
 41 |             
 42 |         # Start AI explainability service if requested
 43 |         if args.explainability:
 44 |             logger.info("Starting AI Explainability Service...")
 45 |             ai_explainability = AIExplainabilityService()
 46 |             services.append(ai_explainability)
 47 |             tasks.append(asyncio.create_task(ai_explainability.run()))
 48 |             
 49 |         if not tasks:
 50 |             logger.error("No services specified to run. Use --model-registry or --explainability")
 51 |             return
 52 |             
 53 |         # Run all services
 54 |         logger.info(f"Running {len(tasks)} services...")
 55 |         await asyncio.gather(*tasks)
 56 |             
 57 |     except KeyboardInterrupt:
 58 |         logger.info("Keyboard interrupt received, shutting down services...")
 59 |         
 60 |     except Exception as e:
 61 |         logger.error(f"Error running services: {str(e)}")
 62 |         
 63 |     finally:
 64 |         # Stop all services
 65 |         for service in services:
 66 |             try:
 67 |                 await service.stop()
 68 |             except Exception as e:
 69 |                 logger.error(f"Error stopping service: {str(e)}")
 70 |                 
 71 |         logger.info("All services stopped")
 72 | 
 73 | def setup_parser() -> argparse.ArgumentParser:
 74 |     """Setup command line argument parser"""
 75 |     parser = argparse.ArgumentParser(description='AI Model Services CLI')
 76 |     
 77 |     parser.add_argument('--model-registry', action='store_true', help='Run the Model Registry Service')
 78 |     parser.add_argument('--explainability', action='store_true', help='Run the AI Explainability Service')
 79 |     parser.add_argument('--all', action='store_true', help='Run all services')
 80 |     
 81 |     return parser
 82 | 
 83 | def main():
 84 |     # Ensure logs directory exists
 85 |     os.makedirs('logs', exist_ok=True)
 86 |     
 87 |     # Parse command line arguments
 88 |     parser = setup_parser()
 89 |     args = parser.parse_args()
 90 |     
 91 |     # If --all is specified, enable all services
 92 |     if args.all:
 93 |         args.model_registry = True
 94 |         args.explainability = True
 95 |     
 96 |     # Run the services
 97 |     try:
 98 |         asyncio.run(run_services(args))
 99 |     except KeyboardInterrupt:
100 |         logger.info("Keyboard interrupt received in main")
101 |     except Exception as e:
102 |         logger.error(f"Error in main: {str(e)}")
103 |         return 1
104 |         
105 |     return 0
106 | 
107 | if __name__ == "__main__":
108 |     sys.exit(main())


--------------------------------------------------------------------------------
/backtesting/README.md:
--------------------------------------------------------------------------------
  1 | # Backtesting Framework
  2 | 
  3 | This directory contains the backtesting framework for the AI Crypto Trader system. The framework allows you to:
  4 | 
  5 | 1. Fetch and manage historical market data from Binance
  6 | 2. Integrate historical social metrics data from LunarCrush
  7 | 3. Backtest the current AI trading strategy with various parameters
  8 | 4. Analyze and visualize backtest results
  9 | 
 10 | ## Components
 11 | 
 12 | The framework consists of several key components:
 13 | 
 14 | - **HistoricalDataManager**: Fetches, stores, and manages historical market and social data
 15 | - **SocialDataProvider**: Manages social metrics data for backtesting
 16 | - **StrategyTester**: Tests trading strategies against historical data
 17 | - **ResultAnalyzer**: Analyzes and visualizes backtest results
 18 | - **BacktestEngine**: Coordinates the backtesting process
 19 | 
 20 | ## Directory Structure
 21 | 
 22 | ```
 23 | backtesting/
 24 | ├── __init__.py              # Package initialization
 25 | ├── README.md                # This documentation file
 26 | ├── backtest_engine.py       # Main orchestration engine
 27 | ├── data_manager.py          # Historical data management
 28 | ├── result_analyzer.py       # Results analysis and visualization
 29 | ├── social_data_provider.py  # Social metrics integration
 30 | ├── strategy_tester.py       # Strategy testing logic
 31 | ├── data/                    # Storage for historical data
 32 | │   ├── market/              # Market data for each symbol
 33 | │   └── social/              # Social metrics data for each symbol
 34 | ├── results/                 # Storage for backtest results
 35 | └── plots/                   # Storage for generated plots and visualizations
 36 | ```
 37 | 
 38 | ## Command-line Interface
 39 | 
 40 | The framework provides a command-line interface through `run_backtest.py`. Here are the available commands:
 41 | 
 42 | ### Fetch Historical Data
 43 | 
 44 | ```bash
 45 | python run_backtest.py fetch --symbols BTCUSDC ETHUSDC --intervals 1h 4h --days 60
 46 | ```
 47 | 
 48 | This command fetches 60 days of historical market and social data for BTC and ETH in both 1-hour and 4-hour intervals.
 49 | 
 50 | Options:
 51 | - `--symbols`: One or more trading pairs (required)
 52 | - `--intervals`: One or more timeframe intervals (default: 1h)
 53 | - `--days`: Number of days to fetch (default: 30)
 54 | - `--no-social`: Skip fetching social data
 55 | 
 56 | ### Run Backtests
 57 | 
 58 | ```bash
 59 | python run_backtest.py backtest --symbols BTCUSDC --intervals 1h 4h --days 30 --balance 10000
 60 | ```
 61 | 
 62 | This command runs backtests for BTC with 1-hour and 4-hour intervals over the past 30 days, starting with a $10,000 balance.
 63 | 
 64 | Options:
 65 | - `--symbols`: One or more trading pairs to backtest (required)
 66 | - `--intervals`: One or more timeframe intervals (default: 1h)
 67 | - `--days`: Number of days to backtest (default: 30)
 68 | - `--balance`: Initial balance for backtest (default: 10000.0)
 69 | - `--start-date`: Start date in YYYY-MM-DD format (overrides --days)
 70 | - `--end-date`: End date in YYYY-MM-DD format (defaults to today)
 71 | 
 72 | ### List Available Data
 73 | 
 74 | ```bash
 75 | python run_backtest.py list --symbols BTCUSDC --intervals 1h
 76 | ```
 77 | 
 78 | This command lists available historical data, optionally filtered by symbols and intervals.
 79 | 
 80 | Options:
 81 | - `--symbols`: Filter by one or more symbols
 82 | - `--intervals`: Filter by one or more intervals
 83 | 
 84 | ### Analyze Results
 85 | 
 86 | ```bash
 87 | python run_backtest.py analyze --metric sharpe_ratio
 88 | ```
 89 | 
 90 | This command analyzes all available backtest results, comparing them by Sharpe ratio.
 91 | 
 92 | Options:
 93 | - `--results`: Specific result file(s) to analyze
 94 | - `--symbols`: Filter results by symbol(s)
 95 | - `--intervals`: Filter results by interval(s)
 96 | - `--metric`: Metric to compare (default: return_pct)
 97 | 
 98 | ## Advanced Usage
 99 | 
100 | ### Implementing Custom Strategies
101 | 
102 | To implement and test a custom strategy, you would need to:
103 | 
104 | 1. Create a new strategy class in `backtesting/strategies/`
105 | 2. Implement the required interface methods
106 | 3. Register your strategy with the `StrategyTester` class
107 | 4. Run backtests using your custom strategy
108 | 
109 | ### Integration with AI Models
110 | 
111 | The backtesting framework integrates with the existing AI Trader:
112 | 
113 | 1. Historical market data is processed using the same technical indicators
114 | 2. Historical social metrics are included when available
115 | 3. The AI trader's decision logic is applied as in live trading
116 | 4. Results are stored for analysis and optimization
117 | 
118 | ## Visualization Examples
119 | 
120 | The backtesting framework generates visualizations for:
121 | 
122 | 1. Equity curves showing account growth over time
123 | 2. Drawdown analysis
124 | 3. Trade analysis showing win/loss ratios, trade durations, etc.
125 | 4. Performance comparisons across different parameters and time periods
126 | 
127 | ## Configuration
128 | 
129 | The framework uses the same configuration file as the main trading system (`config.json`), with the following key configuration options:
130 | 
131 | - Connection settings for data sources
132 | - Technical indicator parameters
133 | - Trading strategy parameters
134 | - Risk management settings
135 | - Performance metrics thresholds


--------------------------------------------------------------------------------
/tests/test_backtesting.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import sys
  3 | import json
  4 | import asyncio
  5 | import unittest
  6 | from datetime import datetime, timedelta
  7 | import pandas as pd
  8 | from pathlib import Path
  9 | 
 10 | # Add project root to path
 11 | sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
 12 | 
 13 | from backtesting.data_manager import HistoricalDataManager
 14 | from backtesting.social_data_provider import SocialDataProvider
 15 | from backtesting.strategy_tester import StrategyTester
 16 | from backtesting.result_analyzer import ResultAnalyzer
 17 | 
 18 | class TestBacktesting(unittest.TestCase):
 19 |     
 20 |     def setUp(self):
 21 |         """Set up test environment"""
 22 |         # Create test data directories
 23 |         self.test_dir = Path('test_backtesting_data')
 24 |         self.test_dir.mkdir(exist_ok=True)
 25 |         
 26 |         # Initialize components with test configuration
 27 |         self.data_manager = HistoricalDataManager('config.json')
 28 |         self.social_provider = SocialDataProvider(self.data_manager)
 29 |         self.strategy_tester = StrategyTester('config.json')
 30 |         self.result_analyzer = ResultAnalyzer()
 31 |         
 32 |     def tearDown(self):
 33 |         """Clean up after tests"""
 34 |         # Remove test data if needed
 35 |         pass
 36 |         
 37 |     async def test_data_manager_initialization(self):
 38 |         """Test data manager initialization"""
 39 |         # Verify data directories were created
 40 |         self.assertTrue(self.data_manager.market_data_dir.exists())
 41 |         self.assertTrue(self.data_manager.social_data_dir.exists())
 42 |         
 43 |     async def test_basic_market_data_structure(self):
 44 |         """Test that market data structure is correct"""
 45 |         # Create a minimal test DataFrame
 46 |         test_data = pd.DataFrame({
 47 |             'timestamp': [datetime.now() - timedelta(minutes=i) for i in range(10)],
 48 |             'open': [100 + i for i in range(10)],
 49 |             'high': [110 + i for i in range(10)],
 50 |             'low': [90 + i for i in range(10)],
 51 |             'close': [105 + i for i in range(10)],
 52 |             'volume': [1000 * (i + 1) for i in range(10)]
 53 |         })
 54 |         
 55 |         # Set timestamp as index
 56 |         test_data.set_index('timestamp', inplace=True)
 57 |         
 58 |         # Ensure data_manager handles this structure
 59 |         # This is a basic structure test, not a data processing test
 60 |         self.assertEqual(test_data.shape[1], 5)  # 5 columns (OHLCV)
 61 |         
 62 |     async def test_social_data_default_values(self):
 63 |         """Test default values for social data provider"""
 64 |         # Get default metrics
 65 |         default_metrics = self.social_provider.default_metrics
 66 |         
 67 |         # Check that default sentiment is neutral (0.5)
 68 |         self.assertEqual(default_metrics['social_sentiment'], 0.5)
 69 |         
 70 |         # Check that required metrics exist
 71 |         required_metrics = ['social_volume', 'social_engagement', 'social_contributors', 'social_sentiment']
 72 |         for metric in required_metrics:
 73 |             self.assertIn(metric, default_metrics)
 74 |             
 75 |     async def test_strategy_tester_initialization(self):
 76 |         """Test strategy tester initialization"""
 77 |         # Check that stats are properly initialized
 78 |         self.assertEqual(self.strategy_tester.stats['initial_balance'], 0.0)
 79 |         self.assertEqual(self.strategy_tester.stats['final_balance'], 0.0)
 80 |         self.assertEqual(self.strategy_tester.stats['total_trades'], 0)
 81 |         
 82 |         # Check that the strategy tester has a valid AI trader
 83 |         self.assertIsNotNone(self.strategy_tester.ai_trader)
 84 |         
 85 |     async def test_result_analyzer_initialization(self):
 86 |         """Test result analyzer initialization"""
 87 |         # Check that plots directory was created
 88 |         self.assertTrue(self.result_analyzer.plots_dir.exists())
 89 |         
 90 | def run_tests():
 91 |     """Run all tests"""
 92 |     async def run_async_tests():
 93 |         # Create test suite
 94 |         suite = unittest.TestSuite()
 95 |         
 96 |         # Create test instance
 97 |         test_case = TestBacktesting()
 98 |         
 99 |         # Set up test case
100 |         test_case.setUp()
101 |         
102 |         # Add tests
103 |         for method_name in dir(test_case):
104 |             if method_name.startswith('test_') and callable(getattr(test_case, method_name)):
105 |                 if method_name.startswith('test_async_'):
106 |                     continue  # Skip async tests for now
107 |                 test_method = getattr(test_case, method_name)
108 |                 if asyncio.iscoroutinefunction(test_method):
109 |                     # Convert async test to sync for unittest
110 |                     setattr(test_case, method_name, lambda test_method=test_method: asyncio.run(test_method()))
111 |                 
112 |         suite.addTest(test_case)
113 |         
114 |         # Run tests
115 |         runner = unittest.TextTestRunner()
116 |         runner.run(suite)
117 |         
118 |         # Clean up
119 |         test_case.tearDown()
120 |     
121 |     # Run async tests
122 |     asyncio.run(run_async_tests())
123 | 
124 | if __name__ == '__main__':
125 |     run_tests()


--------------------------------------------------------------------------------
/tests/test_strategy_evolution.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import sys
  3 | import json
  4 | import asyncio
  5 | import unittest
  6 | from datetime import datetime, timedelta
  7 | 
  8 | # Add project root to path
  9 | sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
 10 | 
 11 | from services.strategy_evolution_service import StrategyEvolutionService
 12 | 
 13 | class TestStrategyEvolution(unittest.TestCase):
 14 |     async def asyncSetUp(self):
 15 |         """Set up test environment"""
 16 |         # Load test configuration
 17 |         with open('config.json', 'r') as f:
 18 |             self.config = json.load(f)
 19 | 
 20 |         # Initialize service
 21 |         self.service = StrategyEvolutionService()
 22 | 
 23 |         # Test parameters
 24 |         self.test_params = {
 25 |             'type': 'mean_reversion',
 26 |             'timeframe': '5m',
 27 |             'risk_limit': 1.5,
 28 |             'target_profit': 1.0,
 29 |             'max_position_size': 5
 30 |         }
 31 | 
 32 |     async def test_strategy_generation(self):
 33 |         """Test strategy generation"""
 34 |         # Generate strategy
 35 |         strategy_code = await self.service.generate_strategy(self.test_params)
 36 |         
 37 |         # Verify strategy code
 38 |         self.assertIsNotNone(strategy_code)
 39 |         self.assertIn('async fetch(request, env)', strategy_code)
 40 |         self.assertIn('export default', strategy_code)
 41 | 
 42 |     async def test_strategy_deployment(self):
 43 |         """Test strategy deployment to Cloudflare"""
 44 |         # Generate and deploy strategy
 45 |         strategy_code = await self.service.generate_strategy(self.test_params)
 46 |         worker_id = await self.service.deploy_strategy(strategy_code)
 47 |         
 48 |         # Verify deployment
 49 |         self.assertIsNotNone(worker_id)
 50 |         self.assertTrue(worker_id in self.service.active_strategies)
 51 | 
 52 |     async def test_strategy_monitoring(self):
 53 |         """Test strategy performance monitoring"""
 54 |         # Deploy strategy
 55 |         strategy_code = await self.service.generate_strategy(self.test_params)
 56 |         worker_id = await self.service.deploy_strategy(strategy_code)
 57 |         
 58 |         # Monitor performance
 59 |         performance = await self.service.monitor_strategy(worker_id)
 60 |         
 61 |         # Verify monitoring data
 62 |         self.assertIsNotNone(performance)
 63 |         self.assertIn('sharpe_ratio', performance)
 64 |         self.assertIn('drawdown', performance)
 65 |         self.assertIn('win_rate', performance)
 66 | 
 67 |     async def test_strategy_evolution(self):
 68 |         """Test strategy evolution process"""
 69 |         # Deploy initial strategy
 70 |         strategy_code = await self.service.generate_strategy(self.test_params)
 71 |         worker_id = await self.service.deploy_strategy(strategy_code)
 72 |         
 73 |         # Create test performance data
 74 |         test_performance = {
 75 |             'sharpe_ratio': 0.5,  # Below threshold to trigger evolution
 76 |             'drawdown': 20,
 77 |             'win_rate': 0.45,
 78 |             'profit_factor': 1.1,
 79 |             'total_trades': 100,
 80 |             'period_start': (datetime.now() - timedelta(days=7)).isoformat(),
 81 |             'period_end': datetime.now().isoformat()
 82 |         }
 83 |         
 84 |         # Evolve strategy
 85 |         improved_strategy = await self.service.evolve_strategy(worker_id, test_performance)
 86 |         
 87 |         # Verify evolution
 88 |         self.assertIsNotNone(improved_strategy)
 89 |         self.assertNotEqual(improved_strategy, strategy_code)
 90 | 
 91 |     async def test_complete_cycle(self):
 92 |         """Test complete strategy lifecycle"""
 93 |         # 1. Generate initial strategy
 94 |         strategy_code = await self.service.generate_strategy(self.test_params)
 95 |         self.assertIsNotNone(strategy_code)
 96 |         
 97 |         # 2. Deploy strategy
 98 |         worker_id = await self.service.deploy_strategy(strategy_code)
 99 |         self.assertIsNotNone(worker_id)
100 |         
101 |         # 3. Monitor performance
102 |         performance = await self.service.monitor_strategy(worker_id)
103 |         self.assertIsNotNone(performance)
104 |         
105 |         # 4. Trigger evolution
106 |         test_performance = {
107 |             'sharpe_ratio': 0.5,
108 |             'drawdown': 20,
109 |             'win_rate': 0.45
110 |         }
111 |         improved_strategy = await self.service.evolve_strategy(worker_id, test_performance)
112 |         self.assertIsNotNone(improved_strategy)
113 |         
114 |         # 5. Deploy improved version
115 |         new_worker_id = await self.service.deploy_strategy(improved_strategy)
116 |         self.assertIsNotNone(new_worker_id)
117 |         self.assertNotEqual(worker_id, new_worker_id)
118 | 
119 | def run_tests():
120 |     """Run all tests"""
121 |     async def run_async_tests():
122 |         # Create test suite
123 |         suite = unittest.TestSuite()
124 |         
125 |         # Create test instance
126 |         test_case = TestStrategyEvolution()
127 |         
128 |         # Set up test case
129 |         await test_case.asyncSetUp()
130 |         
131 |         # Add tests
132 |         suite.addTest(test_case)
133 |         
134 |         # Run tests
135 |         runner = unittest.TextTestRunner()
136 |         runner.run(suite)
137 |     
138 |     # Run async tests
139 |     asyncio.run(run_async_tests())
140 | 
141 | if __name__ == '__main__':
142 |     run_tests()
143 | 


--------------------------------------------------------------------------------
/tests/run_tests.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import sys
  3 | import json
  4 | import asyncio
  5 | import logging
  6 | from dotenv import load_dotenv
  7 | 
  8 | # Configure logging
  9 | logging.basicConfig(
 10 |     level=logging.INFO,
 11 |     format='%(asctime)s - %(levelname)s - %(message)s'
 12 | )
 13 | logger = logging.getLogger(__name__)
 14 | 
 15 | # Add project root to path
 16 | sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
 17 | 
 18 | class TestEnvironment:
 19 |     """Test environment setup and teardown"""
 20 |     
 21 |     @staticmethod
 22 |     def setup():
 23 |         """Set up test environment"""
 24 |         try:
 25 |             # Load environment variables
 26 |             load_dotenv('.env')
 27 |             
 28 |             # Verify required environment variables
 29 |             required_vars = [
 30 |                 'OPENAI_API_KEY',
 31 |                 'CLOUDFLARE_API_TOKEN',
 32 |                 'CLOUDFLARE_ACCOUNT_ID'
 33 |             ]
 34 |             
 35 |             missing_vars = [var for var in required_vars if not os.getenv(var)]
 36 |             if missing_vars:
 37 |                 raise ValueError(f"Missing required environment variables: {', '.join(missing_vars)}")
 38 |             
 39 |             # Create test config
 40 |             test_config = {
 41 |                 "trading_params": {
 42 |                     "min_volume_usdc": 10000,  # Lower for testing
 43 |                     "position_size": 0.05,     # Smaller for testing
 44 |                     "max_positions": 2,        # Fewer for testing
 45 |                     "stop_loss_pct": 1,
 46 |                     "take_profit_pct": 2,
 47 |                     "min_trade_amount": 10
 48 |                 },
 49 |                 "evolution": {
 50 |                     "min_sharpe_ratio": 1.0,
 51 |                     "max_drawdown": 20.0,
 52 |                     "min_win_rate": 0.5,
 53 |                     "min_profit_factor": 1.2,
 54 |                     "improvement_threshold": 0.1,
 55 |                     "max_iterations": 3,        # Fewer for testing
 56 |                     "convergence_criteria": 0.05
 57 |                 },
 58 |                 "worker_defaults": {
 59 |                     "memory_limit": "128MB",
 60 |                     "cpu_limit": "10ms",
 61 |                     "timeout": 5000            # Shorter for testing
 62 |                 }
 63 |             }
 64 |             
 65 |             # Save test config
 66 |             with open('tests/test_config.json', 'w') as f:
 67 |                 json.dump(test_config, f, indent=2)
 68 |             
 69 |             logger.info("Test environment setup completed")
 70 |             return True
 71 |             
 72 |         except Exception as e:
 73 |             logger.error(f"Error setting up test environment: {str(e)}")
 74 |             return False
 75 | 
 76 |     @staticmethod
 77 |     def teardown():
 78 |         """Clean up test environment"""
 79 |         try:
 80 |             # Remove test config
 81 |             if os.path.exists('tests/test_config.json'):
 82 |                 os.remove('tests/test_config.json')
 83 |             
 84 |             # Clean up any test workers
 85 |             # This would typically involve calling Cloudflare API to remove test workers
 86 |             
 87 |             logger.info("Test environment cleanup completed")
 88 |             return True
 89 |             
 90 |         except Exception as e:
 91 |             logger.error(f"Error cleaning up test environment: {str(e)}")
 92 |             return False
 93 | 
 94 | async def run_tests():
 95 |     """Run all tests"""
 96 |     try:
 97 |         # Set up test environment
 98 |         if not TestEnvironment.setup():
 99 |             logger.error("Failed to set up test environment")
100 |             return False
101 |         
102 |         # Import and run tests
103 |         from test_strategy_evolution import TestStrategyEvolution
104 |         
105 |         # Create test suite
106 |         import unittest
107 |         suite = unittest.TestSuite()
108 |         
109 |         # Create test instance
110 |         test_case = TestStrategyEvolution()
111 |         
112 |         # Set up test case
113 |         await test_case.asyncSetUp()
114 |         
115 |         # Add tests
116 |         test_methods = [
117 |             'test_strategy_generation',
118 |             'test_strategy_deployment',
119 |             'test_strategy_monitoring',
120 |             'test_strategy_evolution',
121 |             'test_complete_cycle'
122 |         ]
123 |         
124 |         for method in test_methods:
125 |             suite.addTest(TestStrategyEvolution(method))
126 |         
127 |         # Run tests
128 |         runner = unittest.TextTestRunner(verbosity=2)
129 |         result = runner.run(suite)
130 |         
131 |         # Clean up test environment
132 |         TestEnvironment.teardown()
133 |         
134 |         return result.wasSuccessful()
135 |         
136 |     except Exception as e:
137 |         logger.error(f"Error running tests: {str(e)}")
138 |         TestEnvironment.teardown()
139 |         return False
140 | 
141 | def main():
142 |     """Main entry point"""
143 |     try:
144 |         logger.info("Starting test run...")
145 |         success = asyncio.run(run_tests())
146 |         
147 |         if success:
148 |             logger.info("All tests passed successfully")
149 |             sys.exit(0)
150 |         else:
151 |             logger.error("Some tests failed")
152 |             sys.exit(1)
153 |             
154 |     except KeyboardInterrupt:
155 |         logger.info("Test run interrupted")
156 |         TestEnvironment.teardown()
157 |         sys.exit(1)
158 |     except Exception as e:
159 |         logger.error(f"Error in test runner: {str(e)}")
160 |         TestEnvironment.teardown()
161 |         sys.exit(1)
162 | 
163 | if __name__ == "__main__":
164 |     main()
165 | 


--------------------------------------------------------------------------------
/monitoring/alert_rules.yml:
--------------------------------------------------------------------------------
  1 | groups:
  2 |   - name: crypto-trader-alerts
  3 |     rules:
  4 |       # Service Health Alerts
  5 |       - alert: ServiceDown
  6 |         expr: crypto_trader_service_health == 0
  7 |         for: 1m
  8 |         labels:
  9 |           severity: critical
 10 |           service: "{{ $labels.service }}"
 11 |         annotations:
 12 |           summary: "Service {{ $labels.service }} is down"
 13 |           description: "Service {{ $labels.service }} has been down for more than 1 minute"
 14 | 
 15 |       # Trading Performance Alerts
 16 |       - alert: LowTradingVolume
 17 |         expr: rate(crypto_trader_trades_executed_total[5m]) < 0.1
 18 |         for: 5m
 19 |         labels:
 20 |           severity: warning
 21 |         annotations:
 22 |           summary: "Low trading volume detected"
 23 |           description: "Trading volume has been below 0.1 trades/minute for the last 5 minutes"
 24 | 
 25 |       - alert: HighErrorRate
 26 |         expr: rate(crypto_trader_errors_total[5m]) > 1
 27 |         for: 2m
 28 |         labels:
 29 |           severity: critical
 30 |         annotations:
 31 |           summary: "High error rate in {{ $labels.service }}"
 32 |           description: "Error rate in {{ $labels.service }} is above 1 error/minute for the last 2 minutes"
 33 | 
 34 |       # AI Model Performance Alerts
 35 |       - alert: LowAIModelConfidence
 36 |         expr: avg_over_time(crypto_trader_ai_model_confidence[10m]) < 0.5
 37 |         for: 5m
 38 |         labels:
 39 |           severity: warning
 40 |         annotations:
 41 |           summary: "Low AI model confidence for {{ $labels.symbol }}"
 42 |           description: "AI model confidence for {{ $labels.symbol }} has been below 50% for 5 minutes"
 43 | 
 44 |       # Market Data Alerts
 45 |       - alert: StaleMarketData
 46 |         expr: time() - crypto_trader_market_data_updates_total > 300
 47 |         for: 1m
 48 |         labels:
 49 |           severity: critical
 50 |         annotations:
 51 |           summary: "Stale market data for {{ $labels.symbol }}"
 52 |           description: "No market data updates received for {{ $labels.symbol }} in the last 5 minutes"
 53 | 
 54 |       # Risk Management Alerts
 55 |       - alert: HighPortfolioVaR
 56 |         expr: crypto_trader_portfolio_var > 0.1
 57 |         for: 2m
 58 |         labels:
 59 |           severity: critical
 60 |         annotations:
 61 |           summary: "High portfolio VaR detected"
 62 |           description: "Portfolio VaR is above 10% for the last 2 minutes"
 63 | 
 64 |       - alert: ExcessiveDrawdown
 65 |         expr: crypto_trader_profit_loss_usd < -1000
 66 |         for: 1m
 67 |         labels:
 68 |           severity: critical
 69 |         annotations:
 70 |           summary: "Excessive drawdown detected"
 71 |           description: "Portfolio drawdown exceeds $1000"
 72 | 
 73 |       # System Resource Alerts
 74 |       - alert: HighRequestLatency
 75 |         expr: histogram_quantile(0.95, sum(rate(crypto_trader_request_latency_seconds_bucket[5m])) by (le, service)) > 5
 76 |         for: 2m
 77 |         labels:
 78 |           severity: warning
 79 |         annotations:
 80 |           summary: "High request latency in {{ $labels.service }}"
 81 |           description: "95th percentile latency in {{ $labels.service }} is above 5 seconds"
 82 | 
 83 |       # Social Sentiment Alerts
 84 |       - alert: ExtremeSocialSentiment
 85 |         expr: crypto_trader_social_sentiment > 0.9 or crypto_trader_social_sentiment < 0.1
 86 |         for: 10m
 87 |         labels:
 88 |           severity: warning
 89 |         annotations:
 90 |           summary: "Extreme social sentiment for {{ $labels.symbol }}"
 91 |           description: "Social sentiment for {{ $labels.symbol }} is at extreme levels ({{ $value }})"
 92 | 
 93 |       # Redis Connection Alerts
 94 |       - alert: RedisConnectionFailure
 95 |         expr: increase(crypto_trader_errors_total{error_type="redis_connection"}[5m]) > 5
 96 |         for: 1m
 97 |         labels:
 98 |           severity: critical
 99 |         annotations:
100 |           summary: "Redis connection failures in {{ $labels.service }}"
101 |           description: "Multiple Redis connection failures detected in {{ $labels.service }}"
102 | 
103 |       # Price Movement Alerts
104 |       - alert: ExtremeVolatility
105 |         expr: abs(crypto_trader_price_change_percent) > 10
106 |         for: 1m
107 |         labels:
108 |           severity: warning
109 |         annotations:
110 |           summary: "Extreme price volatility for {{ $labels.symbol }}"
111 |           description: "{{ $labels.symbol }} price changed by {{ $value }}% in {{ $labels.timeframe }}"
112 | 
113 |   - name: crypto-trader-system-alerts
114 |     rules:
115 |       # Memory and CPU alerts would go here if we had node_exporter metrics
116 |       - alert: HighMemoryUsage
117 |         expr: (1 - (node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes)) > 0.9
118 |         for: 5m
119 |         labels:
120 |           severity: warning
121 |         annotations:
122 |           summary: "High memory usage on {{ $labels.instance }}"
123 |           description: "Memory usage is above 90% on {{ $labels.instance }}"
124 | 
125 |       - alert: HighCPUUsage
126 |         expr: 100 - (avg by(instance) (irate(node_cpu_seconds_total{mode="idle"}[5m])) * 100) > 80
127 |         for: 5m
128 |         labels:
129 |           severity: warning
130 |         annotations:
131 |           summary: "High CPU usage on {{ $labels.instance }}"
132 |           description: "CPU usage is above 80% on {{ $labels.instance }}"
133 | 
134 |       - alert: DiskSpaceLow
135 |         expr: (node_filesystem_avail_bytes{mountpoint="/"} / node_filesystem_size_bytes{mountpoint="/"}) * 100 < 10
136 |         for: 5m
137 |         labels:
138 |           severity: critical
139 |         annotations:
140 |           summary: "Low disk space on {{ $labels.instance }}"
141 |           description: "Disk space is below 10% on {{ $labels.instance }}"
142 | 


--------------------------------------------------------------------------------
/trading_strategy.md:
--------------------------------------------------------------------------------
  1 | # Crypto Trading Strategy Implementation
  2 | 
  3 | ## Core Components
  4 | 
  5 | ### 1. Market Data Analysis
  6 | - Real-time price monitoring via Binance WebSocket
  7 | - Technical indicators calculation:
  8 |   - RSI (1m, 3m, 5m timeframes)
  9 |   - MACD (1m, 3m, 5m timeframes)
 10 |   - Stochastic K
 11 |   - Williams %R
 12 |   - Bollinger Bands
 13 | - Price change tracking (1m, 3m, 5m, 15m intervals)
 14 | - Volume analysis with minimum USDC threshold
 15 | 
 16 | ### 2. Social Metrics Integration
 17 | - LunarCrush API data collection:
 18 |   - Social volume tracking
 19 |   - Social engagement metrics
 20 |   - Social sentiment analysis
 21 |   - Social contributors count
 22 | - Recent news sentiment analysis
 23 | - Social metrics caching with 5-minute updates
 24 | - Fallback mechanisms for API disruptions
 25 | 
 26 | ### 3. AI Analysis System
 27 | - OpenAI GPT-4 powered analysis
 28 | - Combined analysis of:
 29 |   - Technical indicators
 30 |   - Price action
 31 |   - Social sentiment
 32 |   - Market context
 33 | - Risk level assessment
 34 | - Confidence scoring
 35 | - Trading decision generation
 36 | 
 37 | ## Trading Rules
 38 | 
 39 | ### 1. Entry Conditions
 40 | Technical Requirements:
 41 | - Minimum 24h volume: $50,000 USDC
 42 | - Price change threshold: 0.5%
 43 | - RSI between 30-70
 44 | - Positive MACD momentum
 45 | - Favorable Bollinger Band position
 46 | 
 47 | Social Requirements:
 48 | - Minimum social engagement: 1,000
 49 | - Positive social sentiment (>0.5)
 50 | - Active social contributors
 51 | - No significant negative news
 52 | 
 53 | ### 2. Position Sizing
 54 | - Base size: 40% of available capital
 55 | - Adjustments based on:
 56 |   - AI confidence score
 57 |   - Social sentiment strength
 58 |   - Technical indicator alignment
 59 |   - Market volatility
 60 | - Maximum position: 5 concurrent trades
 61 | 
 62 | ### 3. Risk Management
 63 | - Stop Loss: 2.0% from entry
 64 | - Take Profit: 4.0% from entry
 65 | - Maximum daily drawdown: 6%
 66 | - Position correlation limits: 0.7
 67 | - Minimum trade amount: $40
 68 | 
 69 | ## Implementation Flow
 70 | 
 71 | ### 1. Market Monitoring
 72 | ```python
 73 | class MarketMonitorService:
 74 |     # Continuous market data collection
 75 |     async def process_market_data(self, msg):
 76 |         # Process incoming market data
 77 |         # Calculate technical indicators
 78 |         # Queue updates for analysis
 79 | ```
 80 | 
 81 | ### 2. Social Analysis
 82 | ```python
 83 | class SocialMonitorService:
 84 |     # Social metrics collection and analysis
 85 |     async def fetch_social_metrics(self, symbol):
 86 |         # Fetch LunarCrush data
 87 |         # Calculate sentiment metrics
 88 |         # Cache and distribute updates
 89 | ```
 90 | 
 91 | ### 3. AI Analysis
 92 | ```python
 93 | class AIAnalyzerService:
 94 |     # Combined market and social analysis
 95 |     async def analyze_market_data(self, market_update):
 96 |         # Combine market and social data
 97 |         # Generate AI analysis
 98 |         # Produce trading signals
 99 | ```
100 | 
101 | ### 4. Trade Execution
102 | ```python
103 | class AITrader:
104 |     # Trading decision implementation
105 |     async def analyze_trade_opportunity(self, market_data):
106 |         # Analyze combined data
107 |         # Generate trading decisions
108 |         # Implement risk management
109 | ```
110 | 
111 | ## Performance Metrics
112 | 
113 | ### 1. Trading Metrics
114 | - Win rate target: >52%
115 | - Profit factor: >1.2
116 | - Sharpe ratio: >1.2
117 | - Maximum drawdown: <15%
118 | - Risk-reward ratio: 2:1
119 | 
120 | ### 2. Technical Metrics
121 | - Analysis interval: 60 seconds
122 | - Update latency: <100ms
123 | - Cache duration: 300 seconds
124 | - API rate limits:
125 |   - LunarCrush: 300s cache
126 |   - Binance: Real-time WebSocket
127 | 
128 | ### 3. Social Impact Metrics
129 | - Sentiment accuracy: >65%
130 | - Social correlation: >0.3
131 | - Engagement threshold: 1,000
132 | - News age limit: 3,600s
133 | 
134 | ## Risk Controls
135 | 
136 | ### 1. System Safeguards
137 | - Automatic failover for API disruptions
138 | - Default values for missing social data
139 | - Redis-based data persistence
140 | - Health check monitoring
141 | 
142 | ### 2. Trading Safeguards
143 | - Maximum position limits
144 | - Correlation-based exposure limits
145 | - Volatility-based position sizing
146 | - Multi-timeframe confirmation
147 | 
148 | ### 3. Market Conditions
149 | - Minimum liquidity requirements
150 | - Volatility thresholds
151 | - Social sentiment minimums
152 | - News sentiment validation
153 | 
154 | ## Monitoring and Evolution
155 | 
156 | ### 1. Performance Monitoring
157 | - Real-time trade tracking
158 | - Social metrics impact analysis
159 | - Strategy performance metrics
160 | - Risk parameter optimization
161 | 
162 | ### 2. Strategy Evolution
163 | - AI-driven strategy improvements
164 | - Social sentiment adaptation
165 | - Risk parameter optimization
166 | - Performance-based adjustments
167 | 
168 | ## Implementation Notes
169 | 
170 | ### 1. Configuration
171 | ```json
172 | {
173 |     "trading_params": {
174 |         "min_volume_usdc": 50000,
175 |         "min_price_change_pct": 0.5,
176 |         "position_size": 0.4,
177 |         "max_positions": 5,
178 |         "stop_loss_pct": 2.0,
179 |         "take_profit_pct": 4.0
180 |     }
181 | }
182 | ```
183 | 
184 | ### 2. Environment Setup
185 | ```bash
186 | # Required API keys
187 | BINANCE_API_KEY=your_key
188 | BINANCE_API_SECRET=your_secret
189 | OPENAI_API_KEY=your_key
190 | LUNARCRUSH_API_KEY=your_key
191 | ```
192 | 
193 | ### 3. Service Ports
194 | ```bash
195 | MARKET_MONITOR_PORT=8001
196 | TRADE_EXECUTOR_PORT=8002
197 | AI_ANALYZER_PORT=8003
198 | SOCIAL_MONITOR_PORT=8004
199 | ```
200 | 
201 | ## Critical Considerations
202 | 
203 | 1. Always maintain:
204 |    - API key security
205 |    - Data validation
206 |    - Error handling
207 |    - Failover mechanisms
208 | 
209 | 2. Regular monitoring of:
210 |    - Strategy performance
211 |    - Social metric accuracy
212 |    - System resource usage
213 |    - API rate limits
214 | 
215 | 3. Continuous improvement:
216 |    - Strategy optimization
217 |    - Risk parameter tuning
218 |    - Social metrics integration
219 |    - AI model enhancement
220 | 


--------------------------------------------------------------------------------
/services/utils/circuit_breaker_monitor.py:
--------------------------------------------------------------------------------
  1 | """
  2 | Circuit Breaker Monitoring Service
  3 | Provides real-time visibility into circuit breaker states and statistics
  4 | """
  5 | import json
  6 | import asyncio
  7 | from aiohttp import web
  8 | from services.utils.circuit_breaker import get_all_circuit_breakers
  9 | from services.utils.metrics import get_metrics, is_metrics_enabled
 10 | import logging
 11 | 
 12 | logger = logging.getLogger(__name__)
 13 | 
 14 | class CircuitBreakerMonitor:
 15 |     """Monitor and expose circuit breaker statistics"""
 16 |     
 17 |     def __init__(self, port: int = 9091):
 18 |         self.port = port
 19 |         self.app = web.Application()
 20 |         self.setup_routes()
 21 |         
 22 |         # Initialize metrics if enabled
 23 |         self.metrics = None
 24 |         if is_metrics_enabled():
 25 |             self.metrics = get_metrics('circuit_breaker_monitor', port)
 26 |     
 27 |     def setup_routes(self):
 28 |         """Setup HTTP routes for monitoring"""
 29 |         self.app.router.add_get('/circuit-breakers', self.get_all_circuit_breakers)
 30 |         self.app.router.add_get('/circuit-breakers/{name}', self.get_circuit_breaker)
 31 |         self.app.router.add_post('/circuit-breakers/{name}/reset', self.reset_circuit_breaker)
 32 |         self.app.router.add_get('/health', self.health_check)
 33 |     
 34 |     async def get_all_circuit_breakers(self, request):
 35 |         """Get statistics for all circuit breakers"""
 36 |         try:
 37 |             circuit_breakers = get_all_circuit_breakers()
 38 |             stats = {}
 39 |             
 40 |             for name, cb in circuit_breakers.items():
 41 |                 stats[name] = cb.get_stats()
 42 |                 
 43 |                 # Update metrics if enabled
 44 |                 if self.metrics:
 45 |                     # Circuit breaker state (0=closed, 1=half-open, 2=open)
 46 |                     state_value = {'CLOSED': 0, 'HALF_OPEN': 1, 'OPEN': 2}[cb.state.value]
 47 |                     self.metrics.request_counter.labels(
 48 |                         service='circuit_breaker_monitor',
 49 |                         endpoint='get_all_circuit_breakers',
 50 |                         method='GET'
 51 |                     ).inc()
 52 |             
 53 |             return web.json_response({
 54 |                 'circuit_breakers': stats,
 55 |                 'total_count': len(stats),
 56 |                 'timestamp': asyncio.get_event_loop().time()
 57 |             })
 58 |         except Exception as e:
 59 |             logger.error(f"Error getting circuit breaker stats: {e}")
 60 |             return web.json_response({'error': str(e)}, status=500)
 61 |     
 62 |     async def get_circuit_breaker(self, request):
 63 |         """Get statistics for a specific circuit breaker"""
 64 |         try:
 65 |             name = request.match_info['name']
 66 |             circuit_breakers = get_all_circuit_breakers()
 67 |             
 68 |             if name not in circuit_breakers:
 69 |                 return web.json_response({'error': f'Circuit breaker {name} not found'}, status=404)
 70 |             
 71 |             cb = circuit_breakers[name]
 72 |             stats = cb.get_stats()
 73 |             
 74 |             if self.metrics:
 75 |                 self.metrics.request_counter.labels(
 76 |                     service='circuit_breaker_monitor',
 77 |                     endpoint='get_circuit_breaker',
 78 |                     method='GET'
 79 |                 ).inc()
 80 |             
 81 |             return web.json_response(stats)
 82 |         except Exception as e:
 83 |             logger.error(f"Error getting circuit breaker {name}: {e}")
 84 |             return web.json_response({'error': str(e)}, status=500)
 85 |     
 86 |     async def reset_circuit_breaker(self, request):
 87 |         """Reset a specific circuit breaker"""
 88 |         try:
 89 |             name = request.match_info['name']
 90 |             circuit_breakers = get_all_circuit_breakers()
 91 |             
 92 |             if name not in circuit_breakers:
 93 |                 return web.json_response({'error': f'Circuit breaker {name} not found'}, status=404)
 94 |             
 95 |             cb = circuit_breakers[name]
 96 |             cb.reset()
 97 |             
 98 |             if self.metrics:
 99 |                 self.metrics.request_counter.labels(
100 |                     service='circuit_breaker_monitor',
101 |                     endpoint='reset_circuit_breaker',
102 |                     method='POST'
103 |                 ).inc()
104 |             
105 |             logger.info(f"Circuit breaker {name} has been reset")
106 |             return web.json_response({'message': f'Circuit breaker {name} reset successfully'})
107 |         except Exception as e:
108 |             logger.error(f"Error resetting circuit breaker {name}: {e}")
109 |             return web.json_response({'error': str(e)}, status=500)
110 |     
111 |     async def health_check(self, request):
112 |         """Health check endpoint"""
113 |         return web.json_response({'status': 'healthy'})
114 |     
115 |     async def start(self):
116 |         """Start the monitoring server"""
117 |         try:
118 |             # Start metrics server if enabled
119 |             if self.metrics:
120 |                 await self.metrics.start_server()
121 |             
122 |             runner = web.AppRunner(self.app)
123 |             await runner.setup()
124 |             site = web.TCPSite(runner, '0.0.0.0', self.port)
125 |             await site.start()
126 |             
127 |             logger.info(f"Circuit Breaker Monitor started on port {self.port}")
128 |             logger.info(f"Available endpoints:")
129 |             logger.info(f"  GET  /circuit-breakers - Get all circuit breaker stats")
130 |             logger.info(f"  GET  /circuit-breakers/{{name}} - Get specific circuit breaker stats")
131 |             logger.info(f"  POST /circuit-breakers/{{name}}/reset - Reset circuit breaker")
132 |             logger.info(f"  GET  /health - Health check")
133 |             
134 |         except Exception as e:
135 |             logger.error(f"Failed to start Circuit Breaker Monitor: {e}")
136 |             raise
137 | 
138 | if __name__ == "__main__":
139 |     async def main():
140 |         monitor = CircuitBreakerMonitor()
141 |         await monitor.start()
142 |         
143 |         # Keep running
144 |         try:
145 |             while True:
146 |                 await asyncio.sleep(1)
147 |         except KeyboardInterrupt:
148 |             logger.info("Circuit Breaker Monitor stopped")
149 |     
150 |     asyncio.run(main())
151 | 


--------------------------------------------------------------------------------
/CHANGELOG.md:
--------------------------------------------------------------------------------
  1 | # Changelog
  2 | 
  3 | All notable changes to the AI Crypto Trader project will be documented in this file.
  4 | 
  5 | The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
  6 | and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
  7 | 
  8 | ## [2.0.0] - 2025-01-06 - PRODUCTION READY RELEASE 🚀
  9 | 
 10 | ### Major Features Added
 11 | 
 12 | #### 🎯 **Phase 1A: Complete Observability**
 13 | - **Comprehensive Metrics System** (`services/utils/metrics.py`)
 14 |   - 20+ trading-specific Prometheus metrics
 15 |   - Portfolio value, trade execution, AI confidence tracking
 16 |   - Request latency, error rates, service health monitoring
 17 |   - Auto-discovery and service registration
 18 | 
 19 | - **Enhanced Market Monitor Service**
 20 |   - Full metrics integration tracking all operations
 21 |   - Performance monitoring with request duration tracking
 22 |   - Error classification and detailed monitoring
 23 |   - Health status reporting with price change metrics
 24 | 
 25 | - **Advanced Alerting System** (`monitoring/alert_rules.yml`)
 26 |   - Service health alerts (down services, high error rates)
 27 |   - Trading performance alerts (low volume, execution issues)
 28 |   - AI model health monitoring (confidence thresholds)
 29 |   - Risk management alerts (VaR, drawdown limits)
 30 |   - System resource monitoring (CPU, memory, disk)
 31 | 
 32 | #### 🛡️ **Phase 1B: Reliability & Resilience**
 33 | - **Circuit Breaker System** (`services/utils/circuit_breaker.py`)
 34 |   - Multiple algorithms: Token Bucket, Sliding Window, Fixed Window, Leaky Bucket
 35 |   - Automatic failure detection with configurable thresholds
 36 |   - Smart recovery with half-open state testing
 37 |   - Comprehensive state management and metrics
 38 | 
 39 | - **Protected External Services**
 40 |   - Binance API: Circuit breaker with 3 failure threshold, 30s recovery
 41 |   - Redis Operations: Circuit breaker with 5 failure threshold, 10s recovery
 42 |   - Retry Logic: Exponential backoff with jitter for transient failures
 43 | 
 44 | - **Circuit Breaker Monitoring** (`services/utils/circuit_breaker_monitor.py`)
 45 |   - Real-time visibility into circuit breaker states
 46 |   - API endpoints for monitoring and manual reset
 47 |   - Integration with metrics system
 48 | 
 49 | #### ⚡ **Phase 1C: Performance & Security**
 50 | - **Redis Connection Pooling** (`services/utils/redis_pool.py`)
 51 |   - Advanced pooling with configurable pool sizes (20 max connections)
 52 |   - Redis Cluster support with automatic failover
 53 |   - Health monitoring and connection reuse optimization
 54 |   - Circuit breaker integration for fault tolerance
 55 | 
 56 | - **Intelligent Rate Limiting** (`services/utils/rate_limiter.py`)
 57 |   - Multiple algorithms: Sliding Window, Token Bucket, Fixed Window, Leaky Bucket
 58 |   - Distributed storage with Redis backend
 59 |   - Smart defaults: 10K market data, 1K API, 50 AI requests/min
 60 |   - Per-endpoint and per-user customization
 61 | 
 62 | - **Enterprise API Security** (`services/utils/api_security.py`)
 63 |   - Automatic key rotation (30-day cycle with grace periods)
 64 |   - Multi-level access control (READ_ONLY, TRADING, ADMIN, SYSTEM)
 65 |   - IP whitelisting and key expiration management
 66 |   - Comprehensive audit logging with encryption
 67 | 
 68 | ### Enhanced Monitoring & Alerting
 69 | 
 70 | #### **Prometheus Configuration** (`monitoring/prometheus.yml`)
 71 | - Service discovery for all components
 72 | - Optimized scraping intervals (15s)
 73 | - Integration with alerting rules
 74 | 
 75 | #### **Grafana Dashboards** (`monitoring/grafana/`)
 76 | - System overview with service health indicators
 77 | - Trading performance visualization
 78 | - AI model confidence tracking
 79 | - Social sentiment impact analysis
 80 | 
 81 | ### Updated Dependencies
 82 | - Added security packages: PyJWT, cryptography
 83 | - Enhanced Redis support with hiredis
 84 | - Updated monitoring stack components
 85 | 
 86 | ### Documentation Updates
 87 | 
 88 | #### **Production Readiness Guide** (`PRODUCTION_READINESS.md`)
 89 | - Complete setup and configuration guide
 90 | - Monitoring and alerting best practices
 91 | - Security configuration recommendations
 92 | - Performance optimization guidelines
 93 | 
 94 | #### **Development Backlog** (`BACKLOG.md`)
 95 | - Updated completion status for all Phase 1 items
 96 | - Clear roadmap for Phase 2 and beyond
 97 | - Priority classification and timeline estimates
 98 | 
 99 | ### Performance Improvements
100 | - **Redis Optimization**: Connection pooling reduces latency by ~60%
101 | - **Rate Limiting**: Intelligent algorithms prevent system overload
102 | - **Circuit Breakers**: Automatic protection from cascading failures
103 | - **Caching**: Smart data caching strategies for social metrics
104 | 
105 | ### Security Enhancements
106 | - **API Key Management**: Enterprise-grade security with automatic rotation
107 | - **Access Control**: Granular permissions with audit trails
108 | - **Rate Limiting**: DDoS protection and fair resource usage
109 | - **Encryption**: Secure storage of sensitive data
110 | 
111 | ### Breaking Changes
112 | - Environment variable `ENABLE_METRICS=true` required for metrics collection
113 | - New Redis configuration options for connection pooling
114 | - API security features require additional environment variables
115 | 
116 | ### Migration Guide
117 | 1. Update `.env` file with new configuration options
118 | 2. Restart services to enable new monitoring features
119 | 3. Access monitoring dashboards at configured ports
120 | 4. Review and customize alerting thresholds
121 | 
122 | ### Monitoring Endpoints
123 | - **Prometheus**: http://localhost:9090
124 | - **Grafana**: http://localhost:3000 (admin/admin)
125 | - **Market Monitor Metrics**: http://localhost:8001/metrics
126 | - **Circuit Breaker Monitor**: http://localhost:9091/circuit-breakers
127 | 
128 | ### Production Readiness Score: 🟢 **ENTERPRISE READY**
129 | 
130 | The system now includes:
131 | - ✅ **Complete Observability**: 20+ metrics, real-time alerts, comprehensive dashboards
132 | - ✅ **Fault Tolerance**: Circuit breakers, retry logic, automatic recovery
133 | - ✅ **High Performance**: Connection pooling, intelligent caching, optimized operations
134 | - ✅ **Enterprise Security**: API key rotation, access controls, audit logging
135 | - ✅ **Scalability**: Rate limiting, distributed coordination, cluster support
136 | 
137 | ---
138 | 
139 | ## [1.5.0] - Previous Release
140 | ### Added
141 | - AI Strategy Evolution with genetic algorithms
142 | - Social metrics integration with LunarCrush
143 | - Risk management with portfolio VaR calculations
144 | - Advanced backtesting framework
145 | - Real-time trading dashboard
146 | 
147 | ---
148 | 
149 | ## [1.0.0] - Initial Release
150 | ### Added
151 | - Basic trading functionality
152 | - Market data monitoring
153 | - Simple dashboard interface
154 | - Docker containerization
155 | - Basic configuration management
156 | 


--------------------------------------------------------------------------------
/services/utils/exchange_interface.py:
--------------------------------------------------------------------------------
  1 | import abc
  2 | from typing import Dict, List, Optional, Union, Any
  3 | import logging
  4 | import os
  5 | from binance.client import Client as BinanceClient
  6 | from binance.exceptions import BinanceAPIException
  7 | 
  8 | logger = logging.getLogger(__name__)
  9 | 
 10 | class ExchangeInterface(abc.ABC):
 11 |     """
 12 |     Abstract base class for exchange interfaces.
 13 |     Defines the common interface for all exchanges.
 14 |     """
 15 |     
 16 |     @abc.abstractmethod
 17 |     def get_ticker(self, symbol: str) -> Dict:
 18 |         """Get current ticker data for a symbol"""
 19 |         pass
 20 |     
 21 |     @abc.abstractmethod
 22 |     def get_order_book(self, symbol: str, limit: int = 100) -> Dict:
 23 |         """Get order book data for a symbol"""
 24 |         pass
 25 |     
 26 |     @abc.abstractmethod
 27 |     def get_symbols(self) -> List[str]:
 28 |         """Get all available trading symbols"""
 29 |         pass
 30 |     
 31 |     @abc.abstractmethod
 32 |     def get_exchange_info(self) -> Dict:
 33 |         """Get exchange information"""
 34 |         pass
 35 |     
 36 |     @abc.abstractmethod
 37 |     def place_order(self, symbol: str, side: str, order_type: str, quantity: float, price: Optional[float] = None) -> Dict:
 38 |         """Place an order on the exchange"""
 39 |         pass
 40 |     
 41 |     @abc.abstractmethod
 42 |     def get_balance(self, asset: str) -> float:
 43 |         """Get balance for a specific asset"""
 44 |         pass
 45 |     
 46 |     @abc.abstractmethod
 47 |     def get_all_balances(self) -> Dict:
 48 |         """Get balances for all assets"""
 49 |         pass
 50 |     
 51 |     @abc.abstractmethod
 52 |     def get_fees(self, symbol: Optional[str] = None) -> Dict:
 53 |         """Get fee information"""
 54 |         pass
 55 |     
 56 |     @abc.abstractmethod
 57 |     def get_ticker_all(self) -> Dict:
 58 |         """Get ticker data for all symbols"""
 59 |         pass
 60 |     
 61 |     @abc.abstractmethod
 62 |     def get_name(self) -> str:
 63 |         """Get the name of the exchange"""
 64 |         pass
 65 | 
 66 | 
 67 | class BinanceExchange(ExchangeInterface):
 68 |     """
 69 |     Binance exchange implementation of the ExchangeInterface.
 70 |     """
 71 |     
 72 |     def __init__(self, api_key: Optional[str] = None, api_secret: Optional[str] = None):
 73 |         """Initialize Binance exchange interface"""
 74 |         self.api_key = api_key or os.environ.get('BINANCE_API_KEY', '')
 75 |         self.api_secret = api_secret or os.environ.get('BINANCE_API_SECRET', '')
 76 |         
 77 |         try:
 78 |             self.client = BinanceClient(self.api_key, self.api_secret)
 79 |             logger.info("Binance client initialized")
 80 |         except Exception as e:
 81 |             logger.error(f"Error initializing Binance client: {str(e)}")
 82 |             raise
 83 |     
 84 |     def get_ticker(self, symbol: str) -> Dict:
 85 |         """Get current ticker data for a symbol"""
 86 |         try:
 87 |             ticker = self.client.get_symbol_ticker(symbol=symbol)
 88 |             return {
 89 |                 'symbol': ticker['symbol'],
 90 |                 'price': float(ticker['price'])
 91 |             }
 92 |         except BinanceAPIException as e:
 93 |             logger.error(f"Error getting ticker for {symbol}: {str(e)}")
 94 |             raise
 95 |     
 96 |     def get_order_book(self, symbol: str, limit: int = 100) -> Dict:
 97 |         """Get order book data for a symbol"""
 98 |         try:
 99 |             order_book = self.client.get_order_book(symbol=symbol, limit=limit)
100 |             return {
101 |                 'symbol': symbol,
102 |                 'bids': [[float(price), float(qty)] for price, qty in order_book['bids']],
103 |                 'asks': [[float(price), float(qty)] for price, qty in order_book['asks']],
104 |                 'timestamp': order_book['lastUpdateId']
105 |             }
106 |         except BinanceAPIException as e:
107 |             logger.error(f"Error getting order book for {symbol}: {str(e)}")
108 |             raise
109 |     
110 |     def get_symbols(self) -> List[str]:
111 |         """Get all available trading symbols"""
112 |         try:
113 |             exchange_info = self.client.get_exchange_info()
114 |             return [s['symbol'] for s in exchange_info['symbols'] if s['status'] == 'TRADING']
115 |         except BinanceAPIException as e:
116 |             logger.error(f"Error getting symbols: {str(e)}")
117 |             raise
118 |     
119 |     def get_exchange_info(self) -> Dict:
120 |         """Get exchange information"""
121 |         try:
122 |             return self.client.get_exchange_info()
123 |         except BinanceAPIException as e:
124 |             logger.error(f"Error getting exchange info: {str(e)}")
125 |             raise
126 |     
127 |     def place_order(self, symbol: str, side: str, order_type: str, quantity: float, price: Optional[float] = None) -> Dict:
128 |         """Place an order on the exchange"""
129 |         try:
130 |             params = {
131 |                 'symbol': symbol,
132 |                 'side': side,
133 |                 'type': order_type,
134 |                 'quantity': quantity
135 |             }
136 |             
137 |             if price is not None and order_type != 'MARKET':
138 |                 params['price'] = price
139 |                 params['timeInForce'] = 'GTC'
140 |             
141 |             order = self.client.create_order(**params)
142 |             return order
143 |         except BinanceAPIException as e:
144 |             logger.error(f"Error placing order for {symbol}: {str(e)}")
145 |             raise
146 |     
147 |     def get_balance(self, asset: str) -> float:
148 |         """Get balance for a specific asset"""
149 |         try:
150 |             account = self.client.get_account()
151 |             for balance in account['balances']:
152 |                 if balance['asset'] == asset:
153 |                     return float(balance['free'])
154 |             return 0.0
155 |         except BinanceAPIException as e:
156 |             logger.error(f"Error getting balance for {asset}: {str(e)}")
157 |             raise
158 |     
159 |     def get_all_balances(self) -> Dict:
160 |         """Get balances for all assets"""
161 |         try:
162 |             account = self.client.get_account()
163 |             balances = {}
164 |             for balance in account['balances']:
165 |                 free = float(balance['free'])
166 |                 locked = float(balance['locked'])
167 |                 total = free + locked
168 |                 if total > 0:  # Only include non-zero balances
169 |                     balances[balance['asset']] = {
170 |                         'free': free,
171 |                         'locked': locked,
172 |                         'total': total
173 |                     }
174 |             return balances
175 |         except BinanceAPIException as e:
176 |             logger.error(f"Error getting all balances: {str(e)}")
177 |             raise
178 |     
179 |     def get_fees(self, symbol: Optional[str] = None) -> Dict:
180 |         """Get fee information"""
181 |         try:
182 |             if symbol:
183 |                 fees = self.client.get_trade_fee(symbol=symbol)
184 |             else:
185 |                 fees = self.client.get_trade_fee()
186 |             return fees
187 |         except BinanceAPIException as e:
188 |             logger.error(f"Error getting fees: {str(e)}")
189 |             # If not available through API, return default values
190 |             return {
191 |                 'maker': 0.001,  # 0.1%
192 |                 'taker': 0.001   # 0.1%
193 |             }
194 |     
195 |     def get_ticker_all(self) -> Dict:
196 |         """Get ticker data for all symbols"""
197 |         try:
198 |             tickers = self.client.get_all_tickers()
199 |             return {ticker['symbol']: float(ticker['price']) for ticker in tickers}
200 |         except BinanceAPIException as e:
201 |             logger.error(f"Error getting all tickers: {str(e)}")
202 |             raise
203 |     
204 |     def get_name(self) -> str:
205 |         """Get the name of the exchange"""
206 |         return "Binance"
207 | 
208 | 
209 | class ExchangeFactory:
210 |     """
211 |     Factory class for creating exchange interfaces.
212 |     """
213 |     
214 |     @staticmethod
215 |     def create_exchange(exchange_name: str, api_key: Optional[str] = None, api_secret: Optional[str] = None) -> ExchangeInterface:
216 |         """Create an exchange interface instance"""
217 |         if exchange_name.lower() == 'binance':
218 |             return BinanceExchange(api_key, api_secret)
219 |         else:
220 |             raise ValueError(f"Unsupported exchange: {exchange_name}")


--------------------------------------------------------------------------------
/run_backtest.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python3
  2 | import os
  3 | import sys
  4 | import json
  5 | import argparse
  6 | import asyncio
  7 | import logging as logger
  8 | from datetime import datetime, timedelta
  9 | from typing import List, Dict, Any
 10 | 
 11 | from backtesting import BacktestEngine, ResultAnalyzer
 12 | from backtesting.data_manager import HistoricalDataManager
 13 | 
 14 | # Configure logging
 15 | logger.basicConfig(
 16 |     level=logger.INFO,
 17 |     format='%(asctime)s - %(levelname)s - %(message)s',
 18 |     handlers=[
 19 |         logger.FileHandler(f'logs/backtest_{datetime.now().strftime("%Y%m%d_%H%M%S")}.log'),
 20 |         logger.StreamHandler(sys.stdout)
 21 |     ]
 22 | )
 23 | 
 24 | def setup_parser() -> argparse.ArgumentParser:
 25 |     """Set up command line argument parser"""
 26 |     parser = argparse.ArgumentParser(description='Crypto Trading Backtesting CLI')
 27 |     
 28 |     # Create subparsers for different commands
 29 |     subparsers = parser.add_subparsers(dest='command', help='Command to run')
 30 |     
 31 |     # Fetch data command
 32 |     fetch_parser = subparsers.add_parser('fetch', help='Fetch historical data')
 33 |     fetch_parser.add_argument('--symbols', type=str, nargs='+', required=True, help='Symbol(s) to fetch data for (e.g. BTCUSDC)')
 34 |     fetch_parser.add_argument('--intervals', type=str, nargs='+', default=['1h'], help='Timeframe interval(s) (e.g. 1m, 5m, 15m, 1h, 4h, 1d)')
 35 |     fetch_parser.add_argument('--days', type=int, default=30, help='Number of days to fetch')
 36 |     fetch_parser.add_argument('--no-social', action='store_true', help='Skip fetching social data')
 37 |     
 38 |     # Run backtest command
 39 |     backtest_parser = subparsers.add_parser('backtest', help='Run a backtest')
 40 |     backtest_parser.add_argument('--symbols', type=str, nargs='+', required=True, help='Symbol(s) to backtest (e.g. BTCUSDC)')
 41 |     backtest_parser.add_argument('--intervals', type=str, nargs='+', default=['1h'], help='Timeframe interval(s) (e.g. 1m, 5m, 15m, 1h, 4h, 1d)')
 42 |     backtest_parser.add_argument('--days', type=int, default=30, help='Number of days to backtest')
 43 |     backtest_parser.add_argument('--balance', type=float, default=10000.0, help='Initial balance for backtest')
 44 |     backtest_parser.add_argument('--start-date', type=str, help='Start date (YYYY-MM-DD) (overrides --days)')
 45 |     backtest_parser.add_argument('--end-date', type=str, help='End date (YYYY-MM-DD) (defaults to today)')
 46 |     
 47 |     # List data command
 48 |     list_parser = subparsers.add_parser('list', help='List available data')
 49 |     list_parser.add_argument('--symbols', type=str, nargs='+', help='Filter by symbol(s)')
 50 |     list_parser.add_argument('--intervals', type=str, nargs='+', help='Filter by interval(s)')
 51 |     
 52 |     # Analyze results command
 53 |     analyze_parser = subparsers.add_parser('analyze', help='Analyze backtest results')
 54 |     analyze_parser.add_argument('--results', type=str, nargs='+', help='Result file(s) to analyze')
 55 |     analyze_parser.add_argument('--symbols', type=str, nargs='+', help='Filter results by symbol(s)')
 56 |     analyze_parser.add_argument('--intervals', type=str, nargs='+', help='Filter results by interval(s)')
 57 |     analyze_parser.add_argument('--metric', type=str, default='return_pct', help='Metric to compare (return_pct, win_rate, sharpe_ratio, etc.)')
 58 |     
 59 |     return parser
 60 | 
 61 | async def fetch_data(args: argparse.Namespace) -> Dict:
 62 |     """Fetch historical data for the specified symbols and intervals"""
 63 |     logger.info(f"Fetching data for {args.symbols} ({', '.join(args.intervals)}) for the past {args.days} days")
 64 |     
 65 |     # Initialize components
 66 |     data_manager = HistoricalDataManager()
 67 |     backtest_engine = BacktestEngine()
 68 |     
 69 |     # Calculate dates
 70 |     end_date = datetime.now()
 71 |     start_date = end_date - timedelta(days=args.days)
 72 |     
 73 |     # Fetch data for each symbol and interval
 74 |     results = {}
 75 |     for symbol in args.symbols:
 76 |         symbol_result = await backtest_engine.fetch_data_for_backtest(
 77 |             symbol, args.intervals, start_date, end_date, not args.no_social
 78 |         )
 79 |         results[symbol] = symbol_result
 80 |     
 81 |     return results
 82 | 
 83 | async def run_backtest(args: argparse.Namespace) -> Dict:
 84 |     """Run backtests for the specified symbols and intervals"""
 85 |     # Parse dates
 86 |     if args.start_date:
 87 |         start_date = datetime.strptime(args.start_date, '%Y-%m-%d')
 88 |     else:
 89 |         start_date = datetime.now() - timedelta(days=args.days)
 90 |         
 91 |     if args.end_date:
 92 |         end_date = datetime.strptime(args.end_date, '%Y-%m-%d')
 93 |     else:
 94 |         end_date = datetime.now()
 95 |     
 96 |     logger.info(f"Running backtest for {args.symbols} ({', '.join(args.intervals)}) "
 97 |                f"from {start_date.strftime('%Y-%m-%d')} to {end_date.strftime('%Y-%m-%d')} "
 98 |                f"with initial balance ${args.balance}")
 99 |     
100 |     # Initialize backtesting engine
101 |     backtest_engine = BacktestEngine()
102 |     
103 |     # Run backtests
104 |     results = await backtest_engine.run_multiple_backtests(
105 |         args.symbols, args.intervals, start_date, end_date, args.balance
106 |     )
107 |     
108 |     return results
109 | 
110 | def list_data(args: argparse.Namespace) -> Dict:
111 |     """List available historical data"""
112 |     logger.info("Listing available historical data")
113 |     
114 |     # Initialize data manager
115 |     data_manager = HistoricalDataManager()
116 |     
117 |     # Get available data
118 |     available_data = data_manager.available_symbols()
119 |     
120 |     # Filter by symbols if specified
121 |     if args.symbols:
122 |         available_data = [symbol for symbol in available_data if symbol in args.symbols]
123 |     
124 |     # Get detailed data for each symbol
125 |     result = {}
126 |     for symbol in available_data:
127 |         intervals = data_manager.available_intervals(symbol)
128 |         
129 |         # Filter by intervals if specified
130 |         if args.intervals:
131 |             intervals = [interval for interval in intervals if interval in args.intervals]
132 |         
133 |         symbol_data = {'intervals': {}}
134 |         for interval in intervals:
135 |             start_date, end_date = data_manager.get_data_range(symbol, interval)
136 |             if start_date and end_date:
137 |                 symbol_data['intervals'][interval] = {
138 |                     'start_date': start_date.strftime('%Y-%m-%d'),
139 |                     'end_date': end_date.strftime('%Y-%m-%d'),
140 |                     'days': (end_date - start_date).days
141 |                 }
142 |         
143 |         result[symbol] = symbol_data
144 |     
145 |     return result
146 | 
147 | def analyze_results(args: argparse.Namespace) -> Dict:
148 |     """Analyze backtest results"""
149 |     logger.info("Analyzing backtest results")
150 |     
151 |     # Initialize result analyzer
152 |     result_analyzer = ResultAnalyzer()
153 |     
154 |     # Get all available results if not specified
155 |     if args.results:
156 |         # Load specific result files
157 |         results = []
158 |         for result_path in args.results:
159 |             result = result_analyzer.load_results(result_path)
160 |             if result:
161 |                 results.append(result)
162 |     else:
163 |         # Filter available results
164 |         results = result_analyzer.filter_results(
165 |             symbol=args.symbols[0] if args.symbols and len(args.symbols) == 1 else None,
166 |             interval=args.intervals[0] if args.intervals and len(args.intervals) == 1 else None
167 |         )
168 |     
169 |     # If no results found
170 |     if not results:
171 |         logger.error("No results found matching the criteria")
172 |         return {'error': 'No results found'}
173 |     
174 |     # Generate summary report
175 |     summary = result_analyzer.generate_summary_report(results)
176 |     summary_path = result_analyzer.save_summary_report(summary)
177 |     
178 |     # Generate comparison chart
179 |     comparison_path = result_analyzer.compare_results(results, args.metric)
180 |     
181 |     # Add paths to summary
182 |     summary['summary_path'] = summary_path
183 |     if comparison_path:
184 |         summary['comparison_chart'] = comparison_path
185 |     
186 |     return summary
187 | 
188 | def print_json_result(result: Dict):
189 |     """Print result as formatted JSON"""
190 |     print(json.dumps(result, indent=2))
191 | 
192 | async def main():
193 |     """Main entry point"""
194 |     parser = setup_parser()
195 |     args = parser.parse_args()
196 |     
197 |     if not args.command:
198 |         parser.print_help()
199 |         sys.exit(1)
200 |     
201 |     try:
202 |         # Execute the selected command
203 |         if args.command == 'fetch':
204 |             result = await fetch_data(args)
205 |             print_json_result(result)
206 |             
207 |         elif args.command == 'backtest':
208 |             result = await run_backtest(args)
209 |             print_json_result(result)
210 |             
211 |         elif args.command == 'list':
212 |             result = list_data(args)
213 |             print_json_result(result)
214 |             
215 |         elif args.command == 'analyze':
216 |             result = analyze_results(args)
217 |             print_json_result(result)
218 |         
219 |     except Exception as e:
220 |         logger.error(f"Error executing command: {str(e)}")
221 |         sys.exit(1)
222 | 
223 | if __name__ == "__main__":
224 |     # Create logs directory if it doesn't exist
225 |     os.makedirs('logs', exist_ok=True)
226 |     
227 |     # Run the main function
228 |     asyncio.run(main())


--------------------------------------------------------------------------------
/PRODUCTION_READINESS.md:
--------------------------------------------------------------------------------
  1 | # Production Readiness Implementation
  2 | 
  3 | ## Overview
  4 | 
  5 | This document outlines the production readiness features implemented for the AI Crypto Trader system, focusing on observability, monitoring, and reliability improvements.
  6 | 
  7 | ## 🎯 What We've Implemented
  8 | 
  9 | ### 1. Comprehensive Metrics System
 10 | 
 11 | **Location**: `services/utils/metrics.py`
 12 | 
 13 | **Features**:
 14 | - **Prometheus Integration**: Full Prometheus metrics collection
 15 | - **Trading-Specific Metrics**: Portfolio value, trade execution, AI confidence, social sentiment
 16 | - **System Metrics**: Request latency, error rates, service health
 17 | - **Auto-Discovery**: Automatic service registration and metrics exposure
 18 | 
 19 | **Key Metrics**:
 20 | ```
 21 | crypto_trader_service_health           # Service up/down status
 22 | crypto_trader_portfolio_value_usd      # Real-time portfolio value
 23 | crypto_trader_trades_executed_total    # Trading activity
 24 | crypto_trader_ai_model_confidence      # AI decision confidence
 25 | crypto_trader_social_sentiment         # Social sentiment scores
 26 | crypto_trader_request_latency_seconds  # API response times
 27 | crypto_trader_errors_total             # Error tracking
 28 | ```
 29 | 
 30 | ### 2. Enhanced Market Monitor Service
 31 | 
 32 | **Location**: `services/market_monitor_service.py`
 33 | 
 34 | **Improvements**:
 35 | - ✅ **Metrics Integration**: Comprehensive tracking of all operations
 36 | - ✅ **Error Monitoring**: Detailed error classification and counting
 37 | - ✅ **Performance Tracking**: Request duration and throughput monitoring
 38 | - ✅ **Health Checks**: Service health status reporting
 39 | - ✅ **Price Change Tracking**: Real-time price movement metrics
 40 | 
 41 | ### 3. Advanced Alerting System
 42 | 
 43 | **Location**: `monitoring/alert_rules.yml`
 44 | 
 45 | **Alert Categories**:
 46 | - **Service Health**: Immediate notification when services go down
 47 | - **Trading Performance**: Alerts for low volume, high error rates
 48 | - **AI Model Health**: Confidence threshold monitoring
 49 | - **Market Data**: Stale data detection
 50 | - **Risk Management**: Portfolio VaR and drawdown alerts
 51 | - **System Resources**: CPU, memory, disk space monitoring
 52 | 
 53 | ### 4. Enhanced Monitoring Configuration
 54 | 
 55 | **Location**: `monitoring/prometheus.yml`
 56 | 
 57 | **Improvements**:
 58 | - ✅ **Service Discovery**: Automatic metric scraping from all services
 59 | - ✅ **Rule Files**: Integration with alerting rules
 60 | - ✅ **Optimized Intervals**: Balanced scraping frequency
 61 | 
 62 | ## 🚀 Quick Start
 63 | 
 64 | ### Enable Metrics Collection
 65 | 
 66 | Set the environment variable in your `.env` file:
 67 | ```bash
 68 | ENABLE_METRICS=true
 69 | ```
 70 | 
 71 | ### Start the System
 72 | 
 73 | ```bash
 74 | # Start all services with monitoring
 75 | docker-compose up -d
 76 | 
 77 | # Verify metrics are being collected
 78 | curl http://localhost:8001/metrics  # Market Monitor metrics
 79 | curl http://localhost:9090/targets  # Prometheus targets
 80 | ```
 81 | 
 82 | ### Access Monitoring Dashboards
 83 | 
 84 | - **Prometheus**: http://localhost:9090
 85 | - **Grafana**: http://localhost:3000 (admin/admin)
 86 | - **Kibana**: http://localhost:5601
 87 | 
 88 | ## 📊 Available Dashboards
 89 | 
 90 | ### 1. System Overview Dashboard
 91 | **Location**: `monitoring/grafana/provisioning/dashboards/system_overview.json`
 92 | 
 93 | **Panels**:
 94 | - Request rates by service
 95 | - Error rates and types
 96 | - Request latency percentiles
 97 | - Trading signal generation
 98 | - AI model confidence
 99 | - Portfolio performance
100 | - Social sentiment tracking
101 | 
102 | ### 2. Trading Performance Dashboard
103 | - Real-time portfolio value
104 | - Trade execution rates
105 | - Win/loss ratios
106 | - Strategy performance comparison
107 | - Risk metrics (VaR, drawdown)
108 | 
109 | ### 3. AI Model Monitoring Dashboard
110 | - Model confidence trends
111 | - Request duration by model
112 | - Feature importance tracking
113 | - Prediction accuracy
114 | 
115 | ## 🔔 Alert Notifications
116 | 
117 | ### Critical Alerts (Immediate Action Required)
118 | - **Service Down**: Any service becomes unavailable
119 | - **High Error Rate**: Error rate exceeds 1/minute
120 | - **Portfolio Risk**: VaR exceeds 10% or drawdown > $1000
121 | - **Redis Connection Failures**: Multiple Redis connection issues
122 | 
123 | ### Warning Alerts (Monitoring Required)
124 | - **Low AI Confidence**: Model confidence below 50%
125 | - **Extreme Social Sentiment**: Sentiment at extreme levels
126 | - **High Request Latency**: 95th percentile above 5 seconds
127 | - **System Resources**: High CPU/memory/disk usage
128 | 
129 | ## 📈 Key Performance Indicators (KPIs)
130 | 
131 | ### Trading Performance
132 | ```
133 | - Portfolio Value: crypto_trader_portfolio_value_usd
134 | - Daily Return: rate(crypto_trader_profit_loss_usd[1d])
135 | - Trade Success Rate: crypto_trader_win_rate
136 | - Trading Volume: rate(crypto_trader_trades_executed_total[1h])
137 | ```
138 | 
139 | ### System Health
140 | ```
141 | - Service Uptime: crypto_trader_service_health
142 | - Error Rate: rate(crypto_trader_errors_total[5m])
143 | - Response Time: crypto_trader_request_latency_seconds
144 | - Data Freshness: crypto_trader_market_data_updates_total
145 | ```
146 | 
147 | ### AI Performance
148 | ```
149 | - Model Confidence: avg(crypto_trader_ai_model_confidence)
150 | - AI Request Rate: rate(crypto_trader_ai_requests_total[5m])
151 | - Social Sentiment Accuracy: crypto_trader_social_sentiment
152 | ```
153 | 
154 | ## 🛠 Integration with Other Services
155 | 
156 | ### Adding Metrics to New Services
157 | 
158 | 1. **Import the metrics utility**:
159 | ```python
160 | from services.utils.metrics import get_metrics, is_metrics_enabled
161 | ```
162 | 
163 | 2. **Initialize metrics in your service**:
164 | ```python
165 | def __init__(self):
166 |     self.metrics = None
167 |     if is_metrics_enabled():
168 |         self.metrics = get_metrics('your_service_name', port)
169 | ```
170 | 
171 | 3. **Start the metrics server**:
172 | ```python
173 | async def run(self):
174 |     if self.metrics:
175 |         await self.metrics.start_server()
176 | ```
177 | 
178 | 4. **Record metrics in your operations**:
179 | ```python
180 | if self.metrics:
181 |     self.metrics.record_trading_signal(symbol, action, strategy)
182 |     self.metrics.update_portfolio_value(value)
183 |     self.metrics.record_ai_request(model, duration)
184 | ```
185 | 
186 | ### Example Integration
187 | 
188 | ```python
189 | class MyTradingService:
190 |     def __init__(self):
191 |         self.metrics = get_metrics('my_service', 8080)
192 |     
193 |     @self.metrics.measure_time('execute_trade', 'POST')
194 |     async def execute_trade(self, symbol, action):
195 |         try:
196 |             # Trading logic here
197 |             if self.metrics:
198 |                 self.metrics.record_trade_execution(symbol, action)
199 |         except Exception as e:
200 |             if self.metrics:
201 |                 self.metrics.error_counter.labels(
202 |                     service='my_service',
203 |                     error_type=type(e).__name__,
204 |                     endpoint='execute_trade'
205 |                 ).inc()
206 |             raise
207 | ```
208 | 
209 | ## 🔧 Configuration Options
210 | 
211 | ### Metrics Configuration
212 | ```python
213 | # Environment variables
214 | ENABLE_METRICS=true          # Enable/disable metrics collection
215 | PROMETHEUS_PORT=9090         # Prometheus server port
216 | METRICS_SCRAPE_INTERVAL=15s  # How often to collect metrics
217 | ```
218 | 
219 | ### Alert Thresholds
220 | Edit `monitoring/alert_rules.yml` to customize:
221 | - Error rate thresholds
222 | - Portfolio risk limits
223 | - Response time limits
224 | - Resource usage thresholds
225 | 
226 | ## 📊 Monitoring Best Practices
227 | 
228 | ### 1. Golden Signals for Trading Systems
229 | - **Latency**: How long does it take to process trades?
230 | - **Traffic**: How many trades per second?
231 | - **Errors**: What percentage of trades fail?
232 | - **Saturation**: How much of our trading capacity are we using?
233 | 
234 | ### 2. Trading-Specific Monitoring
235 | - **Portfolio Health**: Track portfolio value, drawdown, VaR
236 | - **Strategy Performance**: Monitor individual strategy success rates
237 | - **Market Data Quality**: Ensure fresh, accurate market data
238 | - **AI Model Performance**: Track confidence and accuracy
239 | 
240 | ### 3. Alert Fatigue Prevention
241 | - Set appropriate thresholds to avoid noise
242 | - Use different severity levels (critical, warning, info)
243 | - Group related alerts together
244 | - Include actionable information in alert descriptions
245 | 
246 | ## 🚨 Troubleshooting
247 | 
248 | ### Common Issues
249 | 
250 | **Metrics not appearing in Prometheus**:
251 | 1. Check service is running with `ENABLE_METRICS=true`
252 | 2. Verify metrics endpoint: `curl http://service:port/metrics`
253 | 3. Check Prometheus targets page for scraping errors
254 | 
255 | **High memory usage**:
256 | 1. Monitor metric cardinality (too many label combinations)
257 | 2. Consider sampling for high-frequency metrics
258 | 3. Adjust retention policies in Prometheus
259 | 
260 | **Missing alerts**:
261 | 1. Verify alert rules are loaded in Prometheus
262 | 2. Check alert rule syntax with `promtool check rules`
263 | 3. Ensure alertmanager is configured (optional)
264 | 
265 | ## 🎯 Next Steps
266 | 
267 | ### Phase 2 Enhancements (Next Sprint)
268 | 1. **Circuit Breakers**: Implement automatic service protection
269 | 2. **Rate Limiting**: Add intelligent request throttling
270 | 3. **Caching Optimization**: Redis connection pooling and optimization
271 | 4. **Service Mesh**: Consider Istio for advanced traffic management
272 | 
273 | ### Phase 3 Enhancements (Future)
274 | 1. **Distributed Tracing**: Add Jaeger for request tracing
275 | 2. **Chaos Engineering**: Implement fault injection testing
276 | 3. **Auto-scaling**: Dynamic resource scaling based on load
277 | 4. **Multi-region Deployment**: Geographic distribution for resilience
278 | 
279 | ## 📞 Support
280 | 
281 | For questions about the monitoring implementation:
282 | 1. Check the logs in `logs/` directory
283 | 2. Review Prometheus targets: http://localhost:9090/targets
284 | 3. Inspect service metrics endpoints directly
285 | 4. Check Grafana dashboards for visual insights
286 | 
287 | ---
288 | 
289 | **Production Readiness Score**: 🟢 **READY**
290 | 
291 | The system now includes comprehensive monitoring, alerting, and observability features suitable for production deployment.
292 | 


--------------------------------------------------------------------------------
/backtesting/social_data_provider.py:
--------------------------------------------------------------------------------
  1 | import pandas as pd
  2 | import numpy as np
  3 | import logging as logger
  4 | from datetime import datetime, timedelta
  5 | from typing import Dict, Optional, Union
  6 | from pathlib import Path
  7 | 
  8 | from .data_manager import HistoricalDataManager
  9 | 
 10 | class SocialDataProvider:
 11 |     """Provider for social data during backtesting"""
 12 |     
 13 |     def __init__(self, data_manager: HistoricalDataManager = None):
 14 |         """Initialize with optional data manager"""
 15 |         self.data_manager = data_manager or HistoricalDataManager()
 16 |         self.social_data = {}  # Cache for loaded social data
 17 |         self.default_metrics = {
 18 |             'social_volume': 0,
 19 |             'social_engagement': 0,
 20 |             'social_contributors': 0,
 21 |             'social_sentiment': 0.5,  # Neutral sentiment
 22 |             'twitter_volume': 0,
 23 |             'reddit_volume': 0,
 24 |             'news_volume': 0
 25 |         }
 26 |     
 27 |     def load_social_data(self, symbol: str, start_date: datetime, end_date: datetime = None) -> pd.DataFrame:
 28 |         """Load social data for the given symbol and date range"""
 29 |         # Generate cache key
 30 |         cache_key = f"{symbol}_{start_date.strftime('%Y%m%d')}_{end_date.strftime('%Y%m%d') if end_date else 'now'}"
 31 |         
 32 |         # Check if already in cache
 33 |         if cache_key in self.social_data:
 34 |             return self.social_data[cache_key]
 35 |         
 36 |         # Load social data using data manager
 37 |         data = self.data_manager.load_social_data(symbol, start_date, end_date)
 38 |         
 39 |         # Store in cache
 40 |         self.social_data[cache_key] = data
 41 |         
 42 |         return data
 43 |     
 44 |     def get_social_metrics_at(self, symbol: str, timestamp: datetime) -> Dict:
 45 |         """Get social metrics for a specific point in time"""
 46 |         # Check if we have data loaded for this symbol
 47 |         if symbol not in self.social_data:
 48 |             # Try to load data for the past 90 days
 49 |             start_date = timestamp - timedelta(days=90)
 50 |             end_date = timestamp + timedelta(days=1)  # Include the target day
 51 |             self.load_social_data(symbol, start_date, end_date)
 52 |         
 53 |         # If we have data for this symbol, find the closest data point
 54 |         for cache_key, data in self.social_data.items():
 55 |             if symbol in cache_key and not data.empty:
 56 |                 # Get the closest date not exceeding the timestamp
 57 |                 try:
 58 |                     # Find dates that are less than or equal to the timestamp
 59 |                     valid_dates = data.index[data.index <= timestamp]
 60 |                     
 61 |                     if len(valid_dates) > 0:
 62 |                         # Get the most recent date
 63 |                         closest_date = valid_dates[-1]
 64 |                         row = data.loc[closest_date]
 65 |                         
 66 |                         # Extract relevant social metrics
 67 |                         metrics = {}
 68 |                         for metric in self.default_metrics.keys():
 69 |                             if metric in row:
 70 |                                 metrics[metric] = row[metric]
 71 |                             else:
 72 |                                 metrics[metric] = self.default_metrics[metric]
 73 |                         
 74 |                         return metrics
 75 |                 except Exception as e:
 76 |                     logger.error(f"Error getting social metrics for {symbol} at {timestamp}: {str(e)}")
 77 |         
 78 |         # If no data found, return default metrics
 79 |         logger.warning(f"No social data found for {symbol} at {timestamp}, using defaults")
 80 |         return self.default_metrics.copy()
 81 |     
 82 |     def get_news_sentiment(self, symbol: str, timestamp: datetime, lookback_days: int = 7) -> Dict:
 83 |         """Get news sentiment from social data"""
 84 |         # Define default response
 85 |         default_response = {
 86 |             'sentiment': 0.5,  # Neutral sentiment
 87 |             'recent_news': []
 88 |         }
 89 |         
 90 |         try:
 91 |             # Calculate start date for lookback
 92 |             start_date = timestamp - timedelta(days=lookback_days)
 93 |             
 94 |             # Load social data if needed
 95 |             data = self.load_social_data(symbol, start_date, timestamp)
 96 |             
 97 |             if data.empty:
 98 |                 return default_response
 99 |             
100 |             # Extract news sentiment if available
101 |             if 'news_sentiment' in data.columns:
102 |                 # Get the most recent sentiment value
103 |                 recent_indices = data.index[data.index <= timestamp]
104 |                 if len(recent_indices) > 0:
105 |                     latest_idx = recent_indices[-1]
106 |                     sentiment = data.loc[latest_idx, 'news_sentiment']
107 |                     return {
108 |                         'sentiment': sentiment,
109 |                         'recent_news': []  # We don't have the actual news content in historical data
110 |                     }
111 |             
112 |             # If no specific news sentiment column, use general social sentiment
113 |             if 'social_sentiment' in data.columns:
114 |                 recent_indices = data.index[data.index <= timestamp]
115 |                 if len(recent_indices) > 0:
116 |                     latest_idx = recent_indices[-1]
117 |                     sentiment = data.loc[latest_idx, 'social_sentiment']
118 |                     return {
119 |                         'sentiment': sentiment,
120 |                         'recent_news': []
121 |                     }
122 |             
123 |             return default_response
124 |             
125 |         except Exception as e:
126 |             logger.error(f"Error getting news sentiment for {symbol}: {str(e)}")
127 |             return default_response
128 |     
129 |     def get_social_indicators(self, symbol: str, timestamp: datetime, lookback_days: int = 30) -> Dict:
130 |         """Get derived social indicators like momentum, trend, etc."""
131 |         try:
132 |             # Calculate start date for lookback
133 |             start_date = timestamp - timedelta(days=lookback_days)
134 |             
135 |             # Load social data if needed
136 |             data = self.load_social_data(symbol, start_date, timestamp)
137 |             
138 |             if data.empty:
139 |                 return {
140 |                     'social_momentum': 0,
141 |                     'social_trend': 'neutral',
142 |                     'social_intensity': 0,
143 |                     'social_engagement_rate': 0
144 |                 }
145 |             
146 |             # Filter data to timestamp
147 |             data = data[data.index <= timestamp]
148 |             
149 |             if len(data) < 2:
150 |                 return {
151 |                     'social_momentum': 0,
152 |                     'social_trend': 'neutral',
153 |                     'social_intensity': 0,
154 |                     'social_engagement_rate': 0
155 |                 }
156 |             
157 |             # Calculate social momentum (rate of change in volume)
158 |             if 'social_volume' in data.columns:
159 |                 recent_volume = data['social_volume'].iloc[-1]
160 |                 prev_volume = data['social_volume'].iloc[-2]
161 |                 social_momentum = ((recent_volume - prev_volume) / max(prev_volume, 1)) * 100
162 |             else:
163 |                 social_momentum = 0
164 |             
165 |             # Determine social trend
166 |             if social_momentum > 20:
167 |                 social_trend = 'bullish'
168 |             elif social_momentum < -20:
169 |                 social_trend = 'bearish'
170 |             else:
171 |                 social_trend = 'neutral'
172 |             
173 |             # Calculate social intensity (volatility of social metrics)
174 |             if 'social_volume' in data.columns and len(data) > 5:
175 |                 social_intensity = data['social_volume'].pct_change().std() * 100
176 |             else:
177 |                 social_intensity = 0
178 |             
179 |             # Calculate engagement rate
180 |             if 'social_engagement' in data.columns and 'social_volume' in data.columns:
181 |                 social_engagement_rate = data['social_engagement'].iloc[-1] / max(data['social_volume'].iloc[-1], 1)
182 |             else:
183 |                 social_engagement_rate = 0
184 |             
185 |             return {
186 |                 'social_momentum': social_momentum,
187 |                 'social_trend': social_trend,
188 |                 'social_intensity': social_intensity,
189 |                 'social_engagement_rate': social_engagement_rate
190 |             }
191 |             
192 |         except Exception as e:
193 |             logger.error(f"Error calculating social indicators for {symbol}: {str(e)}")
194 |             return {
195 |                 'social_momentum': 0,
196 |                 'social_trend': 'neutral',
197 |                 'social_intensity': 0,
198 |                 'social_engagement_rate': 0
199 |             }
200 |             
201 |     def generate_market_update_with_social(self, market_data: Dict, timestamp: datetime) -> Dict:
202 |         """Enrich market data with social metrics for backtesting"""
203 |         symbol = market_data['symbol']
204 |         
205 |         # Get social metrics
206 |         social_metrics = self.get_social_metrics_at(symbol, timestamp)
207 |         
208 |         # Get news sentiment
209 |         news_sentiment = self.get_news_sentiment(symbol, timestamp)
210 |         
211 |         # Get social indicators
212 |         social_indicators = self.get_social_indicators(symbol, timestamp)
213 |         
214 |         # Merge all the data
215 |         enriched_data = market_data.copy()
216 |         enriched_data.update({
217 |             'social_volume': social_metrics.get('social_volume', 0),
218 |             'social_engagement': social_metrics.get('social_engagement', 0),
219 |             'social_contributors': social_metrics.get('social_contributors', 0),
220 |             'social_sentiment': social_metrics.get('social_sentiment', 0.5),
221 |             'twitter_volume': social_metrics.get('twitter_volume', 0),
222 |             'reddit_volume': social_metrics.get('reddit_volume', 0),
223 |             'news_volume': social_metrics.get('news_volume', 0),
224 |             'news_sentiment': news_sentiment.get('sentiment', 0.5),
225 |             'recent_news': news_sentiment.get('recent_news', []),
226 |             'social_momentum': social_indicators.get('social_momentum', 0),
227 |             'social_trend': social_indicators.get('social_trend', 'neutral'),
228 |             'social_intensity': social_indicators.get('social_intensity', 0),
229 |             'social_engagement_rate': social_indicators.get('social_engagement_rate', 0)
230 |         })
231 |         
232 |         return enriched_data


--------------------------------------------------------------------------------
/services/utils/circuit_breaker.py:
--------------------------------------------------------------------------------
  1 | """
  2 | Circuit Breaker implementation for AI Crypto Trader services
  3 | """
  4 | import asyncio
  5 | import time
  6 | import logging
  7 | from enum import Enum
  8 | from typing import Callable, Any, Optional, Dict
  9 | from functools import wraps
 10 | from dataclasses import dataclass
 11 | 
 12 | logger = logging.getLogger(__name__)
 13 | 
 14 | class CircuitState(Enum):
 15 |     CLOSED = "CLOSED"       # Normal operation
 16 |     OPEN = "OPEN"          # Circuit is open, requests fail fast
 17 |     HALF_OPEN = "HALF_OPEN" # Testing if service is back
 18 | 
 19 | @dataclass
 20 | class CircuitBreakerConfig:
 21 |     failure_threshold: int = 5          # Number of failures to open circuit
 22 |     recovery_timeout: int = 60          # Seconds before trying half-open
 23 |     expected_exception: type = Exception # Exception type that counts as failure
 24 |     success_threshold: int = 3          # Successes needed to close from half-open
 25 |     timeout: float = 30.0               # Request timeout in seconds
 26 | 
 27 | class CircuitBreakerOpenException(Exception):
 28 |     """Raised when circuit breaker is open"""
 29 |     pass
 30 | 
 31 | class CircuitBreaker:
 32 |     """
 33 |     Circuit Breaker implementation for protecting external service calls
 34 |     """
 35 |     
 36 |     def __init__(self, name: str, config: CircuitBreakerConfig = None):
 37 |         self.name = name
 38 |         self.config = config or CircuitBreakerConfig()
 39 |         
 40 |         # State management
 41 |         self.state = CircuitState.CLOSED
 42 |         self.failure_count = 0
 43 |         self.success_count = 0
 44 |         self.last_failure_time: Optional[float] = None
 45 |         
 46 |         # Metrics tracking
 47 |         self.total_requests = 0
 48 |         self.total_failures = 0
 49 |         self.total_successes = 0
 50 |         self.total_timeouts = 0
 51 |         self.total_circuit_opens = 0
 52 |         
 53 |     def __call__(self, func: Callable) -> Callable:
 54 |         """Decorator to wrap functions with circuit breaker"""
 55 |         @wraps(func)
 56 |         async def async_wrapper(*args, **kwargs):
 57 |             return await self._call_async(func, *args, **kwargs)
 58 |             
 59 |         @wraps(func)
 60 |         def sync_wrapper(*args, **kwargs):
 61 |             return self._call_sync(func, *args, **kwargs)
 62 |             
 63 |         return async_wrapper if asyncio.iscoroutinefunction(func) else sync_wrapper
 64 |     
 65 |     async def _call_async(self, func: Callable, *args, **kwargs) -> Any:
 66 |         """Execute async function with circuit breaker protection"""
 67 |         self.total_requests += 1
 68 |         
 69 |         # Check if circuit is open
 70 |         if self.state == CircuitState.OPEN:
 71 |             if self._should_attempt_reset():
 72 |                 self._move_to_half_open()
 73 |             else:
 74 |                 logger.warning(f"Circuit breaker {self.name} is OPEN, failing fast")
 75 |                 raise CircuitBreakerOpenException(f"Circuit breaker {self.name} is open")
 76 |         
 77 |         try:
 78 |             # Execute with timeout
 79 |             result = await asyncio.wait_for(
 80 |                 func(*args, **kwargs),
 81 |                 timeout=self.config.timeout
 82 |             )
 83 |             self._on_success()
 84 |             return result
 85 |             
 86 |         except asyncio.TimeoutError:
 87 |             self.total_timeouts += 1
 88 |             self._on_failure()
 89 |             logger.error(f"Circuit breaker {self.name}: Request timed out after {self.config.timeout}s")
 90 |             raise
 91 |             
 92 |         except self.config.expected_exception as e:
 93 |             self._on_failure()
 94 |             logger.error(f"Circuit breaker {self.name}: Expected failure: {str(e)}")
 95 |             raise
 96 |             
 97 |         except Exception as e:
 98 |             # Unexpected exceptions don't count as failures
 99 |             logger.error(f"Circuit breaker {self.name}: Unexpected error: {str(e)}")
100 |             raise
101 |     
102 |     def _call_sync(self, func: Callable, *args, **kwargs) -> Any:
103 |         """Execute sync function with circuit breaker protection"""
104 |         self.total_requests += 1
105 |         
106 |         # Check if circuit is open
107 |         if self.state == CircuitState.OPEN:
108 |             if self._should_attempt_reset():
109 |                 self._move_to_half_open()
110 |             else:
111 |                 logger.warning(f"Circuit breaker {self.name} is OPEN, failing fast")
112 |                 raise CircuitBreakerOpenException(f"Circuit breaker {self.name} is open")
113 |         
114 |         try:
115 |             result = func(*args, **kwargs)
116 |             self._on_success()
117 |             return result
118 |             
119 |         except self.config.expected_exception as e:
120 |             self._on_failure()
121 |             logger.error(f"Circuit breaker {self.name}: Expected failure: {str(e)}")
122 |             raise
123 |             
124 |         except Exception as e:
125 |             # Unexpected exceptions don't count as failures
126 |             logger.error(f"Circuit breaker {self.name}: Unexpected error: {str(e)}")
127 |             raise
128 |     
129 |     def _should_attempt_reset(self) -> bool:
130 |         """Check if enough time has passed to attempt reset"""
131 |         if self.last_failure_time is None:
132 |             return False
133 |         return time.time() - self.last_failure_time >= self.config.recovery_timeout
134 |     
135 |     def _move_to_half_open(self):
136 |         """Move circuit to half-open state"""
137 |         self.state = CircuitState.HALF_OPEN
138 |         self.success_count = 0
139 |         logger.info(f"Circuit breaker {self.name} moved to HALF_OPEN")
140 |     
141 |     def _on_success(self):
142 |         """Handle successful request"""
143 |         self.total_successes += 1
144 |         
145 |         if self.state == CircuitState.HALF_OPEN:
146 |             self.success_count += 1
147 |             if self.success_count >= self.config.success_threshold:
148 |                 self._close_circuit()
149 |         elif self.state == CircuitState.CLOSED:
150 |             # Reset failure count on success
151 |             self.failure_count = 0
152 |     
153 |     def _on_failure(self):
154 |         """Handle failed request"""
155 |         self.total_failures += 1
156 |         self.failure_count += 1
157 |         self.last_failure_time = time.time()
158 |         
159 |         if self.state == CircuitState.HALF_OPEN:
160 |             # Any failure in half-open moves back to open
161 |             self._open_circuit()
162 |         elif self.state == CircuitState.CLOSED:
163 |             if self.failure_count >= self.config.failure_threshold:
164 |                 self._open_circuit()
165 |     
166 |     def _open_circuit(self):
167 |         """Open the circuit breaker"""
168 |         self.state = CircuitState.OPEN
169 |         self.total_circuit_opens += 1
170 |         logger.warning(f"Circuit breaker {self.name} OPENED after {self.failure_count} failures")
171 |     
172 |     def _close_circuit(self):
173 |         """Close the circuit breaker"""
174 |         self.state = CircuitState.CLOSED
175 |         self.failure_count = 0
176 |         self.success_count = 0
177 |         logger.info(f"Circuit breaker {self.name} CLOSED - service recovered")
178 |     
179 |     def get_stats(self) -> Dict[str, Any]:
180 |         """Get circuit breaker statistics"""
181 |         return {
182 |             'name': self.name,
183 |             'state': self.state.value,
184 |             'failure_count': self.failure_count,
185 |             'success_count': self.success_count,
186 |             'total_requests': self.total_requests,
187 |             'total_failures': self.total_failures,
188 |             'total_successes': self.total_successes,
189 |             'total_timeouts': self.total_timeouts,
190 |             'total_circuit_opens': self.total_circuit_opens,
191 |             'failure_rate': self.total_failures / max(self.total_requests, 1),
192 |             'last_failure_time': self.last_failure_time,
193 |             'config': {
194 |                 'failure_threshold': self.config.failure_threshold,
195 |                 'recovery_timeout': self.config.recovery_timeout,
196 |                 'success_threshold': self.config.success_threshold,
197 |                 'timeout': self.config.timeout
198 |             }
199 |         }
200 |     
201 |     def reset(self):
202 |         """Manually reset the circuit breaker"""
203 |         self.state = CircuitState.CLOSED
204 |         self.failure_count = 0
205 |         self.success_count = 0
206 |         self.last_failure_time = None
207 |         logger.info(f"Circuit breaker {self.name} manually reset")
208 | 
209 | 
210 | class RetryConfig:
211 |     """Configuration for retry mechanism"""
212 |     def __init__(
213 |         self,
214 |         max_attempts: int = 3,
215 |         base_delay: float = 1.0,
216 |         max_delay: float = 60.0,
217 |         backoff_factor: float = 2.0,
218 |         jitter: bool = True
219 |     ):
220 |         self.max_attempts = max_attempts
221 |         self.base_delay = base_delay
222 |         self.max_delay = max_delay
223 |         self.backoff_factor = backoff_factor
224 |         self.jitter = jitter
225 | 
226 | 
227 | async def retry_with_backoff(
228 |     func: Callable,
229 |     config: RetryConfig = None,
230 |     exceptions: tuple = (Exception,),
231 |     *args,
232 |     **kwargs
233 | ) -> Any:
234 |     """
235 |     Retry function with exponential backoff
236 |     """
237 |     import random
238 |     
239 |     config = config or RetryConfig()
240 |     last_exception = None
241 |     
242 |     for attempt in range(config.max_attempts):
243 |         try:
244 |             if asyncio.iscoroutinefunction(func):
245 |                 return await func(*args, **kwargs)
246 |             else:
247 |                 return func(*args, **kwargs)
248 |                 
249 |         except exceptions as e:
250 |             last_exception = e
251 |             
252 |             if attempt == config.max_attempts - 1:
253 |                 # Last attempt, re-raise the exception
254 |                 raise e
255 |             
256 |             # Calculate delay with exponential backoff
257 |             delay = min(
258 |                 config.base_delay * (config.backoff_factor ** attempt),
259 |                 config.max_delay
260 |             )
261 |             
262 |             # Add jitter to prevent thundering herd
263 |             if config.jitter:
264 |                 delay *= (0.5 + random.random() * 0.5)
265 |             
266 |             logger.warning(
267 |                 f"Attempt {attempt + 1} failed: {str(e)}. "
268 |                 f"Retrying in {delay:.2f}s..."
269 |             )
270 |             
271 |             await asyncio.sleep(delay)
272 |     
273 |     # Should never reach here, but just in case
274 |     if last_exception:
275 |         raise last_exception
276 | 
277 | 
278 | # Global circuit breaker registry
279 | _circuit_breakers: Dict[str, CircuitBreaker] = {}
280 | 
281 | def get_circuit_breaker(name: str, config: CircuitBreakerConfig = None) -> CircuitBreaker:
282 |     """Get or create a circuit breaker by name"""
283 |     if name not in _circuit_breakers:
284 |         _circuit_breakers[name] = CircuitBreaker(name, config)
285 |     return _circuit_breakers[name]
286 | 
287 | def get_all_circuit_breakers() -> Dict[str, CircuitBreaker]:
288 |     """Get all registered circuit breakers"""
289 |     return _circuit_breakers.copy()
290 | 
291 | def reset_all_circuit_breakers():
292 |     """Reset all circuit breakers - useful for testing"""
293 |     for cb in _circuit_breakers.values():
294 |         cb.reset()
295 | 
296 | # Convenience decorators
297 | def circuit_breaker(
298 |     name: str,
299 |     failure_threshold: int = 5,
300 |     recovery_timeout: int = 60,
301 |     timeout: float = 30.0
302 | ):
303 |     """Decorator for easy circuit breaker application"""
304 |     config = CircuitBreakerConfig(
305 |         failure_threshold=failure_threshold,
306 |         recovery_timeout=recovery_timeout,
307 |         timeout=timeout
308 |     )
309 |     cb = get_circuit_breaker(name, config)
310 |     return cb
311 | 
312 | def with_retry(
313 |     max_attempts: int = 3,
314 |     base_delay: float = 1.0,
315 |     exceptions: tuple = (Exception,)
316 | ):
317 |     """Decorator for adding retry functionality"""
318 |     def decorator(func):
319 |         @wraps(func)
320 |         async def async_wrapper(*args, **kwargs):
321 |             config = RetryConfig(max_attempts=max_attempts, base_delay=base_delay)
322 |             return await retry_with_backoff(func, config, exceptions, *args, **kwargs)
323 |         
324 |         @wraps(func)
325 |         def sync_wrapper(*args, **kwargs):
326 |             # For sync functions, we'll need to handle this differently
327 |             # For now, just call the function directly
328 |             return func(*args, **kwargs)
329 |         
330 |         return async_wrapper if asyncio.iscoroutinefunction(func) else sync_wrapper
331 |     return decorator
332 | 


--------------------------------------------------------------------------------
/docker-compose.yml:
--------------------------------------------------------------------------------
  1 | version: '3.8'
  2 | 
  3 | services:
  4 |   redis:
  5 |     image: redis:alpine
  6 |     container_name: crypto-redis
  7 |     ports:
  8 |       - "6379:6379"
  9 |     networks:
 10 |       - crypto-net
 11 |     healthcheck:
 12 |       test: ["CMD", "redis-cli", "ping"]
 13 |       interval: 5s
 14 |       timeout: 3s
 15 |       retries: 3
 16 |     volumes:
 17 |       - redis-data:/data
 18 |     restart: unless-stopped
 19 | 
 20 |   redis-exporter:
 21 |     image: oliver006/redis_exporter:latest
 22 |     container_name: crypto-redis-exporter
 23 |     networks:
 24 |       - crypto-net
 25 |     depends_on:
 26 |       - redis
 27 |     command: --redis.addr=redis://redis:6379
 28 |     restart: unless-stopped
 29 | 
 30 |   market-monitor:
 31 |     build: .
 32 |     container_name: crypto-market-monitor
 33 |     command: python3 services/market_monitor_service.py
 34 |     environment:
 35 |       - BINANCE_API_KEY=${BINANCE_API_KEY}
 36 |       - BINANCE_API_SECRET=${BINANCE_API_SECRET}
 37 |       - REDIS_HOST=${REDIS_HOST}
 38 |       - REDIS_PORT=${REDIS_PORT}
 39 |       - SERVICE_PORT=${MARKET_MONITOR_PORT}
 40 |       - ENABLE_METRICS=true
 41 |     ports:
 42 |       - "${MARKET_MONITOR_PORT}:${MARKET_MONITOR_PORT}"
 43 |     volumes:
 44 |       - ./config.json:/app/config.json
 45 |       - ./logs:/app/logs
 46 |       - ./data:/app/data
 47 |     networks:
 48 |       - crypto-net
 49 |     depends_on:
 50 |       redis:
 51 |         condition: service_healthy
 52 |     healthcheck:
 53 |       test: ["CMD", "nc", "-z", "crypto-market-monitor", "${MARKET_MONITOR_PORT}"]
 54 |       interval: 30s
 55 |       timeout: 10s
 56 |       retries: 3
 57 |     restart: unless-stopped
 58 | 
 59 |   trade-executor:
 60 |     build: .
 61 |     container_name: crypto-trade-executor
 62 |     command: python3 services/trade_executor_service.py
 63 |     environment:
 64 |       - BINANCE_API_KEY=${BINANCE_API_KEY}
 65 |       - BINANCE_API_SECRET=${BINANCE_API_SECRET}
 66 |       - REDIS_HOST=${REDIS_HOST}
 67 |       - REDIS_PORT=${REDIS_PORT}
 68 |       - SERVICE_PORT=${TRADE_EXECUTOR_PORT}
 69 |       - ENABLE_METRICS=true
 70 |     ports:
 71 |       - "${TRADE_EXECUTOR_PORT}:${TRADE_EXECUTOR_PORT}"
 72 |     volumes:
 73 |       - ./config.json:/app/config.json
 74 |       - ./logs:/app/logs
 75 |       - ./data:/app/data
 76 |     networks:
 77 |       - crypto-net
 78 |     depends_on:
 79 |       redis:
 80 |         condition: service_healthy
 81 |       market-monitor:
 82 |         condition: service_healthy
 83 |     healthcheck:
 84 |       test: ["CMD", "nc", "-z", "crypto-trade-executor", "${TRADE_EXECUTOR_PORT}"]
 85 |       interval: 30s
 86 |       timeout: 10s
 87 |       retries: 3
 88 |     restart: unless-stopped
 89 | 
 90 |   ai-analyzer:
 91 |     build: .
 92 |     container_name: crypto-ai-analyzer
 93 |     command: python3 services/ai_analyzer_service.py
 94 |     environment:
 95 |       - OPENAI_API_KEY=${OPENAI_API_KEY}
 96 |       - REDIS_HOST=${REDIS_HOST}
 97 |       - REDIS_PORT=${REDIS_PORT}
 98 |       - SERVICE_PORT=${AI_ANALYZER_PORT}
 99 |       - ENABLE_METRICS=true
100 |     ports:
101 |       - "${AI_ANALYZER_PORT}:${AI_ANALYZER_PORT}"
102 |     volumes:
103 |       - ./config.json:/app/config.json
104 |       - ./logs:/app/logs
105 |       - ./data:/app/data
106 |     networks:
107 |       - crypto-net
108 |     depends_on:
109 |       redis:
110 |         condition: service_healthy
111 |       market-monitor:
112 |         condition: service_healthy
113 |     healthcheck:
114 |       test: ["CMD", "nc", "-z", "crypto-ai-analyzer", "${AI_ANALYZER_PORT}"]
115 |       interval: 30s
116 |       timeout: 10s
117 |       retries: 3
118 |     restart: unless-stopped
119 | 
120 |   strategy-evolution:
121 |     build: .
122 |     container_name: crypto-strategy-evolution
123 |     command: python3 services/strategy_evolution_service.py
124 |     environment:
125 |       - OPENAI_API_KEY=${OPENAI_API_KEY}
126 |       - CLOUDFLARE_API_TOKEN=${CLOUDFLARE_API_TOKEN}
127 |       - CLOUDFLARE_ACCOUNT_ID=${CLOUDFLARE_ACCOUNT_ID}
128 |       - CLOUDFLARE_ZONE_ID=${CLOUDFLARE_ZONE_ID}
129 |       - REDIS_HOST=${REDIS_HOST}
130 |       - REDIS_PORT=${REDIS_PORT}
131 |       - SERVICE_PORT=${STRATEGY_EVOLUTION_PORT}
132 |       - ENABLE_METRICS=true
133 |     ports:
134 |       - "${STRATEGY_EVOLUTION_PORT}:${STRATEGY_EVOLUTION_PORT}"
135 |     volumes:
136 |       - ./config.json:/app/config.json
137 |       - ./logs:/app/logs
138 |       - ./data:/app/data
139 |       - ./strategies:/app/strategies
140 |     networks:
141 |       - crypto-net
142 |     depends_on:
143 |       redis:
144 |         condition: service_healthy
145 |       market-monitor:
146 |         condition: service_healthy
147 |       ai-analyzer:
148 |         condition: service_healthy
149 |     healthcheck:
150 |       test: ["CMD", "nc", "-z", "crypto-strategy-evolution", "${STRATEGY_EVOLUTION_PORT}"]
151 |       interval: 30s
152 |       timeout: 10s
153 |       retries: 3
154 |     restart: unless-stopped
155 |     
156 |   dashboard:
157 |     build: .
158 |     container_name: crypto-dashboard
159 |     command: python3 dashboard.py
160 |     environment:
161 |       - REDIS_HOST=${REDIS_HOST}
162 |       - REDIS_PORT=${REDIS_PORT}
163 |       - REDIS_PASSWORD=${REDIS_PASSWORD}
164 |       - ENABLE_METRICS=true
165 |       - DASH_FONT_AWESOME_SERVE_LOCALLY=true
166 |     ports:
167 |       - "8050:8050"
168 |     volumes:
169 |       - ./config.json:/app/config.json
170 |       - ./logs:/app/logs
171 |       - ./static:/app/static
172 |     networks:
173 |       - crypto-net
174 |     depends_on:
175 |       redis:
176 |         condition: service_healthy
177 |       portfolio-risk:
178 |         condition: service_started
179 |       ai-explainability:
180 |         condition: service_started
181 |       model-registry:
182 |         condition: service_started
183 |     healthcheck:
184 |       test: ["CMD", "nc", "-z", "crypto-dashboard", "8050"]
185 |       interval: 30s
186 |       timeout: 10s
187 |       retries: 3
188 |     restart: unless-stopped
189 |     
190 |   backtesting:
191 |     build: .
192 |     container_name: crypto-backtesting
193 |     # No specific command as this is used for running ad-hoc backtests
194 |     environment:
195 |       - BINANCE_API_KEY=${BINANCE_API_KEY}
196 |       - BINANCE_API_SECRET=${BINANCE_API_SECRET}
197 |       - OPENAI_API_KEY=${OPENAI_API_KEY}
198 |       - LUNARCRUSH_API_KEY=${LUNARCRUSH_API_KEY}
199 |     volumes:
200 |       - ./config.json:/app/config.json
201 |       - ./logs:/app/logs
202 |       - ./backtesting:/app/backtesting
203 |       - ./backtesting/data:/app/backtesting/data
204 |       - ./backtesting/results:/app/backtesting/results
205 |       - ./backtesting/plots:/app/backtesting/plots
206 |     networks:
207 |       - crypto-net
208 |     depends_on:
209 |       - redis
210 |     profiles:
211 |       - tools
212 |     # No auto-start - use docker-compose run backtesting python run_backtest.py [...]
213 | 
214 |   # AI Model Services
215 |   model-registry:
216 |     build: .
217 |     container_name: crypto-model-registry
218 |     command: python3 run_ai_model_services.py --model-registry
219 |     environment:
220 |       - OPENAI_API_KEY=${OPENAI_API_KEY}
221 |       - REDIS_HOST=${REDIS_HOST}
222 |       - REDIS_PORT=${REDIS_PORT}
223 |       - SERVICE_PORT=${MODEL_REGISTRY_PORT}
224 |       - ENABLE_METRICS=true
225 |     ports:
226 |       - "${MODEL_REGISTRY_PORT}:${MODEL_REGISTRY_PORT}"
227 |     volumes:
228 |       - ./config.json:/app/config.json
229 |       - ./logs:/app/logs
230 |       - ./data:/app/data
231 |       - ./models:/app/models
232 |     networks:
233 |       - crypto-net
234 |     depends_on:
235 |       redis:
236 |         condition: service_healthy
237 |     healthcheck:
238 |       test: ["CMD", "nc", "-z", "crypto-model-registry", "${MODEL_REGISTRY_PORT}"]
239 |       interval: 30s
240 |       timeout: 10s
241 |       retries: 3
242 |     restart: unless-stopped
243 |     
244 |   portfolio-risk:
245 |     build: .
246 |     container_name: crypto-portfolio-risk
247 |     command: python3 services/portfolio_risk_service.py
248 |     environment:
249 |       - BINANCE_API_KEY=${BINANCE_API_KEY}
250 |       - BINANCE_API_SECRET=${BINANCE_API_SECRET}
251 |       - REDIS_HOST=${REDIS_HOST}
252 |       - REDIS_PORT=${REDIS_PORT}
253 |       - SERVICE_PORT=${PORTFOLIO_RISK_PORT}
254 |       - ENABLE_METRICS=true
255 |     ports:
256 |       - "${PORTFOLIO_RISK_PORT}:${PORTFOLIO_RISK_PORT}"
257 |     volumes:
258 |       - ./config.json:/app/config.json
259 |       - ./logs:/app/logs
260 |       - ./data:/app/data
261 |     networks:
262 |       - crypto-net
263 |     depends_on:
264 |       redis:
265 |         condition: service_healthy
266 |       trade-executor:
267 |         condition: service_healthy
268 |     healthcheck:
269 |       test: ["CMD", "nc", "-z", "crypto-portfolio-risk", "${PORTFOLIO_RISK_PORT}"]
270 |       interval: 30s
271 |       timeout: 10s
272 |       retries: 3
273 |     restart: unless-stopped
274 | 
275 |   ai-explainability:
276 |     build: .
277 |     container_name: crypto-ai-explainability
278 |     command: python3 run_ai_model_services.py --explainability
279 |     environment:
280 |       - OPENAI_API_KEY=${OPENAI_API_KEY}
281 |       - REDIS_HOST=${REDIS_HOST}
282 |       - REDIS_PORT=${REDIS_PORT}
283 |       - SERVICE_PORT=${AI_EXPLAINABILITY_PORT}
284 |       - ENABLE_METRICS=true
285 |     ports:
286 |       - "${AI_EXPLAINABILITY_PORT}:${AI_EXPLAINABILITY_PORT}"
287 |     volumes:
288 |       - ./config.json:/app/config.json
289 |       - ./logs:/app/logs
290 |       - ./data:/app/data
291 |       - ./explanations:/app/explanations
292 |     networks:
293 |       - crypto-net
294 |     depends_on:
295 |       redis:
296 |         condition: service_healthy
297 |       ai-analyzer:
298 |         condition: service_healthy
299 |     healthcheck:
300 |       test: ["CMD", "nc", "-z", "crypto-ai-explainability", "${AI_EXPLAINABILITY_PORT}"]
301 |       interval: 30s
302 |       timeout: 10s
303 |       retries: 3
304 |     restart: unless-stopped
305 | 
306 |   # Monitoring Stack
307 |   prometheus:
308 |     image: prom/prometheus:latest
309 |     container_name: crypto-prometheus
310 |     volumes:
311 |       - ./monitoring/prometheus.yml:/etc/prometheus/prometheus.yml
312 |       - prometheus-data:/prometheus
313 |     command:
314 |       - '--config.file=/etc/prometheus/prometheus.yml'
315 |       - '--storage.tsdb.path=/prometheus'
316 |       - '--web.console.libraries=/etc/prometheus/console_libraries'
317 |       - '--web.console.templates=/etc/prometheus/consoles'
318 |       - '--web.enable-lifecycle'
319 |     ports:
320 |       - "9090:9090"
321 |     networks:
322 |       - crypto-net
323 |     restart: unless-stopped
324 | 
325 |   grafana:
326 |     image: grafana/grafana:latest
327 |     container_name: crypto-grafana
328 |     volumes:
329 |       - ./monitoring/grafana/provisioning:/etc/grafana/provisioning
330 |       - grafana-data:/var/lib/grafana
331 |     environment:
332 |       - GF_SECURITY_ADMIN_USER=${GRAFANA_ADMIN_USER:-admin}
333 |       - GF_SECURITY_ADMIN_PASSWORD=${GRAFANA_ADMIN_PASSWORD:-admin}
334 |       - GF_USERS_ALLOW_SIGN_UP=false
335 |     ports:
336 |       - "3000:3000"
337 |     networks:
338 |       - crypto-net
339 |     depends_on:
340 |       - prometheus
341 |     restart: unless-stopped
342 | 
343 |   node-exporter:
344 |     image: prom/node-exporter:latest
345 |     container_name: crypto-node-exporter
346 |     volumes:
347 |       - /proc:/host/proc:ro
348 |       - /sys:/host/sys:ro
349 |       - /:/rootfs:ro
350 |     command:
351 |       - '--path.procfs=/host/proc'
352 |       - '--path.rootfs=/rootfs'
353 |       - '--path.sysfs=/host/sys'
354 |       - '--collector.filesystem.mount-points-exclude=^/(sys|proc|dev|host|etc)($$|/)'
355 |     networks:
356 |       - crypto-net
357 |     restart: unless-stopped
358 | 
359 |   elasticsearch:
360 |     image: docker.elastic.co/elasticsearch/elasticsearch:7.17.10
361 |     container_name: crypto-elasticsearch
362 |     environment:
363 |       - discovery.type=single-node
364 |       - "ES_JAVA_OPTS=-Xms512m -Xmx512m"
365 |     volumes:
366 |       - elasticsearch-data:/usr/share/elasticsearch/data
367 |     ports:
368 |       - "9200:9200"
369 |     networks:
370 |       - crypto-net
371 |     healthcheck:
372 |       test: ["CMD-SHELL", "curl -s http://localhost:9200 >/dev/null || exit 1"]
373 |       interval: 30s
374 |       timeout: 10s
375 |       retries: 3
376 |     restart: unless-stopped
377 | 
378 |   logstash:
379 |     image: docker.elastic.co/logstash/logstash:7.17.10
380 |     container_name: crypto-logstash
381 |     volumes:
382 |       - ./monitoring/logstash.conf:/usr/share/logstash/pipeline/logstash.conf
383 |       - ./logs:/app/logs:ro
384 |     depends_on:
385 |       elasticsearch:
386 |         condition: service_healthy
387 |     networks:
388 |       - crypto-net
389 |     restart: unless-stopped
390 | 
391 |   kibana:
392 |     image: docker.elastic.co/kibana/kibana:7.17.10
393 |     container_name: crypto-kibana
394 |     environment:
395 |       - ELASTICSEARCH_HOSTS=http://elasticsearch:9200
396 |     ports:
397 |       - "5601:5601"
398 |     networks:
399 |       - crypto-net
400 |     depends_on:
401 |       elasticsearch:
402 |         condition: service_healthy
403 |     restart: unless-stopped
404 | 
405 | networks:
406 |   crypto-net:
407 |     driver: bridge
408 | 
409 | volumes:
410 |   redis-data:
411 |   logs:
412 |   data:
413 |   strategies:
414 |   models:
415 |   explanations:
416 |   prometheus-data:
417 |   grafana-data:
418 |   elasticsearch-data:
419 | 


--------------------------------------------------------------------------------
/STRATEGY_EVOLUTION.md:
--------------------------------------------------------------------------------
  1 | # Strategy Evolution System
  2 | 
  3 | ## Overview
  4 | 
  5 | A self-improving trading system that uses OpenAI to generate, test, and evolve trading strategies, incorporating both technical analysis and social sentiment metrics, deploying successful ones as Cloudflare Workers.
  6 | 
  7 | ## System Components
  8 | 
  9 | ### 1. Strategy Generator Service
 10 | ```python
 11 | class StrategyGenerator:
 12 |     def generate_strategy():
 13 |         # Use OpenAI to create new trading strategies
 14 |         # Incorporate social metrics and sentiment analysis
 15 |         # Return strategy as executable code
 16 | ```
 17 | 
 18 | Key Features:
 19 | - Uses OpenAI to generate trading strategies in JavaScript (for Cloudflare Workers)
 20 | - Implements various trading patterns (Mean Reversion, Trend Following, etc.)
 21 | - Integrates social sentiment analysis from LunarCrush
 22 | - Generates risk management rules with social metrics consideration
 23 | - Creates backtesting parameters
 24 | 
 25 | ### 2. Strategy Validator Service
 26 | ```python
 27 | class StrategyValidator:
 28 |     def validate_strategy(strategy_code):
 29 |         # Validate strategy code
 30 |         # Test for common issues
 31 |         # Validate social metrics integration
 32 |         # Return validation results
 33 | ```
 34 | 
 35 | Validation Checks:
 36 | - Code security analysis
 37 | - Performance impact assessment
 38 | - Resource usage estimation
 39 | - Risk management validation
 40 | - Social metrics reliability checks
 41 | - Sentiment analysis validation
 42 | 
 43 | ### 3. Backtesting Engine
 44 | ```python
 45 | class BacktestEngine:
 46 |     def backtest_strategy(strategy, historical_data, social_data):
 47 |         # Run strategy against historical data
 48 |         # Include historical social metrics
 49 |         # Calculate performance metrics
 50 |         # Return detailed results
 51 | ```
 52 | 
 53 | Metrics Tracked:
 54 | - Sharpe Ratio
 55 | - Maximum Drawdown
 56 | - Win Rate
 57 | - Profit Factor
 58 | - Risk-Adjusted Return
 59 | - Social Sentiment Correlation
 60 | - Social Volume Impact
 61 | 
 62 | ### 4. Strategy Evolution Engine
 63 | ```python
 64 | class StrategyEvolution:
 65 |     def evolve_strategy(strategy, performance_data, social_metrics):
 66 |         # Use OpenAI to improve strategy based on results
 67 |         # Incorporate social sentiment trends
 68 |         # Return improved strategy
 69 | ```
 70 | 
 71 | Evolution Parameters:
 72 | - Performance targets
 73 | - Risk limits
 74 | - Market conditions
 75 | - Trading costs
 76 | - Social sentiment thresholds
 77 | - Social volume requirements
 78 | 
 79 | ### 5. Cloudflare Worker Deployment System
 80 | ```python
 81 | class WorkerDeployment:
 82 |     def deploy_strategy(strategy_code):
 83 |         # Deploy strategy as Cloudflare Worker
 84 |         # Monitor performance and social metrics
 85 |         # Return deployment status
 86 | ```
 87 | 
 88 | Deployment Process:
 89 | 1. Package strategy code
 90 | 2. Create Worker
 91 | 3. Deploy to Cloudflare
 92 | 4. Monitor execution and social metrics
 93 | 
 94 | ## Implementation Plan
 95 | 
 96 | ### Phase 1: Strategy Generation
 97 | 
 98 | 1. Create OpenAI Prompts:
 99 | ```json
100 | {
101 |     "system": "You are an expert algorithmic trader...",
102 |     "user": "Create a mean reversion strategy incorporating social sentiment with the following parameters...",
103 |     "parameters": {
104 |         "timeframe": "5m",
105 |         "risk_limit": 2,
106 |         "target_profit": 1.5,
107 |         "min_social_volume": 1000,
108 |         "min_social_sentiment": 0.6
109 |     }
110 | }
111 | ```
112 | 
113 | 2. Strategy Template with Social Metrics:
114 | ```javascript
115 | export default {
116 |     async fetch(request, env) {
117 |         // Get market data
118 |         const marketData = await getMarketData();
119 |         // Get social metrics
120 |         const socialMetrics = await getSocialMetrics();
121 |         // Combined analysis
122 |         const analysis = await analyzeMarket(marketData, socialMetrics);
123 |         // Strategy implementation
124 |         return handleAnalysis(analysis);
125 |     }
126 | }
127 | ```
128 | 
129 | ### Phase 2: Testing & Validation
130 | 
131 | 1. Backtesting Infrastructure:
132 | ```python
133 | def run_backtest(strategy_code, market_data, social_data):
134 |     results = {
135 |         'profit_loss': [],
136 |         'trades': [],
137 |         'metrics': {},
138 |         'social_impact': {}
139 |     }
140 |     return results
141 | ```
142 | 
143 | 2. Performance Metrics:
144 | ```python
145 | def calculate_metrics(backtest_results):
146 |     metrics = {
147 |         'sharpe_ratio': 0,
148 |         'max_drawdown': 0,
149 |         'win_rate': 0,
150 |         'social_correlation': 0,
151 |         'sentiment_accuracy': 0
152 |     }
153 |     return metrics
154 | ```
155 | 
156 | ### Phase 3: Evolution System
157 | 
158 | 1. Performance Analysis:
159 | ```python
160 | def analyze_performance(strategy_results):
161 |     analysis = {
162 |         'strengths': [],
163 |         'weaknesses': [],
164 |         'improvement_areas': [],
165 |         'social_metrics_impact': {
166 |             'sentiment_influence': 0,
167 |             'volume_impact': 0,
168 |             'engagement_correlation': 0
169 |         },
170 |         'feature_importance': {
171 |             'top_features': {},
172 |             'top_categories': {},
173 |             'recommendations': {}
174 |         }
175 |     }
176 |     return analysis
177 | ```
178 | 
179 | 2. Feature Importance Analysis:
180 | ```python
181 | def analyze_feature_importance(strategy_data, trading_history):
182 |     # Calculate permutation importance for features
183 |     permutation_results = calculate_permutation_importance(strategy_data)
184 |     
185 |     # Group features by category
186 |     category_importance = calculate_category_importance(permutation_results)
187 |     
188 |     # Generate recommendations for feature prioritization
189 |     recommendations = generate_feature_recommendations(permutation_results, category_importance)
190 |     
191 |     # Optimize model based on feature importance
192 |     optimized_model = create_optimized_model(permutation_results)
193 |     
194 |     return {
195 |         'permutation_importance': permutation_results,
196 |         'category_importance': category_importance,
197 |         'recommendations': recommendations,
198 |         'optimized_model': optimized_model
199 |     }
200 | ```
201 | 
202 | 3. Strategy Improvement:
203 | ```python
204 | def improve_strategy(analysis):
205 |     # Use feature importance insights to focus improvements
206 |     feature_importance = analysis['feature_importance']
207 |     top_features = feature_importance['top_features']
208 |     feature_recommendations = feature_importance['recommendations']
209 |     
210 |     # Create improvement prompt with feature importance guidance
211 |     prompt = create_improvement_prompt(analysis)
212 |     
213 |     # Add feature importance insights to prompt
214 |     prompt += f"\nFocus on these high-importance features: {', '.join(feature_recommendations['features_to_prioritize'])}"
215 |     prompt += f"\nConsider reducing reliance on: {', '.join(feature_recommendations['features_to_reconsider'])}"
216 |     
217 |     improved_strategy = openai.chat.completions.create(
218 |         model="gpt-4o",
219 |         messages=[
220 |             {"role": "system", "content": "You are improving a trading strategy with feature importance insights..."},
221 |             {"role": "user", "content": prompt}
222 |         ]
223 |     )
224 |     return improved_strategy
225 | ```
226 | 
227 | ### Phase 4: Worker Deployment
228 | 
229 | 1. Worker Creation with Social Metrics:
230 | ```javascript
231 | async function deployWorker(strategy) {
232 |     const worker = new CloudflareWorker({
233 |         name: `strategy-${strategy.id}`,
234 |         code: strategy.code,
235 |         env: {
236 |             LUNARCRUSH_API_KEY: process.env.LUNARCRUSH_API_KEY
237 |         }
238 |     });
239 |     return worker;
240 | }
241 | ```
242 | 
243 | 2. Enhanced Monitoring System:
244 | ```javascript
245 | class WorkerMonitor {
246 |     constructor(worker) {
247 |         this.worker = worker;
248 |         this.metrics = {
249 |             performance: {},
250 |             social: {}
251 |         };
252 |     }
253 | 
254 |     async monitor() {
255 |         // Monitor worker performance
256 |         // Track social metrics impact
257 |         // Collect metrics
258 |         // Alert on issues
259 |     }
260 | }
261 | ```
262 | 
263 | ## Evolution Process
264 | 
265 | 1. Initial Strategy Generation:
266 | ```mermaid
267 | graph LR
268 |     A[OpenAI] --> B[Generate Strategy]
269 |     B --> C[Validate]
270 |     C --> D[Backtest]
271 |     D --> E[Deploy Worker]
272 |     F[Social Metrics] --> B
273 |     F --> C
274 |     F --> D
275 | ```
276 | 
277 | 2. Continuous Improvement with Feature Importance:
278 | ```mermaid
279 | graph LR
280 |     A[Monitor Performance] --> B[Analyze Results]
281 |     G[Feature Importance] --> B
282 |     B --> C[Generate Improvements]
283 |     C --> D[Test New Version]
284 |     D --> E[Deploy Update]
285 |     F[Social Trends] --> B
286 |     F --> C
287 |     G --> C
288 |     G --> H[Model Optimization]
289 |     H --> D
290 | ```
291 | 
292 | ## Performance Goals
293 | 
294 | 1. Strategy Metrics:
295 | ```json
296 | {
297 |     "min_sharpe_ratio": 1.5,
298 |     "max_drawdown": 0.15,
299 |     "min_win_rate": 0.55,
300 |     "min_profit_factor": 1.3,
301 |     "min_social_correlation": 0.3,
302 |     "min_sentiment_accuracy": 0.65
303 | }
304 | ```
305 | 
306 | 2. Evolution Targets:
307 | ```json
308 | {
309 |     "improvement_threshold": 0.1,
310 |     "max_iterations": 10,
311 |     "convergence_criteria": 0.02,
312 |     "social_metrics_weight": 0.3,
313 |     "feature_importance": {
314 |         "weight": 0.25,
315 |         "min_importance_threshold": 0.05,
316 |         "feature_pruning_threshold": 0.25,
317 |         "top_features_count": 10,
318 |         "model_update_frequency": "daily",
319 |         "optimization_enabled": true
320 |     }
321 | }
322 | ```
323 | 
324 | ## Implementation Example
325 | 
326 | 1. Generate Strategy with Social Integration:
327 | ```python
328 | async def generate_new_strategy():
329 |     prompt = create_strategy_prompt()
330 |     response = await openai.chat.completions.create(
331 |         model="gpt-4o",
332 |         messages=[
333 |             {"role": "system", "content": "Create a trading strategy incorporating social metrics..."},
334 |             {"role": "user", "content": prompt}
335 |         ]
336 |     )
337 |     return parse_strategy(response)
338 | ```
339 | 
340 | 2. Deploy as Worker with Social Metrics:
341 | ```javascript
342 | export default {
343 |     async fetch(request, env) {
344 |         const strategy = await loadStrategy();
345 |         const market_data = await fetchMarketData();
346 |         const social_data = await fetchSocialMetrics(env.LUNARCRUSH_API_KEY);
347 |         const signals = await executeStrategy(strategy, market_data, social_data);
348 |         return new Response(JSON.stringify(signals));
349 |     }
350 | }
351 | ```
352 | 
353 | 3. Monitor and Evolve with Feature Importance and Social Trends:
354 | ```python
355 | async def monitor_and_evolve():
356 |     while True:
357 |         # Collect performance data
358 |         performance = await monitor_strategy()
359 |         social_impact = await analyze_social_impact()
360 |         
361 |         # Run feature importance analysis
362 |         feature_importance = await analyze_feature_importance(
363 |             performance.trading_data,
364 |             performance.trade_history
365 |         )
366 |         
367 |         # Check if any factor indicates need for strategy evolution
368 |         needs_update = (
369 |             performance.needs_improvement() or 
370 |             social_impact.indicates_change() or
371 |             feature_importance.significant_changes()
372 |         )
373 |         
374 |         if needs_update:
375 |             # Create comprehensive analysis including feature importance
376 |             combined_analysis = {
377 |                 "performance": performance,
378 |                 "social_impact": social_impact,
379 |                 "feature_importance": feature_importance
380 |             }
381 |             
382 |             # Evolve strategy with all insights
383 |             improved_strategy = await evolve_strategy(combined_analysis)
384 |             
385 |             # Deploy optimized model based on feature importance
386 |             if feature_importance.has_optimized_model():
387 |                 await deploy_optimized_model(feature_importance.optimized_model)
388 |             
389 |             # Deploy improved strategy
390 |             await deploy_new_version(improved_strategy)
391 |             
392 |         # Generate feature importance reports
393 |         if time_for_feature_report():
394 |             await generate_feature_importance_report(feature_importance)
395 |             
396 |         await asyncio.sleep(3600)  # Check hourly
397 | ```
398 | 
399 | ## Security Considerations
400 | 
401 | 1. Code Validation:
402 | - Static analysis
403 | - Sandbox testing
404 | - Resource limits
405 | - Access control
406 | - API key security
407 | - Rate limiting
408 | 
409 | 2. Deployment Safety:
410 | - Gradual rollout
411 | - Performance monitoring
412 | - Automatic rollback
413 | - Error thresholds
414 | - Social metrics validation
415 | 
416 | ## Next Steps
417 | 
418 | 1. Implementation Priority:
419 | - Social Metrics Integration
420 | - Strategy Generator Service
421 | - Backtesting Engine with Social Data
422 | - Worker Deployment System
423 | - Evolution Engine
424 | - Monitoring System
425 | 
426 | 2. Development Phases:
427 | - Phase 1: Basic strategy generation and testing with social metrics
428 | - Phase 2: Worker deployment and monitoring
429 | - Phase 3: Performance analysis and evolution
430 | - Phase 4: Full automation and optimization
431 | 
432 | 3. Timeline:
433 | - Week 1-2: Social metrics integration and basic implementation
434 | - Week 3-4: Testing and validation with social data
435 | - Week 5-6: Evolution system with social trends
436 | - Week 7-8: Production deployment
437 | 
438 | 4. Success Metrics:
439 | - Strategy performance improvement
440 | - Social metrics correlation accuracy
441 | - System stability
442 | - Resource efficiency
443 | - Trading profits
444 | - Sentiment prediction accuracy
445 | 


--------------------------------------------------------------------------------
/backtesting/backtest_engine.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import json
  3 | import asyncio
  4 | import logging as logger
  5 | from datetime import datetime, timedelta
  6 | from typing import Dict, List, Optional, Union, Tuple
  7 | from pathlib import Path
  8 | 
  9 | from .data_manager import HistoricalDataManager
 10 | from .social_data_provider import SocialDataProvider
 11 | from .strategy_tester import StrategyTester
 12 | from .result_analyzer import ResultAnalyzer
 13 | 
 14 | class BacktestEngine:
 15 |     """Main engine for running and managing backtests"""
 16 |     
 17 |     def __init__(self, config_path: str = 'config.json'):
 18 |         """Initialize with configuration"""
 19 |         # Load configuration
 20 |         with open(config_path, 'r') as f:
 21 |             self.config = json.load(f)
 22 |             
 23 |         # Initialize components
 24 |         self.data_manager = HistoricalDataManager(config_path)
 25 |         self.social_provider = SocialDataProvider(self.data_manager)
 26 |         self.strategy_tester = StrategyTester(config_path)
 27 |         self.result_analyzer = ResultAnalyzer()
 28 |         
 29 |         # Task queue for managing backtest operations
 30 |         self.task_queue = asyncio.Queue()
 31 |         self.running_tasks = set()
 32 |     
 33 |     async def fetch_data_for_backtest(self, symbol: str, intervals: List[str],
 34 |                                    start_date: datetime, end_date: datetime = None,
 35 |                                    include_social: bool = True) -> Dict[str, bool]:
 36 |         """Fetch all necessary data for backtesting"""
 37 |         if end_date is None:
 38 |             end_date = datetime.now()
 39 |             
 40 |         results = {}
 41 |         
 42 |         for interval in intervals:
 43 |             try:
 44 |                 logger.info(f"Fetching {interval} data for {symbol} from {start_date} to {end_date}")
 45 |                 market_success, social_success = await self.data_manager.fetch_and_save_data(
 46 |                     symbol, interval, start_date, end_date, include_social
 47 |                 )
 48 |                 
 49 |                 results[interval] = {
 50 |                     'market_data': market_success,
 51 |                     'social_data': social_success if include_social else False
 52 |                 }
 53 |                 
 54 |             except Exception as e:
 55 |                 logger.error(f"Error fetching data for {symbol} ({interval}): {str(e)}")
 56 |                 results[interval] = {
 57 |                     'market_data': False,
 58 |                     'social_data': False,
 59 |                     'error': str(e)
 60 |                 }
 61 |                 
 62 |         return results
 63 |     
 64 |     async def run_backtest(self, symbol: str, interval: str,
 65 |                          start_date: datetime, end_date: datetime = None,
 66 |                          initial_balance: float = 10000.0,
 67 |                          save_results: bool = True) -> Dict:
 68 |         """Run a backtest for a specific symbol and interval"""
 69 |         try:
 70 |             if end_date is None:
 71 |                 end_date = datetime.now()
 72 |                 
 73 |             logger.info(f"Running backtest for {symbol} ({interval}) from {start_date} to {end_date}")
 74 |             
 75 |             # Check if we have data
 76 |             market_data = self.data_manager.load_market_data(symbol, interval, start_date, end_date)
 77 |             if market_data.empty:
 78 |                 # Try to fetch data first
 79 |                 fetch_results = await self.fetch_data_for_backtest(
 80 |                     symbol, [interval], start_date, end_date
 81 |                 )
 82 |                 
 83 |                 if not fetch_results.get(interval, {}).get('market_data', False):
 84 |                     logger.error(f"No market data available for {symbol} ({interval}) and data fetch failed")
 85 |                     return {'error': 'No market data available and data fetch failed'}
 86 |                     
 87 |                 # Try loading again
 88 |                 market_data = self.data_manager.load_market_data(symbol, interval, start_date, end_date)
 89 |                 if market_data.empty:
 90 |                     logger.error(f"No market data available for {symbol} ({interval}) even after fetch attempt")
 91 |                     return {'error': 'No market data available even after fetch attempt'}
 92 |             
 93 |             # Run backtest
 94 |             result = await self.strategy_tester.backtest_strategy(
 95 |                 symbol, interval, start_date, end_date, initial_balance
 96 |             )
 97 |             
 98 |             # Save results if requested
 99 |             if save_results:
100 |                 strategy_name = f"AI_Social_Strategy"
101 |                 result_path = self.strategy_tester.save_results(
102 |                     strategy_name, symbol, interval, start_date, end_date
103 |                 )
104 |                 
105 |                 # Generate equity curve plot
106 |                 plot_path = self.result_analyzer.plot_equity_curve(
107 |                     {'strategy': strategy_name, 'symbol': symbol, 'interval': interval, 'stats': result}
108 |                 )
109 |                 
110 |                 # Generate trade analysis plot if there are trades
111 |                 if result.get('total_trades', 0) > 0:
112 |                     trade_plot_path = self.result_analyzer.plot_trade_analysis(
113 |                         {'strategy': strategy_name, 'symbol': symbol, 'interval': interval, 'stats': result}
114 |                     )
115 |                     
116 |                     result['trade_plot_path'] = trade_plot_path
117 |                 
118 |                 result['result_path'] = result_path
119 |                 result['plot_path'] = plot_path
120 |             
121 |             return result
122 |             
123 |         except Exception as e:
124 |             logger.error(f"Error running backtest for {symbol} ({interval}): {str(e)}")
125 |             return {'error': str(e)}
126 |     
127 |     async def run_multiple_backtests(self, symbols: List[str], intervals: List[str],
128 |                                    start_date: datetime, end_date: datetime = None,
129 |                                    initial_balance: float = 10000.0) -> Dict:
130 |         """Run multiple backtests for different symbols/intervals"""
131 |         results = {}
132 |         
133 |         for symbol in symbols:
134 |             symbol_results = {}
135 |             
136 |             for interval in intervals:
137 |                 try:
138 |                     result = await self.run_backtest(
139 |                         symbol, interval, start_date, end_date, initial_balance
140 |                     )
141 |                     
142 |                     symbol_results[interval] = result
143 |                     
144 |                 except Exception as e:
145 |                     logger.error(f"Error in backtest for {symbol} on {interval}: {str(e)}")
146 |                     symbol_results[interval] = {"error": str(e)}
147 |             
148 |             results[symbol] = symbol_results
149 |         
150 |         # Generate summary report
151 |         all_results = []
152 |         for symbol, sym_results in results.items():
153 |             for interval, result in sym_results.items():
154 |                 if 'error' not in result:
155 |                     all_results.append({
156 |                         'strategy': 'AI_Social_Strategy',
157 |                         'symbol': symbol,
158 |                         'interval': interval,
159 |                         'stats': result
160 |                     })
161 |         
162 |         if all_results:
163 |             summary = self.result_analyzer.generate_summary_report(all_results)
164 |             summary_path = self.result_analyzer.save_summary_report(summary)
165 |             
166 |             # Add summary path to results
167 |             results['summary'] = {
168 |                 'path': summary_path,
169 |                 'profitable_strategies': summary.get('profitable_strategies', 0),
170 |                 'total_results': summary.get('total_results', 0)
171 |             }
172 |             
173 |             # Generate comparison chart
174 |             comparison_path = self.result_analyzer.compare_results(all_results, 'return_pct')
175 |             if comparison_path:
176 |                 results['summary']['comparison_chart'] = comparison_path
177 |         
178 |         return results
179 |     
180 |     def get_available_data(self) -> Dict:
181 |         """Get information about available historical data"""
182 |         symbols = self.data_manager.available_symbols()
183 |         
184 |         available_data = {}
185 |         for symbol in symbols:
186 |             intervals = self.data_manager.available_intervals(symbol)
187 |             symbol_data = {'intervals': {}}
188 |             
189 |             for interval in intervals:
190 |                 start_date, end_date = self.data_manager.get_data_range(symbol, interval)
191 |                 if start_date and end_date:
192 |                     symbol_data['intervals'][interval] = {
193 |                         'start_date': start_date.isoformat(),
194 |                         'end_date': end_date.isoformat(),
195 |                         'days': (end_date - start_date).days
196 |                     }
197 |             
198 |             available_data[symbol] = symbol_data
199 |         
200 |         return available_data
201 |     
202 |     async def fetch_data_for_symbols(self, symbols: List[str], intervals: List[str],
203 |                                    days_back: int = 30) -> Dict:
204 |         """Fetch historical data for multiple symbols and intervals"""
205 |         end_date = datetime.now()
206 |         start_date = end_date - timedelta(days=days_back)
207 |         
208 |         results = {}
209 |         for symbol in symbols:
210 |             symbol_result = await self.fetch_data_for_backtest(
211 |                 symbol, intervals, start_date, end_date
212 |             )
213 |             results[symbol] = symbol_result
214 |         
215 |         return results
216 |     
217 |     async def add_backtest_task(self, task_type: str, params: Dict) -> int:
218 |         """Add a backtest task to the queue"""
219 |         task_id = len(self.running_tasks) + self.task_queue.qsize() + 1
220 |         
221 |         await self.task_queue.put({
222 |             'id': task_id,
223 |             'type': task_type,
224 |             'params': params,
225 |             'status': 'queued',
226 |             'created_at': datetime.now().isoformat()
227 |         })
228 |         
229 |         return task_id
230 |     
231 |     async def process_task_queue(self):
232 |         """Process tasks from the queue"""
233 |         while True:
234 |             try:
235 |                 task = await self.task_queue.get()
236 |                 
237 |                 # Update task status
238 |                 task['status'] = 'running'
239 |                 task['started_at'] = datetime.now().isoformat()
240 |                 
241 |                 # Add to running tasks
242 |                 self.running_tasks.add(task['id'])
243 |                 
244 |                 # Process based on task type
245 |                 if task['type'] == 'fetch_data':
246 |                     params = task['params']
247 |                     result = await self.fetch_data_for_symbols(
248 |                         params.get('symbols', []),
249 |                         params.get('intervals', []),
250 |                         params.get('days_back', 30)
251 |                     )
252 |                     
253 |                 elif task['type'] == 'run_backtest':
254 |                     params = task['params']
255 |                     result = await self.run_backtest(
256 |                         params.get('symbol'),
257 |                         params.get('interval'),
258 |                         datetime.fromisoformat(params.get('start_date')),
259 |                         datetime.fromisoformat(params.get('end_date')) if params.get('end_date') else None,
260 |                         params.get('initial_balance', 10000.0)
261 |                     )
262 |                     
263 |                 elif task['type'] == 'run_multiple_backtests':
264 |                     params = task['params']
265 |                     result = await self.run_multiple_backtests(
266 |                         params.get('symbols', []),
267 |                         params.get('intervals', []),
268 |                         datetime.fromisoformat(params.get('start_date')),
269 |                         datetime.fromisoformat(params.get('end_date')) if params.get('end_date') else None,
270 |                         params.get('initial_balance', 10000.0)
271 |                     )
272 |                     
273 |                 else:
274 |                     result = {'error': f"Unknown task type: {task['type']}"}
275 |                 
276 |                 # Update task status
277 |                 task['status'] = 'completed'
278 |                 task['completed_at'] = datetime.now().isoformat()
279 |                 task['result'] = result
280 |                 
281 |                 # Remove from running tasks
282 |                 self.running_tasks.remove(task['id'])
283 |                 
284 |                 # Mark task as done
285 |                 self.task_queue.task_done()
286 |                 
287 |             except Exception as e:
288 |                 logger.error(f"Error processing task: {str(e)}")
289 |                 
290 |                 # Update task status if possible
291 |                 if 'task' in locals():
292 |                     task['status'] = 'failed'
293 |                     task['error'] = str(e)
294 |                     task['completed_at'] = datetime.now().isoformat()
295 |                     
296 |                     # Remove from running tasks
297 |                     if task['id'] in self.running_tasks:
298 |                         self.running_tasks.remove(task['id'])
299 |                     
300 |                     # Mark task as done
301 |                     self.task_queue.task_done()
302 |                 
303 |                 # Wait before trying next task
304 |                 await asyncio.sleep(1)
305 |     
306 |     async def run(self):
307 |         """Run the backtest engine"""
308 |         # Start task processor
309 |         task_processor = asyncio.create_task(self.process_task_queue())
310 |         
311 |         try:
312 |             # Keep the engine running
313 |             while True:
314 |                 await asyncio.sleep(1)
315 |                 
316 |         except asyncio.CancelledError:
317 |             logger.info("Backtest engine shutting down...")
318 |             
319 |         finally:
320 |             # Cancel task processor
321 |             task_processor.cancel()
322 |             try:
323 |                 await task_processor
324 |             except asyncio.CancelledError:
325 |                 pass


--------------------------------------------------------------------------------
/services/utils/metrics.py:
--------------------------------------------------------------------------------
  1 | """
  2 | Prometheus metrics utility for AI Crypto Trader services
  3 | """
  4 | import time
  5 | import logging
  6 | from functools import wraps
  7 | from typing import Dict, Optional
  8 | from prometheus_client import Counter, Histogram, Gauge, CollectorRegistry, start_http_server, generate_latest
  9 | import asyncio
 10 | from aiohttp import web
 11 | import os
 12 | 
 13 | logger = logging.getLogger(__name__)
 14 | 
 15 | class PrometheusMetrics:
 16 |     """Centralized Prometheus metrics for crypto trading services"""
 17 |     
 18 |     def __init__(self, service_name: str, port: Optional[int] = None):
 19 |         self.service_name = service_name
 20 |         self.port = port
 21 |         self.registry = CollectorRegistry()
 22 |         self.app = None
 23 |         self.server = None
 24 |         
 25 |         # Common metrics for all services
 26 |         self.request_counter = Counter(
 27 |             'crypto_trader_request_total',
 28 |             'Total number of requests processed by service',
 29 |             ['service', 'endpoint', 'method'],
 30 |             registry=self.registry
 31 |         )
 32 |         
 33 |         self.request_duration = Histogram(
 34 |             'crypto_trader_request_latency_seconds',
 35 |             'Request latency in seconds',
 36 |             ['service', 'endpoint', 'method'],
 37 |             registry=self.registry
 38 |         )
 39 |         
 40 |         self.error_counter = Counter(
 41 |             'crypto_trader_errors_total',
 42 |             'Total number of errors by service',
 43 |             ['service', 'error_type', 'endpoint'],
 44 |             registry=self.registry
 45 |         )
 46 |         
 47 |         self.service_health = Gauge(
 48 |             'crypto_trader_service_health',
 49 |             'Service health status (1=healthy, 0=unhealthy)',
 50 |             ['service'],
 51 |             registry=self.registry
 52 |         )
 53 |         
 54 |         # Trading-specific metrics
 55 |         self.trading_signals = Counter(
 56 |             'crypto_trader_trading_signals_total',
 57 |             'Total trading signals generated',
 58 |             ['symbol', 'action', 'strategy'],
 59 |             registry=self.registry
 60 |         )
 61 |         
 62 |         self.trades_executed = Counter(
 63 |             'crypto_trader_trades_executed_total',
 64 |             'Total trades executed',
 65 |             ['symbol', 'action', 'strategy'],
 66 |             registry=self.registry
 67 |         )
 68 |         
 69 |         self.portfolio_value = Gauge(
 70 |             'crypto_trader_portfolio_value_usd',
 71 |             'Current portfolio value in USD',
 72 |             registry=self.registry
 73 |         )
 74 |         
 75 |         self.asset_holdings = Gauge(
 76 |             'crypto_trader_asset_holdings',
 77 |             'Current asset holdings',
 78 |             ['symbol'],
 79 |             registry=self.registry
 80 |         )
 81 |         
 82 |         # AI-specific metrics
 83 |         self.ai_requests = Counter(
 84 |             'crypto_trader_ai_requests_total',
 85 |             'Total AI requests',
 86 |             ['model', 'service'],
 87 |             registry=self.registry
 88 |         )
 89 |         
 90 |         self.ai_request_duration = Histogram(
 91 |             'crypto_trader_ai_request_duration_seconds',
 92 |             'AI request duration',
 93 |             ['model', 'service'],
 94 |             registry=self.registry
 95 |         )
 96 |         
 97 |         self.ai_model_confidence = Gauge(
 98 |             'crypto_trader_ai_model_confidence',
 99 |             'AI model confidence scores',
100 |             ['symbol', 'action', 'model'],
101 |             registry=self.registry
102 |         )
103 |         
104 |         # Social metrics
105 |         self.social_sentiment = Gauge(
106 |             'crypto_trader_social_sentiment',
107 |             'Social sentiment scores',
108 |             ['symbol'],
109 |             registry=self.registry
110 |         )
111 |         
112 |         self.social_volume = Gauge(
113 |             'crypto_trader_social_volume',
114 |             'Social media volume',
115 |             ['symbol'],
116 |             registry=self.registry
117 |         )
118 |         
119 |         # Risk metrics
120 |         self.portfolio_var = Gauge(
121 |             'crypto_trader_portfolio_var',
122 |             'Portfolio Value at Risk',
123 |             registry=self.registry
124 |         )
125 |         
126 |         self.position_risk = Gauge(
127 |             'crypto_trader_position_risk',
128 |             'Individual position risk scores',
129 |             ['symbol'],
130 |             registry=self.registry
131 |         )
132 |         
133 |         # Execution metrics
134 |         self.execution_errors = Counter(
135 |             'crypto_trader_execution_errors_total',
136 |             'Trading execution errors',
137 |             ['symbol', 'error_type'],
138 |             registry=self.registry
139 |         )
140 |         
141 |         self.order_latency = Histogram(
142 |             'crypto_trader_order_latency_seconds',
143 |             'Order execution latency',
144 |             ['symbol', 'order_type'],
145 |             registry=self.registry
146 |         )
147 |         
148 |         # Market data metrics
149 |         self.market_data_updates = Counter(
150 |             'crypto_trader_market_data_updates_total',
151 |             'Market data updates received',
152 |             ['symbol', 'source'],
153 |             registry=self.registry
154 |         )
155 |         
156 |         self.price_changes = Gauge(
157 |             'crypto_trader_price_change_percent',
158 |             'Price change percentages',
159 |             ['symbol', 'timeframe'],
160 |             registry=self.registry
161 |         )
162 |         
163 |         # Performance metrics
164 |         self.win_rate = Gauge(
165 |             'crypto_trader_win_rate',
166 |             'Trading win rate',
167 |             ['symbol', 'strategy'],
168 |             registry=self.registry
169 |         )
170 |         
171 |         self.profit_loss = Gauge(
172 |             'crypto_trader_profit_loss_usd',
173 |             'Profit/Loss in USD',
174 |             ['symbol', 'strategy'],
175 |             registry=self.registry
176 |         )
177 |         
178 |         # Strategy metrics
179 |         self.strategy_performance = Gauge(
180 |             'crypto_trader_strategy_performance',
181 |             'Strategy performance scores',
182 |             ['strategy_id', 'metric'],
183 |             registry=self.registry
184 |         )
185 |         
186 |         # Initialize service health
187 |         self.service_health.labels(service=self.service_name).set(1)
188 |         
189 |     async def start_server(self, port: Optional[int] = None):
190 |         """Start the metrics HTTP server"""
191 |         if not port:
192 |             port = self.port or 9090
193 |             
194 |         try:
195 |             self.app = web.Application()
196 |             self.app.router.add_get('/metrics', self._metrics_handler)
197 |             self.app.router.add_get('/health', self._health_handler)
198 |             
199 |             runner = web.AppRunner(self.app)
200 |             await runner.setup()
201 |             site = web.TCPSite(runner, '0.0.0.0', port)
202 |             await site.start()
203 |             
204 |             logger.info(f"Metrics server started on port {port} for service {self.service_name}")
205 |             
206 |         except Exception as e:
207 |             logger.error(f"Failed to start metrics server: {e}")
208 |             
209 |     async def _metrics_handler(self, request):
210 |         """Handle metrics endpoint requests"""
211 |         try:
212 |             metrics_data = generate_latest(self.registry)
213 |             return web.Response(text=metrics_data.decode('utf-8'), content_type='text/plain')
214 |         except Exception as e:
215 |             logger.error(f"Error generating metrics: {e}")
216 |             return web.Response(text="Error generating metrics", status=500)
217 |             
218 |     async def _health_handler(self, request):
219 |         """Handle health check requests"""
220 |         return web.Response(text="OK", status=200)
221 |         
222 |     def measure_time(self, endpoint: str, method: str = "GET"):
223 |         """Decorator to measure request duration"""
224 |         def decorator(func):
225 |             @wraps(func)
226 |             async def async_wrapper(*args, **kwargs):
227 |                 start_time = time.time()
228 |                 try:
229 |                     self.request_counter.labels(
230 |                         service=self.service_name,
231 |                         endpoint=endpoint,
232 |                         method=method
233 |                     ).inc()
234 |                     
235 |                     result = await func(*args, **kwargs)
236 |                     return result
237 |                 except Exception as e:
238 |                     self.error_counter.labels(
239 |                         service=self.service_name,
240 |                         error_type=type(e).__name__,
241 |                         endpoint=endpoint
242 |                     ).inc()
243 |                     raise
244 |                 finally:
245 |                     duration = time.time() - start_time
246 |                     self.request_duration.labels(
247 |                         service=self.service_name,
248 |                         endpoint=endpoint,
249 |                         method=method
250 |                     ).observe(duration)
251 |                     
252 |             @wraps(func)
253 |             def sync_wrapper(*args, **kwargs):
254 |                 start_time = time.time()
255 |                 try:
256 |                     self.request_counter.labels(
257 |                         service=self.service_name,
258 |                         endpoint=endpoint,
259 |                         method=method
260 |                     ).inc()
261 |                     
262 |                     result = func(*args, **kwargs)
263 |                     return result
264 |                 except Exception as e:
265 |                     self.error_counter.labels(
266 |                         service=self.service_name,
267 |                         error_type=type(e).__name__,
268 |                         endpoint=endpoint
269 |                     ).inc()
270 |                     raise
271 |                 finally:
272 |                     duration = time.time() - start_time
273 |                     self.request_duration.labels(
274 |                         service=self.service_name,
275 |                         endpoint=endpoint,
276 |                         method=method
277 |                     ).observe(duration)
278 |                     
279 |             return async_wrapper if asyncio.iscoroutinefunction(func) else sync_wrapper
280 |         return decorator
281 |         
282 |     def record_trading_signal(self, symbol: str, action: str, strategy: str = "default"):
283 |         """Record a trading signal"""
284 |         self.trading_signals.labels(
285 |             symbol=symbol,
286 |             action=action,
287 |             strategy=strategy
288 |         ).inc()
289 |         
290 |     def record_trade_execution(self, symbol: str, action: str, strategy: str = "default"):
291 |         """Record a trade execution"""
292 |         self.trades_executed.labels(
293 |             symbol=symbol,
294 |             action=action,
295 |             strategy=strategy
296 |         ).inc()
297 |         
298 |     def update_portfolio_value(self, value_usd: float):
299 |         """Update portfolio value"""
300 |         self.portfolio_value.set(value_usd)
301 |         
302 |     def update_asset_holding(self, symbol: str, quantity: float):
303 |         """Update asset holding"""
304 |         self.asset_holdings.labels(symbol=symbol).set(quantity)
305 |         
306 |     def record_ai_request(self, model: str, duration: float):
307 |         """Record AI request"""
308 |         self.ai_requests.labels(model=model, service=self.service_name).inc()
309 |         self.ai_request_duration.labels(model=model, service=self.service_name).observe(duration)
310 |         
311 |     def update_ai_confidence(self, symbol: str, action: str, model: str, confidence: float):
312 |         """Update AI model confidence"""
313 |         self.ai_model_confidence.labels(
314 |             symbol=symbol,
315 |             action=action,
316 |             model=model
317 |         ).set(confidence)
318 |         
319 |     def update_social_metrics(self, symbol: str, sentiment: float, volume: float):
320 |         """Update social metrics"""
321 |         self.social_sentiment.labels(symbol=symbol).set(sentiment)
322 |         self.social_volume.labels(symbol=symbol).set(volume)
323 |         
324 |     def update_portfolio_var(self, var_value: float):
325 |         """Update portfolio VaR"""
326 |         self.portfolio_var.set(var_value)
327 |         
328 |     def update_position_risk(self, symbol: str, risk_score: float):
329 |         """Update position risk"""
330 |         self.position_risk.labels(symbol=symbol).set(risk_score)
331 |         
332 |     def record_execution_error(self, symbol: str, error_type: str):
333 |         """Record execution error"""
334 |         self.execution_errors.labels(symbol=symbol, error_type=error_type).inc()
335 |         
336 |     def record_order_latency(self, symbol: str, order_type: str, latency: float):
337 |         """Record order execution latency"""
338 |         self.order_latency.labels(symbol=symbol, order_type=order_type).observe(latency)
339 |         
340 |     def record_market_data_update(self, symbol: str, source: str = "binance"):
341 |         """Record market data update"""
342 |         self.market_data_updates.labels(symbol=symbol, source=source).inc()
343 |         
344 |     def update_price_change(self, symbol: str, timeframe: str, change_pct: float):
345 |         """Update price change percentage"""
346 |         self.price_changes.labels(symbol=symbol, timeframe=timeframe).set(change_pct)
347 |         
348 |     def update_win_rate(self, symbol: str, strategy: str, win_rate: float):
349 |         """Update win rate"""
350 |         self.win_rate.labels(symbol=symbol, strategy=strategy).set(win_rate)
351 |         
352 |     def update_profit_loss(self, symbol: str, strategy: str, pnl_usd: float):
353 |         """Update profit/loss"""
354 |         self.profit_loss.labels(symbol=symbol, strategy=strategy).set(pnl_usd)
355 |         
356 |     def update_strategy_performance(self, strategy_id: str, metric: str, value: float):
357 |         """Update strategy performance metrics"""
358 |         self.strategy_performance.labels(strategy_id=strategy_id, metric=metric).set(value)
359 |         
360 |     def set_service_health(self, healthy: bool):
361 |         """Set service health status"""
362 |         self.service_health.labels(service=self.service_name).set(1 if healthy else 0)
363 | 
364 | 
365 | # Global metrics instances for easy access
366 | _metrics_instances: Dict[str, PrometheusMetrics] = {}
367 | 
368 | def get_metrics(service_name: str, port: Optional[int] = None) -> PrometheusMetrics:
369 |     """Get or create metrics instance for a service"""
370 |     if service_name not in _metrics_instances:
371 |         _metrics_instances[service_name] = PrometheusMetrics(service_name, port)
372 |     return _metrics_instances[service_name]
373 | 
374 | def is_metrics_enabled() -> bool:
375 |     """Check if metrics are enabled via environment variable"""
376 |     return os.getenv('ENABLE_METRICS', 'false').lower() in ('true', '1', 'yes', 'on')
377 | 


--------------------------------------------------------------------------------
/services/utils/monitoring.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import time
  3 | import json
  4 | import logging
  5 | import threading
  6 | from datetime import datetime
  7 | from functools import wraps
  8 | from logging.handlers import RotatingFileHandler
  9 | from typing import Dict, Any, Optional, List, Callable, Union
 10 | 
 11 | # Prometheus metrics
 12 | from prometheus_client import Counter, Gauge, Histogram, Summary, start_http_server
 13 | 
 14 | # Structured logging
 15 | import structlog
 16 | from pythonjsonlogger import jsonlogger
 17 | 
 18 | # Constants
 19 | DEFAULT_METRICS_PORT = 8000
 20 | METRICS_NAMESPACE = "crypto_trader"
 21 | 
 22 | # Globals for metrics
 23 | enabled_metrics = os.environ.get("ENABLE_METRICS", "false").lower() == "true"
 24 | metrics = {}
 25 | metrics_port = None
 26 | metrics_started = False
 27 | 
 28 | # Setup structured logging
 29 | def setup_logging(service_name: str, log_level: str = "INFO") -> logging.Logger:
 30 |     """
 31 |     Configure structured JSON logging for the service
 32 |     
 33 |     Args:
 34 |         service_name: Name of the service for log context
 35 |         log_level: Logging level (DEBUG, INFO, WARNING, ERROR, CRITICAL)
 36 |         
 37 |     Returns:
 38 |         Configured logger instance
 39 |     """
 40 |     log_level_num = getattr(logging, log_level.upper(), logging.INFO)
 41 |     
 42 |     # Ensure logs directory exists
 43 |     logs_dir = os.path.join(os.getcwd(), "logs")
 44 |     os.makedirs(logs_dir, exist_ok=True)
 45 |     
 46 |     # Create standard file handler with rotation
 47 |     log_file = os.path.join(logs_dir, f"{service_name.lower()}.log")
 48 |     file_handler = RotatingFileHandler(
 49 |         log_file, maxBytes=10*1024*1024, backupCount=5, encoding="utf-8"
 50 |     )
 51 |     
 52 |     # Create JSON formatter
 53 |     class CustomJsonFormatter(jsonlogger.JsonFormatter):
 54 |         def add_fields(self, log_record, record, message_dict):
 55 |             super(CustomJsonFormatter, self).add_fields(log_record, record, message_dict)
 56 |             log_record["service"] = service_name
 57 |             log_record["timestamp"] = datetime.utcnow().isoformat() + "Z"
 58 |             log_record["level"] = record.levelname
 59 |             log_record["thread"] = threading.current_thread().name
 60 | 
 61 |     formatter = CustomJsonFormatter("%(timestamp)s %(level)s %(service)s %(name)s %(message)s")
 62 |     file_handler.setFormatter(formatter)
 63 |     
 64 |     # Configure structlog
 65 |     structlog.configure(
 66 |         processors=[
 67 |             structlog.stdlib.filter_by_level,
 68 |             structlog.stdlib.add_logger_name,
 69 |             structlog.stdlib.add_log_level,
 70 |             structlog.stdlib.PositionalArgumentsFormatter(),
 71 |             structlog.processors.TimeStamper(fmt="iso"),
 72 |             structlog.processors.StackInfoRenderer(),
 73 |             structlog.processors.format_exc_info,
 74 |             structlog.processors.UnicodeDecoder(),
 75 |             structlog.processors.JSONRenderer(),
 76 |         ],
 77 |         context_class=dict,
 78 |         logger_factory=structlog.stdlib.LoggerFactory(),
 79 |         wrapper_class=structlog.stdlib.BoundLogger,
 80 |         cache_logger_on_first_use=True,
 81 |     )
 82 |     
 83 |     # Setup root logger
 84 |     root_logger = logging.getLogger()
 85 |     root_logger.setLevel(log_level_num)
 86 |     
 87 |     # Add console handler for local development
 88 |     console_handler = logging.StreamHandler()
 89 |     console_handler.setFormatter(formatter)
 90 |     root_logger.addHandler(console_handler)
 91 |     root_logger.addHandler(file_handler)
 92 |     
 93 |     # Create service-specific logger
 94 |     logger = structlog.get_logger(service_name)
 95 |     
 96 |     return logger
 97 | 
 98 | # Metrics functions
 99 | def start_metrics_server(port: Optional[int] = None) -> None:
100 |     """
101 |     Start the Prometheus metrics HTTP server on the specified port
102 |     
103 |     Args:
104 |         port: Port to run the metrics server on (default based on service port)
105 |     """
106 |     global metrics_started, metrics_port
107 |     
108 |     if not enabled_metrics:
109 |         return
110 |         
111 |     if metrics_started:
112 |         return
113 |     
114 |     if port is None:
115 |         # Default to service port + 1000 if not specified
116 |         service_port = int(os.environ.get("SERVICE_PORT", DEFAULT_METRICS_PORT))
117 |         port = service_port
118 |     
119 |     metrics_port = port
120 |     start_http_server(port)
121 |     metrics_started = True
122 | 
123 | def create_counter(name: str, description: str, labels: Optional[List[str]] = None) -> Counter:
124 |     """
125 |     Create a Prometheus counter metric
126 |     
127 |     Args:
128 |         name: Metric name
129 |         description: Metric description 
130 |         labels: List of label names for this metric
131 |         
132 |     Returns:
133 |         Prometheus Counter instance
134 |     """
135 |     if not enabled_metrics:
136 |         return DummyMetric()
137 |         
138 |     key = f"counter_{name}"
139 |     if key not in metrics:
140 |         metrics[key] = Counter(
141 |             f"{METRICS_NAMESPACE}_{name}",
142 |             description,
143 |             labels or []
144 |         )
145 |     return metrics[key]
146 | 
147 | def create_gauge(name: str, description: str, labels: Optional[List[str]] = None) -> Gauge:
148 |     """
149 |     Create a Prometheus gauge metric
150 |     
151 |     Args:
152 |         name: Metric name
153 |         description: Metric description 
154 |         labels: List of label names for this metric
155 |         
156 |     Returns:
157 |         Prometheus Gauge instance
158 |     """
159 |     if not enabled_metrics:
160 |         return DummyMetric()
161 |         
162 |     key = f"gauge_{name}"
163 |     if key not in metrics:
164 |         metrics[key] = Gauge(
165 |             f"{METRICS_NAMESPACE}_{name}",
166 |             description,
167 |             labels or []
168 |         )
169 |     return metrics[key]
170 | 
171 | def create_histogram(name: str, description: str, labels: Optional[List[str]] = None, 
172 |                   buckets: Optional[List[float]] = None) -> Histogram:
173 |     """
174 |     Create a Prometheus histogram metric
175 |     
176 |     Args:
177 |         name: Metric name
178 |         description: Metric description 
179 |         labels: List of label names for this metric
180 |         buckets: Custom buckets for the histogram
181 |         
182 |     Returns:
183 |         Prometheus Histogram instance
184 |     """
185 |     if not enabled_metrics:
186 |         return DummyMetric()
187 |         
188 |     key = f"histogram_{name}"
189 |     if key not in metrics:
190 |         metrics[key] = Histogram(
191 |             f"{METRICS_NAMESPACE}_{name}",
192 |             description,
193 |             labels or [],
194 |             buckets=buckets
195 |         )
196 |     return metrics[key]
197 | 
198 | def create_summary(name: str, description: str, labels: Optional[List[str]] = None) -> Summary:
199 |     """
200 |     Create a Prometheus summary metric
201 |     
202 |     Args:
203 |         name: Metric name
204 |         description: Metric description 
205 |         labels: List of label names for this metric
206 |         
207 |     Returns:
208 |         Prometheus Summary instance
209 |     """
210 |     if not enabled_metrics:
211 |         return DummyMetric()
212 |         
213 |     key = f"summary_{name}"
214 |     if key not in metrics:
215 |         metrics[key] = Summary(
216 |             f"{METRICS_NAMESPACE}_{name}",
217 |             description,
218 |             labels or []
219 |         )
220 |     return metrics[key]
221 | 
222 | # Dummy metric class for when metrics are disabled
223 | class DummyMetric:
224 |     """Dummy metric class that implements no-op methods for all metric types"""
225 |     def inc(self, amount=1):
226 |         pass
227 |         
228 |     def dec(self, amount=1):
229 |         pass
230 |         
231 |     def set(self, value):
232 |         pass
233 |         
234 |     def observe(self, value):
235 |         pass
236 |         
237 |     def time(self):
238 |         return DummyTimer()
239 |         
240 |     def labels(self, *args, **kwargs):
241 |         return self
242 | 
243 | class DummyTimer:
244 |     """Dummy timer context manager"""
245 |     def __enter__(self):
246 |         pass
247 |         
248 |     def __exit__(self, exc_type, exc_val, exc_tb):
249 |         pass
250 | 
251 | # Decorator for timing functions and capturing errors
252 | def timed(metric_name=None, description=None, labels=None):
253 |     """
254 |     Decorator that times function execution and records it in a histogram
255 |     Also tracks successes and failures as counters
256 |     
257 |     Args:
258 |         metric_name: Name for the metric (defaults to function name)
259 |         description: Description for the metric
260 |         labels: Labels to apply to the metric
261 |     """
262 |     def decorator(func):
263 |         @wraps(func)
264 |         def wrapper(*args, **kwargs):
265 |             name = metric_name or func.__name__
266 |             desc = description or f"Time spent in {name}"
267 |             
268 |             if enabled_metrics:
269 |                 timer = create_histogram(
270 |                     f"{name}_duration_seconds",
271 |                     desc,
272 |                     labels
273 |                 )
274 |                 error_counter = create_counter(
275 |                     f"{name}_errors_total",
276 |                     f"Errors in {name}",
277 |                     labels
278 |                 )
279 |                 success_counter = create_counter(
280 |                     f"{name}_success_total",
281 |                     f"Successful calls to {name}",
282 |                     labels
283 |                 )
284 |             
285 |             start_time = time.time()
286 |             try:
287 |                 result = func(*args, **kwargs)
288 |                 if enabled_metrics:
289 |                     success_counter.inc()
290 |                 return result
291 |             except Exception as e:
292 |                 if enabled_metrics:
293 |                     error_counter.inc()
294 |                 raise
295 |             finally:
296 |                 if enabled_metrics:
297 |                     duration = time.time() - start_time
298 |                     timer.observe(duration)
299 |                 
300 |         return wrapper
301 |     return decorator
302 | 
303 | # Common metrics for all services
304 | request_latency = create_histogram(
305 |     "request_latency_seconds", 
306 |     "Request latency in seconds",
307 |     ["service", "endpoint"]
308 | )
309 | 
310 | request_count = create_counter(
311 |     "request_total",
312 |     "Total number of requests",
313 |     ["service", "endpoint", "status"]
314 | )
315 | 
316 | active_connections = create_gauge(
317 |     "active_connections",
318 |     "Number of active connections",
319 |     ["service"]
320 | )
321 | 
322 | error_count = create_counter(
323 |     "errors_total",
324 |     "Total number of errors",
325 |     ["service", "type"]
326 | )
327 | 
328 | # Initialize global metrics for each service type
329 | def init_service_metrics(service_name):
330 |     """Initialize service-specific metrics"""
331 |     if not enabled_metrics:
332 |         return
333 |         
334 |     if service_name == "market_monitor":
335 |         # Market monitor specific metrics
336 |         create_gauge(
337 |             "market_data_age_seconds",
338 |             "Age of latest market data in seconds",
339 |             ["symbol", "timeframe"]
340 |         )
341 |         create_counter(
342 |             "market_updates_total",
343 |             "Total number of market updates processed",
344 |             ["symbol", "timeframe"]
345 |         )
346 |         create_gauge(
347 |             "technical_indicator_value",
348 |             "Current value of technical indicators",
349 |             ["symbol", "indicator", "timeframe"]
350 |         )
351 |         
352 |     elif service_name == "social_monitor":
353 |         # Social monitor specific metrics
354 |         create_gauge(
355 |             "social_sentiment",
356 |             "Social sentiment score",
357 |             ["symbol"]
358 |         )
359 |         create_gauge(
360 |             "social_volume",
361 |             "Social volume",
362 |             ["symbol"]
363 |         )
364 |         create_gauge(
365 |             "social_contributors",
366 |             "Number of social contributors",
367 |             ["symbol"]
368 |         )
369 |         create_counter(
370 |             "social_updates_total",
371 |             "Total number of social updates processed",
372 |             ["symbol"]
373 |         )
374 |         
375 |     elif service_name == "ai_analyzer":
376 |         # AI analyzer specific metrics
377 |         create_counter(
378 |             "ai_requests_total",
379 |             "Total number of AI API requests",
380 |             ["model"]
381 |         )
382 |         create_histogram(
383 |             "ai_request_duration_seconds",
384 |             "Duration of AI API requests",
385 |             ["model"]
386 |         )
387 |         create_counter(
388 |             "trading_signals_total",
389 |             "Total number of trading signals generated",
390 |             ["symbol", "action", "confidence_level"]
391 |         )
392 |         create_gauge(
393 |             "ai_model_confidence",
394 |             "Confidence level of AI model predictions",
395 |             ["symbol", "action"]
396 |         )
397 |         
398 |     elif service_name == "trade_executor":
399 |         # Trade executor specific metrics
400 |         create_counter(
401 |             "trades_executed_total",
402 |             "Total number of trades executed",
403 |             ["symbol", "action"]
404 |         )
405 |         create_gauge(
406 |             "portfolio_value_usd",
407 |             "Total portfolio value in USD",
408 |         )
409 |         create_gauge(
410 |             "asset_holdings",
411 |             "Current holdings of assets",
412 |             ["symbol"]
413 |         )
414 |         create_counter(
415 |             "execution_errors_total",
416 |             "Total number of execution errors",
417 |             ["symbol", "error_type"]
418 |         )
419 |         create_histogram(
420 |             "execution_latency_seconds",
421 |             "Trade execution latency",
422 |             ["symbol", "action"]
423 |         )
424 |         
425 |     elif service_name == "strategy_evolution":
426 |         # Strategy evolution specific metrics
427 |         create_counter(
428 |             "strategies_generated_total",
429 |             "Total number of strategies generated",
430 |             ["status"]
431 |         )
432 |         create_gauge(
433 |             "strategy_performance",
434 |             "Performance metrics for strategies",
435 |             ["strategy_id", "metric"]
436 |         )
437 |         create_counter(
438 |             "strategy_mutations_total",
439 |             "Total number of strategy mutations",
440 |             ["result"]
441 |         )
442 |         create_histogram(
443 |             "strategy_backtest_duration_seconds",
444 |             "Duration of strategy backtests",
445 |             ["strategy_id"]
446 |         )
447 |     
448 |     elif service_name == "dashboard":
449 |         # Dashboard specific metrics
450 |         create_counter(
451 |             "dashboard_views_total",
452 |             "Total number of dashboard views",
453 |             ["endpoint"]
454 |         )
455 |         create_gauge(
456 |             "active_users",
457 |             "Number of active dashboard users",
458 |         )
459 |         create_histogram(
460 |             "dashboard_render_time_seconds",
461 |             "Time to render dashboard components",
462 |             ["component"]
463 |         )


--------------------------------------------------------------------------------
/services/social_monitor_service.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import json
  3 | import socket
  4 | import asyncio
  5 | import aiohttp
  6 | from datetime import datetime, timedelta
  7 | import logging as logger
  8 | from logging.handlers import RotatingFileHandler
  9 | from redis.asyncio import Redis
 10 | from redis.exceptions import ConnectionError
 11 | from typing import Dict, List, Optional
 12 | 
 13 | # Create logs directory if it doesn't exist
 14 | os.makedirs('logs', exist_ok=True)
 15 | 
 16 | # Configure rotating file handler
 17 | rotating_handler = RotatingFileHandler(
 18 |     'logs/social_monitor.log',
 19 |     maxBytes=10*1024*1024,  # 10MB per file
 20 |     backupCount=5,  # Keep 5 backup files
 21 |     encoding='utf-8'
 22 | )
 23 | 
 24 | # Configure logging with rotation
 25 | logger.basicConfig(
 26 |     level=logger.DEBUG,
 27 |     format='%(asctime)s - %(levelname)s - [SocialMonitor] %(message)s',
 28 |     handlers=[
 29 |         rotating_handler,
 30 |         logger.StreamHandler()
 31 |     ]
 32 | )
 33 | 
 34 | class SocialMonitorService:
 35 |     def __init__(self):
 36 |         logger.debug("Initializing Social Monitor Service...")
 37 |         
 38 |         # Load configuration
 39 |         with open('config.json', 'r') as f:
 40 |             self.config = json.load(f)
 41 |         
 42 |         # LunarCrush configuration
 43 |         self.api_key = os.getenv('LUNARCRUSH_API_KEY', self.config['lunarcrush']['api_key'])
 44 |         if not self.api_key:
 45 |             raise ValueError("LUNARCRUSH_API_KEY environment variable or config value not set")
 46 |         
 47 |         self.base_url = self.config['lunarcrush']['base_url']
 48 |         self.endpoints = self.config['lunarcrush']['endpoints']
 49 |         self.update_interval = self.config['lunarcrush']['update_interval']
 50 |         self.required_metrics = self.config['lunarcrush']['metrics']['required']
 51 |         self.sentiment_weights = self.config['lunarcrush']['sentiment_weights']
 52 |         self.cache_duration = self.config['lunarcrush']['cache_duration']
 53 |         self.max_news_age = self.config['lunarcrush']['max_news_age']
 54 |         self.min_engagement = self.config['lunarcrush']['min_engagement']
 55 |         
 56 |         # Redis configuration
 57 |         self.redis_host = os.getenv('REDIS_HOST', 'redis')
 58 |         self.redis_port = int(os.getenv('REDIS_PORT', 6379))
 59 |         self.redis = None
 60 |         
 61 |         # Service state
 62 |         self.running = True
 63 |         self.monitored_symbols = set()
 64 |         self.cache = {}
 65 |         self.last_update = {}
 66 |         
 67 |         # Get service port from environment variable
 68 |         self.service_port = int(os.getenv('SOCIAL_MONITOR_PORT', 8004))
 69 |         logger.debug(f"Service port configured as: {self.service_port}")
 70 |         logger.debug("Social Monitor Service initialization complete")
 71 | 
 72 |     async def connect_redis(self, max_retries=5, retry_delay=5):
 73 |         """Establish Redis connection with retries"""
 74 |         retries = 0
 75 |         while retries < max_retries:
 76 |             try:
 77 |                 if self.redis is None:
 78 |                     self.redis = Redis(
 79 |                         host=self.redis_host,
 80 |                         port=self.redis_port,
 81 |                         decode_responses=True
 82 |                     )
 83 |                 await self.redis.ping()
 84 |                 logger.info("Successfully connected to Redis")
 85 |                 return True
 86 |             except (ConnectionError, Exception) as e:
 87 |                 retries += 1
 88 |                 logger.error(f"Failed to connect to Redis (attempt {retries}/{max_retries}): {str(e)}")
 89 |                 if retries < max_retries:
 90 |                     await asyncio.sleep(retry_delay)
 91 |                 else:
 92 |                     logger.error("Max retries reached. Could not connect to Redis.")
 93 |                     return False
 94 | 
 95 |     async def fetch_social_metrics(self, symbol: str) -> Optional[Dict]:
 96 |         """Fetch social metrics from LunarCrush API"""
 97 |         try:
 98 |             # Check cache first
 99 |             if symbol in self.cache:
100 |                 cache_time = self.last_update.get(symbol, datetime.min)
101 |                 if (datetime.now() - cache_time).total_seconds() < self.cache_duration:
102 |                     return self.cache[symbol]
103 |             
104 |             # Prepare API request
105 |             headers = {
106 |                 'Authorization': f'Bearer {self.api_key}',
107 |                 'Accept': 'application/json'
108 |             }
109 |             
110 |             params = {
111 |                 'symbol': symbol,
112 |                 'interval': '1h',  # Get hourly data
113 |                 'limit': 1  # Get most recent data point
114 |             }
115 |             
116 |             url = f"{self.base_url}{self.endpoints['assets']}"
117 |             
118 |             async with aiohttp.ClientSession() as session:
119 |                 async with session.get(url, headers=headers, params=params) as response:
120 |                     if response.status == 200:
121 |                         data = await response.json()
122 |                         if 'data' in data and data['data']:
123 |                             asset_data = data['data'][0]
124 |                             
125 |                             # Extract required metrics
126 |                             metrics = {
127 |                                 'social_volume': asset_data.get('social_volume', 0),
128 |                                 'social_engagement': asset_data.get('social_engagement', 0),
129 |                                 'social_contributors': asset_data.get('social_contributors', 0),
130 |                                 'social_sentiment': asset_data.get('social_sentiment', 0),
131 |                                 'twitter_volume': asset_data.get('twitter_volume', 0),
132 |                                 'reddit_volume': asset_data.get('reddit_volume', 0),
133 |                                 'news_volume': asset_data.get('news_volume', 0)
134 |                             }
135 |                             
136 |                             # Calculate weighted sentiment
137 |                             weighted_sentiment = sum(
138 |                                 metrics[metric] * weight
139 |                                 for metric, weight in self.sentiment_weights.items()
140 |                                 if metric in metrics
141 |                             )
142 |                             
143 |                             # Fetch recent news
144 |                             news_url = f"{self.base_url}{self.endpoints['feeds']}"
145 |                             news_params = {
146 |                                 'symbol': symbol,
147 |                                 'limit': 5,
148 |                                 'sources': 'news'
149 |                             }
150 |                             
151 |                             async with session.get(news_url, headers=headers, params=news_params) as news_response:
152 |                                 if news_response.status == 200:
153 |                                     news_data = await news_response.json()
154 |                                     recent_news = []
155 |                                     
156 |                                     if 'data' in news_data:
157 |                                         for news_item in news_data['data']:
158 |                                             # Check if news is within max age
159 |                                             news_time = datetime.fromtimestamp(news_item['time'])
160 |                                             if (datetime.now() - news_time).total_seconds() <= self.max_news_age:
161 |                                                 recent_news.append({
162 |                                                     'title': news_item['title'],
163 |                                                     'sentiment': news_item.get('sentiment', 0),
164 |                                                     'engagement': news_item.get('engagement', 0)
165 |                                                 })
166 |                             
167 |                             # Prepare social data
168 |                             social_data = {
169 |                                 'metrics': metrics,
170 |                                 'weighted_sentiment': weighted_sentiment,
171 |                                 'recent_news': recent_news,
172 |                                 'timestamp': datetime.now().isoformat()
173 |                             }
174 |                             
175 |                             # Update cache
176 |                             self.cache[symbol] = social_data
177 |                             self.last_update[symbol] = datetime.now()
178 |                             
179 |                             return social_data
180 |                     
181 |                     logger.error(f"Failed to fetch social metrics for {symbol}: {response.status}")
182 |                     return None
183 |                     
184 |         except Exception as e:
185 |             logger.error(f"Error fetching social metrics for {symbol}: {str(e)}")
186 |             return None
187 | 
188 |     async def process_market_updates(self):
189 |         """Process market updates and maintain monitored symbols"""
190 |         while self.running:
191 |             try:
192 |                 if not self.redis or not await self.redis.ping():
193 |                     if not await self.connect_redis():
194 |                         await asyncio.sleep(5)
195 |                         continue
196 |                 
197 |                 # Subscribe to market updates to track active symbols
198 |                 pubsub = self.redis.pubsub()
199 |                 await pubsub.subscribe('market_updates')
200 |                 
201 |                 while self.running:
202 |                     message = await pubsub.get_message(ignore_subscribe_messages=True, timeout=1.0)
203 |                     if message:
204 |                         try:
205 |                             market_update = json.loads(message['data'])
206 |                             symbol = market_update['symbol']
207 |                             self.monitored_symbols.add(symbol)
208 |                         except Exception as e:
209 |                             logger.error(f"Error processing market update: {str(e)}")
210 |                     
211 |                     await asyncio.sleep(0.1)
212 |                 
213 |             except Exception as e:
214 |                 logger.error(f"Error in process_market_updates: {str(e)}")
215 |                 await asyncio.sleep(5)
216 | 
217 |     async def update_social_data(self):
218 |         """Update social data for monitored symbols"""
219 |         while self.running:
220 |             try:
221 |                 if not self.redis or not await self.redis.ping():
222 |                     if not await self.connect_redis():
223 |                         await asyncio.sleep(5)
224 |                         continue
225 |                 
226 |                 for symbol in self.monitored_symbols:
227 |                     try:
228 |                         # Check if update is needed
229 |                         last_update = self.last_update.get(symbol, datetime.min)
230 |                         if (datetime.now() - last_update).total_seconds() >= self.update_interval:
231 |                             social_data = await self.fetch_social_metrics(symbol)
232 |                             
233 |                             if social_data:
234 |                                 # Publish social update
235 |                                 await self.redis.publish(
236 |                                     'social_updates',
237 |                                     json.dumps({
238 |                                         'symbol': symbol,
239 |                                         'data': social_data
240 |                                     })
241 |                                 )
242 |                                 
243 |                                 # Store latest data
244 |                                 await self.redis.hset(
245 |                                     'social_metrics',
246 |                                     symbol,
247 |                                     json.dumps(social_data)
248 |                                 )
249 |                                 
250 |                                 logger.info(f"Updated social metrics for {symbol}")
251 |                                 logger.debug(f"Social data: {json.dumps(social_data, indent=2)}")
252 |                     
253 |                     except Exception as e:
254 |                         logger.error(f"Error updating social data for {symbol}: {str(e)}")
255 |                 
256 |                 await asyncio.sleep(1)
257 |                 
258 |             except Exception as e:
259 |                 logger.error(f"Error in update_social_data: {str(e)}")
260 |                 await asyncio.sleep(5)
261 | 
262 |     async def maintain_redis(self):
263 |         """Maintain Redis connection"""
264 |         while self.running:
265 |             try:
266 |                 if self.redis:
267 |                     await self.redis.ping()
268 |                 else:
269 |                     await self.connect_redis()
270 |                 await asyncio.sleep(1)
271 |             except Exception as e:
272 |                 logger.error(f"Redis connection error: {str(e)}")
273 |                 self.redis = None
274 |                 await asyncio.sleep(5)
275 | 
276 |     async def health_check_server(self):
277 |         """Run a simple TCP server for health checks"""
278 |         server = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
279 |         server.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
280 |         
281 |         try:
282 |             server.bind(('0.0.0.0', self.service_port))
283 |             server.listen(1)
284 |             server.setblocking(False)
285 |             
286 |             logger.info(f"Health check server listening on port {self.service_port}")
287 |             
288 |             while self.running:
289 |                 try:
290 |                     await asyncio.sleep(1)
291 |                 except Exception as e:
292 |                     logger.error(f"Health check server error: {str(e)}")
293 |         except Exception as e:
294 |             logger.error(f"Failed to start health check server: {str(e)}")
295 |         finally:
296 |             server.close()
297 | 
298 |     async def run(self):
299 |         """Run the social monitor service"""
300 |         try:
301 |             logger.info("Starting Social Monitor Service...")
302 |             
303 |             # First establish Redis connection
304 |             if not await self.connect_redis():
305 |                 raise Exception("Failed to establish initial Redis connection")
306 |             
307 |             # Create tasks
308 |             tasks = [
309 |                 asyncio.create_task(self.process_market_updates()),
310 |                 asyncio.create_task(self.update_social_data()),
311 |                 asyncio.create_task(self.maintain_redis()),
312 |                 asyncio.create_task(self.health_check_server())
313 |             ]
314 |             
315 |             # Wait for tasks to complete
316 |             await asyncio.gather(*tasks)
317 |             
318 |         except Exception as e:
319 |             logger.error(f"Error in Social Monitor Service: {str(e)}")
320 |         finally:
321 |             await self.stop()
322 | 
323 |     async def stop(self):
324 |         """Stop the social monitor service"""
325 |         logger.info("Stopping Social Monitor Service...")
326 |         self.running = False
327 |         if self.redis:
328 |             await self.redis.close()
329 | 
330 | if __name__ == "__main__":
331 |     service = SocialMonitorService()
332 |     try:
333 |         asyncio.run(service.run())
334 |     except KeyboardInterrupt:
335 |         asyncio.run(service.stop())
336 |     except Exception as e:
337 |         logger.error(f"Critical error: {str(e)}")
338 |         asyncio.run(service.stop())
339 | 


--------------------------------------------------------------------------------
/services/genetic_algorithm.py:
--------------------------------------------------------------------------------
  1 | """
  2 | Genetic Algorithm for Trading Strategy Optimization
  3 | 
  4 | This module implements a genetic algorithm framework for optimizing trading strategies.
  5 | It evolves a population of strategy parameter sets, using mutation, crossover,
  6 | and selection operations to improve trading performance over generations.
  7 | """
  8 | 
  9 | import os
 10 | import json
 11 | import random
 12 | import logging
 13 | import numpy as np
 14 | from typing import Dict, List, Tuple, Callable, Any, Optional
 15 | from datetime import datetime
 16 | from copy import deepcopy
 17 | 
 18 | # Configure logging
 19 | logger = logging.getLogger("genetic_algorithm")
 20 | logger.setLevel(logging.INFO)
 21 | if not logger.handlers:
 22 |     handler = logging.FileHandler('logs/genetic_algorithm.log')
 23 |     formatter = logging.Formatter('%(asctime)s - %(levelname)s - [GeneticAlgorithm] %(message)s')
 24 |     handler.setFormatter(formatter)
 25 |     logger.addHandler(handler)
 26 | 
 27 | class GeneticAlgorithm:
 28 |     """
 29 |     A genetic algorithm implementation for optimizing trading strategies.
 30 |     """
 31 |     
 32 |     def __init__(self, param_ranges: Dict[str, Tuple], 
 33 |                  fitness_function: Callable, 
 34 |                  population_size: int = 20,
 35 |                  generations: int = 10,
 36 |                  mutation_rate: float = 0.2,
 37 |                  crossover_rate: float = 0.8,
 38 |                  elitism_pct: float = 0.1,
 39 |                  tournament_size: int = 3,
 40 |                  random_seed: Optional[int] = None):
 41 |         """
 42 |         Initialize the genetic algorithm.
 43 |         
 44 |         Args:
 45 |             param_ranges: Dictionary of parameter names to (min, max) tuples
 46 |             fitness_function: Function that evaluates a parameter set and returns a fitness score
 47 |             population_size: Number of individuals in the population
 48 |             generations: Number of generations to evolve
 49 |             mutation_rate: Probability of mutation for each parameter
 50 |             crossover_rate: Probability of crossover between individuals
 51 |             elitism_pct: Percentage of top individuals to preserve unchanged
 52 |             tournament_size: Number of individuals in tournament selection
 53 |             random_seed: Seed for random number generator
 54 |         """
 55 |         self.param_ranges = param_ranges
 56 |         self.fitness_function = fitness_function
 57 |         self.population_size = population_size
 58 |         self.generations = generations
 59 |         self.mutation_rate = mutation_rate
 60 |         self.crossover_rate = crossover_rate
 61 |         self.elitism_pct = elitism_pct
 62 |         self.tournament_size = tournament_size
 63 |         
 64 |         # Set random seed for reproducibility if provided
 65 |         if random_seed is not None:
 66 |             random.seed(random_seed)
 67 |             np.random.seed(random_seed)
 68 |         
 69 |         self.population = []
 70 |         self.fitness_scores = []
 71 |         self.best_individual = None
 72 |         self.best_fitness = -float('inf')
 73 |         self.generation_history = []
 74 |         
 75 |         logger.info(f"Genetic Algorithm initialized with:")
 76 |         logger.info(f"- Population size: {population_size}")
 77 |         logger.info(f"- Generations: {generations}")
 78 |         logger.info(f"- Mutation rate: {mutation_rate}")
 79 |         logger.info(f"- Crossover rate: {crossover_rate}")
 80 |         logger.info(f"- Elitism percentage: {elitism_pct}")
 81 |         logger.info(f"- Parameters: {list(param_ranges.keys())}")
 82 |     
 83 |     def initialize_population(self, seeded_individuals: List[Dict] = None) -> None:
 84 |         """
 85 |         Initialize the population with random individuals and optionally include seeded individuals.
 86 |         
 87 |         Args:
 88 |             seeded_individuals: List of predefined parameter sets to include in the initial population
 89 |         """
 90 |         self.population = []
 91 |         
 92 |         # Add seeded individuals if provided
 93 |         if seeded_individuals:
 94 |             for individual in seeded_individuals:
 95 |                 # Ensure all parameters are within bounds
 96 |                 bounded_individual = {}
 97 |                 for param, value in individual.items():
 98 |                     if param in self.param_ranges:
 99 |                         min_val, max_val = self.param_ranges[param]
100 |                         bounded_individual[param] = max(min_val, min(max_val, value))
101 |                     else:
102 |                         bounded_individual[param] = value
103 |                 self.population.append(bounded_individual)
104 |         
105 |         # Generate random individuals for the rest of the population
106 |         remaining = self.population_size - len(self.population)
107 |         for _ in range(remaining):
108 |             individual = {}
109 |             for param, (min_val, max_val) in self.param_ranges.items():
110 |                 if isinstance(min_val, int) and isinstance(max_val, int):
111 |                     individual[param] = random.randint(min_val, max_val)
112 |                 else:
113 |                     individual[param] = random.uniform(min_val, max_val)
114 |             self.population.append(individual)
115 |         
116 |         logger.info(f"Population initialized with {len(self.population)} individuals")
117 |         logger.info(f"Seeded individuals: {len(seeded_individuals) if seeded_individuals else 0}")
118 |     
119 |     def evaluate_population(self) -> None:
120 |         """
121 |         Evaluate the fitness of all individuals in the population.
122 |         """
123 |         self.fitness_scores = []
124 |         for individual in self.population:
125 |             fitness = self.fitness_function(individual)
126 |             self.fitness_scores.append(fitness)
127 |             
128 |             # Track best individual
129 |             if fitness > self.best_fitness:
130 |                 self.best_fitness = fitness
131 |                 self.best_individual = deepcopy(individual)
132 |         
133 |         logger.info(f"Population evaluated. Best fitness: {self.best_fitness}")
134 |     
135 |     def selection(self) -> List[Dict]:
136 |         """
137 |         Select individuals for reproduction using tournament selection.
138 |         
139 |         Returns:
140 |             List of selected individuals
141 |         """
142 |         selected = []
143 |         
144 |         # Elitism: Preserve top individuals
145 |         elites_count = max(1, int(self.elitism_pct * self.population_size))
146 |         indices = sorted(range(len(self.fitness_scores)), 
147 |                          key=lambda i: self.fitness_scores[i], 
148 |                          reverse=True)
149 |         
150 |         for i in range(elites_count):
151 |             selected.append(deepcopy(self.population[indices[i]]))
152 |         
153 |         # Tournament selection for the rest
154 |         while len(selected) < self.population_size:
155 |             tournament_indices = random.sample(range(len(self.population)), 
156 |                                              self.tournament_size)
157 |             tournament_fitness = [self.fitness_scores[i] for i in tournament_indices]
158 |             winner_idx = tournament_indices[tournament_fitness.index(max(tournament_fitness))]
159 |             selected.append(deepcopy(self.population[winner_idx]))
160 |         
161 |         return selected
162 |     
163 |     def crossover(self, parent1: Dict, parent2: Dict) -> Tuple[Dict, Dict]:
164 |         """
165 |         Perform crossover between two parents to create two children.
166 |         
167 |         Args:
168 |             parent1: First parent individual
169 |             parent2: Second parent individual
170 |             
171 |         Returns:
172 |             Tuple of two child individuals
173 |         """
174 |         if random.random() > self.crossover_rate:
175 |             return deepcopy(parent1), deepcopy(parent2)
176 |         
177 |         child1 = {}
178 |         child2 = {}
179 |         
180 |         # Choose random crossover points for each parameter
181 |         for param in self.param_ranges:
182 |             if random.random() < 0.5:
183 |                 child1[param] = parent1[param]
184 |                 child2[param] = parent2[param]
185 |             else:
186 |                 child1[param] = parent2[param]
187 |                 child2[param] = parent1[param]
188 |         
189 |         return child1, child2
190 |     
191 |     def mutation(self, individual: Dict) -> Dict:
192 |         """
193 |         Mutate an individual by randomly changing parameters.
194 |         
195 |         Args:
196 |             individual: The individual to mutate
197 |             
198 |         Returns:
199 |             Mutated individual
200 |         """
201 |         mutated = deepcopy(individual)
202 |         
203 |         for param, (min_val, max_val) in self.param_ranges.items():
204 |             if random.random() < self.mutation_rate:
205 |                 # Apply different mutation strategies based on parameter type
206 |                 if isinstance(min_val, int) and isinstance(max_val, int):
207 |                     # Integer parameter: adjust by small discrete steps
208 |                     step = max(1, int((max_val - min_val) * 0.1))  # 10% of range
209 |                     delta = random.choice([-step, step])
210 |                     mutated[param] = max(min_val, min(max_val, mutated[param] + delta))
211 |                 else:
212 |                     # Float parameter: adjust by percentage or small random change
213 |                     if random.random() < 0.5:
214 |                         # Percentage adjustment (±20%)
215 |                         factor = random.uniform(0.8, 1.2)
216 |                         mutated[param] = max(min_val, min(max_val, mutated[param] * factor))
217 |                     else:
218 |                         # Random value from parameter range
219 |                         range_size = max_val - min_val
220 |                         delta = random.uniform(-0.1 * range_size, 0.1 * range_size)
221 |                         mutated[param] = max(min_val, min(max_val, mutated[param] + delta))
222 |         
223 |         return mutated
224 |     
225 |     def evolve_generation(self) -> None:
226 |         """
227 |         Evolve the population by one generation through selection, crossover, and mutation.
228 |         """
229 |         # Select individuals for reproduction
230 |         selected = self.selection()
231 |         
232 |         # Create new generation through crossover and mutation
233 |         new_population = []
234 |         
235 |         # Preserve elite individuals
236 |         elites_count = max(1, int(self.elitism_pct * self.population_size))
237 |         new_population.extend(selected[:elites_count])
238 |         
239 |         # Crossover and mutation for the rest
240 |         while len(new_population) < self.population_size:
241 |             parent1 = random.choice(selected)
242 |             parent2 = random.choice(selected)
243 |             
244 |             child1, child2 = self.crossover(parent1, parent2)
245 |             child1 = self.mutation(child1)
246 |             child2 = self.mutation(child2)
247 |             
248 |             new_population.append(child1)
249 |             if len(new_population) < self.population_size:
250 |                 new_population.append(child2)
251 |         
252 |         self.population = new_population
253 |     
254 |     def run(self, seeded_individuals: List[Dict] = None) -> Dict:
255 |         """
256 |         Run the genetic algorithm for the specified number of generations.
257 |         
258 |         Args:
259 |             seeded_individuals: List of predefined parameter sets to include in the initial population
260 |             
261 |         Returns:
262 |             The best individual found
263 |         """
264 |         # Initialize and evaluate initial population
265 |         self.initialize_population(seeded_individuals)
266 |         self.evaluate_population()
267 |         
268 |         # Store initial generation data
269 |         self.record_generation(0)
270 |         
271 |         # Evolve for specified number of generations
272 |         for generation in range(1, self.generations + 1):
273 |             logger.info(f"Evolving generation {generation}/{self.generations}")
274 |             
275 |             # Evolve population
276 |             self.evolve_generation()
277 |             
278 |             # Evaluate new population
279 |             self.evaluate_population()
280 |             
281 |             # Record generation data
282 |             self.record_generation(generation)
283 |             
284 |             # Log progress
285 |             avg_fitness = sum(self.fitness_scores) / len(self.fitness_scores)
286 |             logger.info(f"Generation {generation}: Best fitness = {self.best_fitness}, Avg fitness = {avg_fitness:.4f}")
287 |         
288 |         logger.info(f"Genetic algorithm completed. Best individual: {self.best_individual}")
289 |         logger.info(f"Best fitness: {self.best_fitness}")
290 |         
291 |         return self.best_individual
292 |     
293 |     def record_generation(self, generation: int) -> None:
294 |         """
295 |         Record data for the current generation.
296 |         
297 |         Args:
298 |             generation: The current generation number
299 |         """
300 |         # Calculate statistics
301 |         avg_fitness = sum(self.fitness_scores) / len(self.fitness_scores)
302 |         min_fitness = min(self.fitness_scores)
303 |         max_fitness = max(self.fitness_scores)
304 |         
305 |         # Find current best individual
306 |         best_idx = self.fitness_scores.index(max_fitness)
307 |         current_best = deepcopy(self.population[best_idx])
308 |         
309 |         # Store generation data
310 |         generation_data = {
311 |             'generation': generation,
312 |             'timestamp': datetime.now().isoformat(),
313 |             'best_fitness': max_fitness,
314 |             'avg_fitness': avg_fitness,
315 |             'min_fitness': min_fitness,
316 |             'best_individual': current_best,
317 |             'diversity': self.calculate_diversity()
318 |         }
319 |         
320 |         self.generation_history.append(generation_data)
321 |     
322 |     def calculate_diversity(self) -> float:
323 |         """
324 |         Calculate the diversity of the current population.
325 |         
326 |         Returns:
327 |             A score between 0-1 representing population diversity
328 |         """
329 |         if not self.population or len(self.population) < 2:
330 |             return 0.0
331 |         
332 |         # Calculate normalized parameter distances
333 |         param_distances = []
334 |         
335 |         for param, (min_val, max_val) in self.param_ranges.items():
336 |             param_range = max_val - min_val
337 |             if param_range == 0:
338 |                 continue
339 |                 
340 |             values = [ind[param] for ind in self.population]
341 |             normalized_values = [(v - min_val) / param_range for v in values]
342 |             
343 |             # Calculate variance of the parameter
344 |             variance = np.var(normalized_values)
345 |             param_distances.append(variance)
346 |         
347 |         # Average variance across all parameters
348 |         return float(np.mean(param_distances))
349 |     
350 |     def get_generation_history(self) -> List[Dict]:
351 |         """
352 |         Get the history of all generations.
353 |         
354 |         Returns:
355 |             List of generation data dictionaries
356 |         """
357 |         return self.generation_history
358 |     
359 |     def get_best_individual(self) -> Dict:
360 |         """
361 |         Get the best individual found.
362 |         
363 |         Returns:
364 |             Dictionary of the best parameter set
365 |         """
366 |         return deepcopy(self.best_individual)
367 |     
368 |     def get_population_diversity(self) -> Dict:
369 |         """
370 |         Get diversity metrics for the current population.
371 |         
372 |         Returns:
373 |             Dictionary of diversity metrics
374 |         """
375 |         diversity = {}
376 |         
377 |         # Overall diversity score
378 |         diversity['overall'] = self.calculate_diversity()
379 |         
380 |         # Parameter-specific diversity
381 |         diversity['parameters'] = {}
382 |         for param, (min_val, max_val) in self.param_ranges.items():
383 |             param_range = max_val - min_val
384 |             if param_range == 0:
385 |                 diversity['parameters'][param] = 0.0
386 |                 continue
387 |                 
388 |             values = [ind[param] for ind in self.population]
389 |             normalized_values = [(v - min_val) / param_range for v in values]
390 |             variance = float(np.var(normalized_values))
391 |             diversity['parameters'][param] = variance
392 |         
393 |         return diversity


--------------------------------------------------------------------------------