Prometheus-Swarm · TestingRabbit-pixel · Jun 4, 2025 · Jun 4, 2025 · Jun 4, 2025 · Jun 4, 2025
diff --git a/.env.example b/.env.example
@@ -0,0 +1,13 @@
+# CoinGecko API Configuration
+
+# Base URL for CoinGecko API (optional, defaults to official endpoint)
+COINGECKO_API_BASE_URL=https://api.coingecko.com/api/v3
+
+# API Key for CoinGecko (required: the config validator rejects an empty key or one shorter than 10 characters)
+COINGECKO_API_KEY=your_api_key_here
+
+# Request timeout in seconds (optional, defaults to 30)
+COINGECKO_REQUEST_TIMEOUT=30
+
+# Rate limit requests per minute (optional, defaults to 50)
+COINGECKO_RATE_LIMIT=50
diff --git a/.gitignore b/.gitignore
@@ -1,48 +1,13 @@
-.venv
+__pycache__/
+*.py[cod]
+*$py.class
 .env
-__pycache__
-.pytest_cache
-.pypirc
-*.db
-test
-test_state.json
-task_flow.egg-info
-example_repo
-signature.js
-git-filter-repo
-task/orca/
-**/dist/
-# yarn.lock
-package-lock.json
-node_modules
-build
-migrate.sh
-*/dev.js
-executables/*
-namespace/*
-config/*
-.env.local
-taskStateInfoKeypair.json
-localKOIIDB.db
-metadata.json
-.npmrc
-*.pem
-.vscode
-.cursor
-data/chunks
-data/process
-test_state.csv
-todos-example.csv
-
-
-# Ignore auto-generated repository directories
-repos/
-
-
-# Ignore Data
-data/*
-
-
-venv
-
-**/venv/
+.venv
+venv/
+.pytest_cache/
+dist/
+build/
+*.egg-info/
+.coverage
+htmlcov/
+.DS_Store
diff --git a/src/__init__.py b/src/__init__.py
@@ -0,0 +1 @@
+# Make src a Python package
diff --git a/src/config_validator.py b/src/config_validator.py
@@ -0,0 +1,156 @@
+from typing import Dict, Any, Optional
+import os
+import re
+
+class ConfigValidationError(Exception):
+    """Raised when a CoinGecko configuration value is missing or invalid."""
+
+class CoinGeckoConfigValidator:
+    """Validates CoinGecko API configuration settings.
+
+    ``API_BASE_URL`` and ``API_KEY`` are required. ``REQUEST_TIMEOUT`` and
+    ``RATE_LIMIT`` are optional and default to 30 and 50 respectively.
+    """
+
+    # Compiled once at class creation rather than on every validation call.
+    _URL_PATTERN = re.compile(
+        r'^https?://'  # http:// or https://
+        r'(?:(?:[A-Z0-9](?:[A-Z0-9-]{0,61}[A-Z0-9])?\.)+[A-Z]{2,6}\.?|'  # domain
+        r'localhost|'  # localhost
+        r'\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3})'  # IP
+        r'(?::\d+)?'  # optional port
+        r'(?:/?|[/?]\S+)$', re.IGNORECASE)
+
+    @staticmethod
+    def validate_config(config: Dict[str, Any]) -> Dict[str, Any]:
+        """
+        Validate and sanitize the configuration dictionary.
+
+        Args:
+            config (Dict[str, Any]): Configuration dictionary to validate
+
+        Returns:
+            Dict[str, Any]: A shallow copy of ``config`` with ``REQUEST_TIMEOUT``
+            and ``RATE_LIMIT`` validated (or filled in with their defaults)
+
+        Raises:
+            ConfigValidationError: If configuration is invalid
+        """
+        config = config.copy()  # Prevent modifying original dict
+
+        # Required keys must be present and non-blank
+        for key in ('API_BASE_URL', 'API_KEY'):
+            if key not in config or config[key] is None or str(config[key]).strip() == '':
+                raise ConfigValidationError(f"Missing or invalid required configuration key: {key}")
+
+        CoinGeckoConfigValidator._validate_url(config['API_BASE_URL'])
+        CoinGeckoConfigValidator._validate_api_key(config['API_KEY'])
+
+        # Optional timeout
+        if 'REQUEST_TIMEOUT' in config:
+            config['REQUEST_TIMEOUT'] = CoinGeckoConfigValidator._validate_timeout(config['REQUEST_TIMEOUT'])
+        else:
+            config['REQUEST_TIMEOUT'] = 30  # Default timeout
+
+        # Optional rate limit
+        if 'RATE_LIMIT' in config:
+            config['RATE_LIMIT'] = CoinGeckoConfigValidator._validate_rate_limit(config['RATE_LIMIT'])
+        else:
+            config['RATE_LIMIT'] = 50  # Default rate limit
+
+        return config
+
+    @staticmethod
+    def _validate_url(url: str) -> None:
+        """
+        Validate URL format.
+
+        Args:
+            url (str): URL to validate
+
+        Raises:
+            ConfigValidationError: If URL is not a string or does not match
+                the expected http(s) URL pattern
+        """
+        # Guard the type first: re.match() would raise TypeError on non-strings.
+        if not isinstance(url, str) or not CoinGeckoConfigValidator._URL_PATTERN.match(url):
+            raise ConfigValidationError(f"Invalid URL format: {url}")
+
+    @staticmethod
+    def _validate_api_key(api_key: str) -> None:
+        """
+        Validate API key format.
+
+        Args:
+            api_key (str): API key to validate
+
+        Raises:
+            ConfigValidationError: If the key, stripped of surrounding
+                whitespace, is shorter than 10 characters
+        """
+        sanitized_key = str(api_key).strip()
+        if len(sanitized_key) < 10:
+            raise ConfigValidationError("Invalid API key: Key is too short")
+
+    @staticmethod
+    def _validate_bounded_number(value: Any, upper: float, label: str) -> float:
+        """
+        Convert ``value`` to float and check that it lies in ``(0, upper]``.
+
+        Args:
+            value (Any): Raw value to convert
+            upper (float): Inclusive upper bound
+            label (str): Setting name used in error messages
+
+        Returns:
+            float: The converted value
+
+        Raises:
+            ConfigValidationError: If the value is not numeric or is out of range
+        """
+        # Only the conversion is guarded, so the range error below is never
+        # confused with a conversion failure.
+        try:
+            number = float(value)
+        except (TypeError, ValueError, OverflowError) as exc:
+            raise ConfigValidationError(
+                f"Invalid {label} value: must be a numeric value, got {type(value)}"
+            ) from exc
+
+        # Written as a positive range test so that NaN, for which every
+        # comparison is False, is rejected as well.
+        if not 0 < number <= upper:
+            raise ConfigValidationError(f"Invalid {label} value: {value}")
+        return number
+
+    @staticmethod
+    def _validate_timeout(timeout: Any) -> float:
+        """
+        Validate request timeout.
+
+        Args:
+            timeout (Any): Timeout value to validate
+
+        Returns:
+            float: Validated timeout value, greater than 0 and at most 120
+
+        Raises:
+            ConfigValidationError: If timeout is invalid
+        """
+        return CoinGeckoConfigValidator._validate_bounded_number(timeout, 120, "timeout")
+
+    @staticmethod
+    def _validate_rate_limit(rate_limit: Any) -> float:
+        """
+        Validate rate limit settings.
+
+        Args:
+            rate_limit (Any): Rate limit configuration to validate
+
+        Returns:
+            float: Validated rate limit value, greater than 0 and at most 100
+
+        Raises:
+            ConfigValidationError: If rate limit is invalid
+        """
+        return CoinGeckoConfigValidator._validate_bounded_number(rate_limit, 100, "rate limit")
+
+    @classmethod
+    def load_from_env(cls) -> Dict[str, Any]:
+        """
+        Load configuration from environment variables.
+
+        Reads ``COINGECKO_API_BASE_URL``, ``COINGECKO_API_KEY``,
+        ``COINGECKO_REQUEST_TIMEOUT`` and ``COINGECKO_RATE_LIMIT``.
+
+        Returns:
+            Dict[str, Any]: Validated configuration from environment
+
+        Raises:
+            ConfigValidationError: If any environment value is missing or invalid
+        """
+        config = {
+            'API_BASE_URL': os.getenv('COINGECKO_API_BASE_URL', 'https://api.coingecko.com/api/v3'),
+            'API_KEY': os.getenv('COINGECKO_API_KEY', ''),
+            'REQUEST_TIMEOUT': os.getenv('COINGECKO_REQUEST_TIMEOUT', '30'),
+            'RATE_LIMIT': os.getenv('COINGECKO_RATE_LIMIT', '50'),
+        }
+
+        # Numeric conversion is left to validate_config so that a malformed
+        # value surfaces as ConfigValidationError rather than a bare ValueError.
+        return cls.validate_config(config)
diff --git a/src/historical_price_transformer.py b/src/historical_price_transformer.py
@@ -0,0 +1,119 @@
+from typing import Dict, List, Union, Optional
+from datetime import datetime
+import logging
+
+class HistoricalPriceTransformer:
+    """
+    Transforms and validates historical price data from CoinGecko API.
+
+    Handles data validation, cleaning, and transformation of historical
+    cryptocurrency price data. Raw points are ``[timestamp_ms, price]`` pairs.
+    """
+
+    @staticmethod
+    def validate_historical_data(data: List[List[Union[int, float]]]) -> bool:
+        """
+        Validate the structure and content of historical price data.
+
+        Each failure is logged via ``logging.error`` before returning.
+
+        Args:
+            data (List[List[Union[int, float]]]): Raw historical price data
+
+        Returns:
+            bool: True if data is valid, False otherwise
+        """
+        if not isinstance(data, list):
+            logging.error("Historical data must be a list")
+            return False
+
+        for point in data:
+            if not isinstance(point, list) or len(point) != 2:
+                logging.error("Invalid data point format: %s", point)
+                return False
+
+            timestamp, price = point
+
+            # Timestamps are in milliseconds. Out-of-range values raise
+            # OverflowError or OSError rather than ValueError, so catch those too.
+            try:
+                datetime.fromtimestamp(timestamp / 1000)
+            except (TypeError, ValueError, OverflowError, OSError):
+                logging.error("Invalid timestamp: %s", timestamp)
+                return False
+
+            # "not price >= 0" also rejects NaN, which "price < 0" lets through.
+            if not isinstance(price, (int, float)) or not price >= 0:
+                logging.error("Invalid price: %s", price)
+                return False
+
+        return True
+
+    @staticmethod
+    def transform_historical_data(
+        data: List[List[Union[int, float]]]
+    ) -> List[Dict[str, Union[int, float, str]]]:
+        """
+        Transform historical price data into a more usable format.
+
+        Each output dict holds the original ``timestamp``, an ISO-8601
+        ``datetime`` string (naive, in the local timezone, as produced by
+        ``datetime.fromtimestamp``) and the ``price``.
+
+        Args:
+            data (List[List[Union[int, float]]]): Raw historical price data
+
+        Returns:
+            List[Dict[str, Union[int, float, str]]]: Transformed historical price data
+
+        Raises:
+            ValueError: If input data is invalid
+        """
+        if not HistoricalPriceTransformer.validate_historical_data(data):
+            raise ValueError("Invalid historical price data")
+
+        return [
+            {
+                'timestamp': timestamp,
+                'datetime': datetime.fromtimestamp(timestamp / 1000).isoformat(),
+                'price': price,
+            }
+            for timestamp, price in data
+        ]
+
+    @staticmethod
+    def filter_historical_data(
+        data: List[Dict[str, Union[int, float, str]]],
+        start_date: Optional[datetime] = None,
+        end_date: Optional[datetime] = None,
+        min_price: Optional[float] = None,
+        max_price: Optional[float] = None
+    ) -> List[Dict[str, Union[int, float, str]]]:
+        """
+        Filter historical price data based on optional criteria.
+
+        Args:
+            data (List[Dict[str, Union[int, float, str]]]): Transformed historical price data
+            start_date (Optional[datetime]): Minimum date for filtering (exclusive)
+            end_date (Optional[datetime]): Maximum date for filtering (exclusive)
+            min_price (Optional[float]): Minimum price for filtering (inclusive)
+            max_price (Optional[float]): Maximum price for filtering (inclusive)
+
+        Returns:
+            List[Dict[str, Union[int, float, str]]]: Filtered historical price data
+        """
+        def meets_filter_criteria(point):
+            point_datetime = datetime.fromisoformat(point['datetime'])
+
+            # Date bounds are exclusive: a point exactly on a bound is dropped
+            if start_date is not None and point_datetime <= start_date:
+                return False
+            if end_date is not None and point_datetime >= end_date:
+                return False
+
+            # Price bounds are inclusive
+            if min_price is not None and point['price'] < min_price:
+                return False
+            if max_price is not None and point['price'] > max_price:
+                return False
+
+            return True
+
+        return [point for point in data if meets_filter_criteria(point)]