Update docs, enable exchanges, and fix tests

- Update CLAUDE.md to reflect actual module structure (add websocket,
  connection_pool, monitoring modules; remove outdated "Planned" note)
- Enable additional exchanges in config.yaml (kucoin, kraken, okx, etc.)
- Fix cache manager to refetch when memory has fewer candles than limit
- Fix benchmark tests asyncio event loop issues (use new_event_loop)
- Update unit tests to match new cache behavior and config

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
This commit is contained in:
rob 2026-03-06 13:36:38 -04:00
parent cdc04d010a
commit bf95490673
7 changed files with 243 additions and 148 deletions

View File

@@ -84,24 +84,28 @@ Three-tier caching system with REST API and WebSocket interfaces:
| `main.py` | Entry point, starts REST server |
| `config.py` | Configuration loading from YAML |
| `api/rest.py` | FastAPI REST endpoints |
| `api/websocket.py` | WebSocket server for real-time updates |
| `cache/manager.py` | Core cache logic (memory → db → exchange) |
| `cache/memory.py` | In-memory LRU cache with TTL |
| `cache/database.py` | Synchronous SQLite operations |
| `cache/async_database.py` | Async SQLite operations for candle persistence |
| `cache/connection_pool.py` | Database connection pooling |
| `cache/gaps.py` | Gap detection in candle data |
| `cache/gap_filler.py` | Gap filling logic |
| `cache/completeness.py` | Completeness tracking for data ranges |
| `exchanges/base.py` | Abstract exchange connector interface |
| `exchanges/ccxt_connector.py` | CCXT-based connector implementation |
| `exchanges/binance.py` | Binance connector |
| `exchanges/ccxt_connector.py` | CCXT-based connector (supports 100+ exchanges) |
| `exchanges/binance.py` | Binance-specific connector (legacy, WebSocket support) |
| `candles/assembler.py` | Builds candles from trade ticks |
| `candles/models.py` | Candle data models and validation |
| `sessions/manager.py` | Session management for connections |
| `sessions/models.py` | Session data models |
| `monitoring/health.py` | Health check endpoints and system status |
| `monitoring/metrics.py` | Performance metrics tracking |
| `utils/timeframes.py` | Timeframe utilities and conversions |
| `utils/timestamps.py` | Timestamp utilities |
**Planned (M2):** `api/websocket.py`, `exchanges/kucoin.py`, `exchanges/kraken.py`
**Note:** KuCoin, Kraken, and 100+ other exchanges are supported via `CCXTConnector` - use `create_connector("exchange_name")` from `exchanges/__init__.py`.
### Key Paths

View File

@@ -12,15 +12,54 @@ cache:
memory_ttl_seconds: 432000 # 5 days (matches BrighterTrading)
exchanges:
# Major exchanges with good public API support
binance:
enabled: true
rate_limit_ms: 100
# Disabled until connectors are implemented:
binanceus:
enabled: true
rate_limit_ms: 100
bybit:
enabled: true
rate_limit_ms: 100
kucoin:
enabled: false
enabled: true
rate_limit_ms: 100
kraken:
enabled: false
enabled: true
rate_limit_ms: 100
okx:
enabled: true
rate_limit_ms: 100
coinbase:
enabled: true
rate_limit_ms: 100
bitget:
enabled: true
rate_limit_ms: 100
mexc:
enabled: true
rate_limit_ms: 100
gate:
enabled: true
rate_limit_ms: 100
htx:
enabled: true
rate_limit_ms: 100
bitfinex:
enabled: true
rate_limit_ms: 100
bitstamp:
enabled: true
rate_limit_ms: 100
gemini:
enabled: true
rate_limit_ms: 100
poloniex:
enabled: true
rate_limit_ms: 100
cryptocom:
enabled: true
rate_limit_ms: 100
logging:

View File

@@ -139,9 +139,26 @@ class CacheManager:
)
if memory_candles and not memory_gaps:
# Complete data in memory
logger.debug(f"Memory cache hit: {len(memory_candles)} candles")
return memory_candles, "memory"
# For limit-only requests, ensure we have enough candles
# (e.g., WebSocket may have accumulated fewer candles than requested)
if (
request.limit is not None
and len(memory_candles) < request.limit
and request.start is None
and request.end is None
):
# Insufficient data for limit-only request - fall through to fetch more
logger.debug(
f"Memory has {len(memory_candles)} candles but {request.limit} requested, "
"fetching more from exchange"
)
# Clear memory_candles so we don't return partial data
# We'll fetch fresh from exchange
memory_candles = []
else:
# Complete data in memory
logger.debug(f"Memory cache hit: {len(memory_candles)} candles")
return memory_candles, "memory"
all_candles.extend(memory_candles)
gaps_to_fill = memory_gaps if memory_gaps else [(request.start, request.end)]

View File

@@ -170,72 +170,88 @@ class TestDatabaseCacheBenchmarks:
with tempfile.TemporaryDirectory() as tmpdir:
yield os.path.join(tmpdir, "test.db")
@pytest.mark.asyncio
async def test_database_put_100_candles(self, benchmark, temp_db_path):
def test_database_put_100_candles(self, benchmark, temp_db_path):
"""Benchmark storing 100 candles in database."""
db = AsyncDatabaseCache(db_path=temp_db_path)
await db.initialize()
candles = generate_candles(100)
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
db = AsyncDatabaseCache(db_path=temp_db_path)
loop.run_until_complete(db.initialize())
candles = generate_candles(100)
def put_candles():
asyncio.get_event_loop().run_until_complete(
db.put("binance", "BTC/USDT", "5m", candles)
)
def put_candles():
loop.run_until_complete(
db.put("binance", "BTC/USDT", "5m", candles)
)
benchmark(put_candles)
await db.close()
benchmark(put_candles)
loop.run_until_complete(db.close())
finally:
loop.close()
@pytest.mark.asyncio
async def test_database_put_1000_candles(self, benchmark, temp_db_path):
def test_database_put_1000_candles(self, benchmark, temp_db_path):
"""Benchmark storing 1000 candles in database."""
db = AsyncDatabaseCache(db_path=temp_db_path)
await db.initialize()
candles = generate_candles(1000)
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
db = AsyncDatabaseCache(db_path=temp_db_path)
loop.run_until_complete(db.initialize())
candles = generate_candles(1000)
def put_candles():
asyncio.get_event_loop().run_until_complete(
db.put("binance", "BTC/USDT", "5m", candles)
)
def put_candles():
loop.run_until_complete(
db.put("binance", "BTC/USDT", "5m", candles)
)
benchmark(put_candles)
await db.close()
benchmark(put_candles)
loop.run_until_complete(db.close())
finally:
loop.close()
@pytest.mark.asyncio
async def test_database_get_1000_candles(self, benchmark, temp_db_path):
def test_database_get_1000_candles(self, benchmark, temp_db_path):
"""Benchmark retrieving 1000 candles from database."""
db = AsyncDatabaseCache(db_path=temp_db_path)
await db.initialize()
candles = generate_candles(1000)
await db.put("binance", "BTC/USDT", "5m", candles)
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
db = AsyncDatabaseCache(db_path=temp_db_path)
loop.run_until_complete(db.initialize())
candles = generate_candles(1000)
loop.run_until_complete(db.put("binance", "BTC/USDT", "5m", candles))
def get_candles():
return asyncio.get_event_loop().run_until_complete(
db.get("binance", "BTC/USDT", "5m")
)
def get_candles():
return loop.run_until_complete(
db.get("binance", "BTC/USDT", "5m")
)
result = benchmark(get_candles)
assert len(result[0]) == 1000
await db.close()
result = benchmark(get_candles)
assert len(result[0]) == 1000
loop.run_until_complete(db.close())
finally:
loop.close()
@pytest.mark.asyncio
async def test_database_get_with_time_range(self, benchmark, temp_db_path):
def test_database_get_with_time_range(self, benchmark, temp_db_path):
"""Benchmark retrieving candles with time range filter."""
db = AsyncDatabaseCache(db_path=temp_db_path)
await db.initialize()
candles = generate_candles(10000)
await db.put("binance", "BTC/USDT", "5m", candles)
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
db = AsyncDatabaseCache(db_path=temp_db_path)
loop.run_until_complete(db.initialize())
candles = generate_candles(10000)
loop.run_until_complete(db.put("binance", "BTC/USDT", "5m", candles))
start_time = candles[2500].time
end_time = candles[7500].time
start_time = candles[2500].time
end_time = candles[7500].time
def get_candles():
return asyncio.get_event_loop().run_until_complete(
db.get("binance", "BTC/USDT", "5m", start=start_time, end=end_time)
)
def get_candles():
return loop.run_until_complete(
db.get("binance", "BTC/USDT", "5m", start=start_time, end=end_time)
)
result = benchmark(get_candles)
assert len(result[0]) > 0
await db.close()
result = benchmark(get_candles)
assert len(result[0]) > 0
loop.run_until_complete(db.close())
finally:
loop.close()
# =============================================================================
@@ -292,64 +308,72 @@ class TestCacheFlowBenchmarks:
with tempfile.TemporaryDirectory() as tmpdir:
yield os.path.join(tmpdir, "test.db")
@pytest.mark.asyncio
async def test_cache_manager_memory_hit(self, benchmark, temp_db_path):
def test_cache_manager_memory_hit(self, benchmark, temp_db_path):
"""Benchmark cache manager with memory cache hit."""
manager = CacheManager(
cache_config=CacheConfig(),
database_config=DatabaseConfig(path=temp_db_path),
)
await manager.initialize()
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
manager = CacheManager(
cache_config=CacheConfig(),
database_config=DatabaseConfig(path=temp_db_path),
)
loop.run_until_complete(manager.initialize())
# Pre-populate memory cache
candles = generate_candles(1000)
manager.memory.put("binance:BTC/USDT:5m", candles)
# Pre-populate memory cache
candles = generate_candles(1000)
manager.memory.put("binance:BTC/USDT:5m", candles)
request = CandleRequest(
exchange="binance",
symbol="BTC/USDT",
timeframe="5m",
limit=100,
)
def get_candles():
return asyncio.get_event_loop().run_until_complete(
manager.get_candles(request)
request = CandleRequest(
exchange="binance",
symbol="BTC/USDT",
timeframe="5m",
limit=100,
)
result = benchmark(get_candles)
assert len(result) == 100
def get_candles():
return loop.run_until_complete(
manager.get_candles(request)
)
@pytest.mark.asyncio
async def test_cache_manager_database_hit(self, benchmark, temp_db_path):
result = benchmark(get_candles)
assert len(result) == 100
finally:
loop.close()
def test_cache_manager_database_hit(self, benchmark, temp_db_path):
"""Benchmark cache manager with database hit (cold memory cache)."""
manager = CacheManager(
cache_config=CacheConfig(),
database_config=DatabaseConfig(path=temp_db_path),
)
await manager.initialize()
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
manager = CacheManager(
cache_config=CacheConfig(),
database_config=DatabaseConfig(path=temp_db_path),
)
loop.run_until_complete(manager.initialize())
# Pre-populate database only
candles = generate_candles(1000)
await manager.database.put("binance", "BTC/USDT", "5m", candles)
# Pre-populate database only
candles = generate_candles(1000)
loop.run_until_complete(manager.database.put("binance", "BTC/USDT", "5m", candles))
request = CandleRequest(
exchange="binance",
symbol="BTC/USDT",
timeframe="5m",
start=candles[0].time,
end=candles[-1].time,
)
def get_candles():
# Clear memory cache to force database read
manager.clear_memory()
return asyncio.get_event_loop().run_until_complete(
manager.get_candles(request)
request = CandleRequest(
exchange="binance",
symbol="BTC/USDT",
timeframe="5m",
start=candles[0].time,
end=candles[-1].time,
)
result = benchmark(get_candles)
assert len(result) > 0
def get_candles():
# Clear memory cache to force database read
manager.clear_memory()
return loop.run_until_complete(
manager.get_candles(request)
)
result = benchmark(get_candles)
assert len(result) > 0
finally:
loop.close()
# =============================================================================
@@ -366,45 +390,53 @@ class TestConnectionPoolBenchmarks:
with tempfile.TemporaryDirectory() as tmpdir:
yield os.path.join(tmpdir, "test.db")
@pytest.mark.asyncio
async def test_concurrent_reads(self, benchmark, temp_db_path):
def test_concurrent_reads(self, benchmark, temp_db_path):
"""Benchmark concurrent database reads with connection pool."""
db = AsyncDatabaseCache(db_path=temp_db_path, pool_size=5)
await db.initialize()
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
db = AsyncDatabaseCache(db_path=temp_db_path, pool_size=5)
loop.run_until_complete(db.initialize())
# Pre-populate
candles = generate_candles(1000)
await db.put("binance", "BTC/USDT", "5m", candles)
# Pre-populate
candles = generate_candles(1000)
loop.run_until_complete(db.put("binance", "BTC/USDT", "5m", candles))
async def concurrent_reads():
tasks = [
db.get("binance", "BTC/USDT", "5m", limit=100)
for _ in range(10)
]
return await asyncio.gather(*tasks)
async def concurrent_reads():
tasks = [
db.get("binance", "BTC/USDT", "5m", limit=100)
for _ in range(10)
]
return await asyncio.gather(*tasks)
def run_concurrent():
return asyncio.get_event_loop().run_until_complete(concurrent_reads())
def run_concurrent():
return loop.run_until_complete(concurrent_reads())
results = benchmark(run_concurrent)
assert len(results) == 10
await db.close()
results = benchmark(run_concurrent)
assert len(results) == 10
loop.run_until_complete(db.close())
finally:
loop.close()
@pytest.mark.asyncio
async def test_concurrent_writes(self, benchmark, temp_db_path):
def test_concurrent_writes(self, benchmark, temp_db_path):
"""Benchmark concurrent database writes with connection pool."""
db = AsyncDatabaseCache(db_path=temp_db_path, pool_size=5)
await db.initialize()
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
try:
db = AsyncDatabaseCache(db_path=temp_db_path, pool_size=5)
loop.run_until_complete(db.initialize())
async def concurrent_writes():
tasks = []
for i in range(10):
candles = generate_candles(100, start_time=1700000000 + i * 1000000)
tasks.append(db.put("binance", f"SYM{i}/USDT", "5m", candles))
await asyncio.gather(*tasks)
async def concurrent_writes():
tasks = []
for i in range(10):
candles = generate_candles(100, start_time=1700000000 + i * 1000000)
tasks.append(db.put("binance", f"SYM{i}/USDT", "5m", candles))
await asyncio.gather(*tasks)
def run_concurrent():
asyncio.get_event_loop().run_until_complete(concurrent_writes())
def run_concurrent():
loop.run_until_complete(concurrent_writes())
benchmark(run_concurrent)
await db.close()
benchmark(run_concurrent)
loop.run_until_complete(db.close())
finally:
loop.close()

View File

@@ -76,7 +76,7 @@ class TestCacheManagerColdCache:
@pytest.mark.asyncio
@patch("exchange_data_manager.cache.memory.time.time")
async def test_limit_only_caches_result(self, mock_time, cache_manager):
"""Test that limit-only results are cached in memory."""
"""Test that limit-only results are cached in memory when request is satisfied."""
# Mock time to be close to test candle timestamps (prevents freshness check)
mock_time.return_value = 1709337660 # Just after the candle
@@ -87,13 +87,15 @@ class TestCacheManagerColdCache:
mock_connector.fetch_candles.return_value = expected_candles
cache_manager.register_exchange("binance", mock_connector)
# Request exactly 1 candle - matches what memory will have after first call
# (If we requested more, the cache manager would refetch since memory has fewer)
request = CandleRequest(
exchange="binance",
symbol="BTC/USDT",
timeframe="1m",
start=None,
end=None,
limit=100,
limit=1,
)
# First call - fetches from exchange
@@ -101,7 +103,7 @@ class TestCacheManagerColdCache:
assert mock_connector.fetch_candles.call_count == 1
assert len(result1) == 1
# Second call - memory cache has data, so doesn't need to fetch again
# Second call - memory cache has enough data (1 >= 1), uses cache
result2 = await cache_manager.get_candles(request)
assert mock_connector.fetch_candles.call_count == 1 # Still 1 - used cache
assert len(result2) == 1

View File

@@ -118,11 +118,10 @@ class TestConfigLoad:
enabled = config.get_enabled_exchanges()
assert isinstance(enabled, list)
# Binance should be enabled per config.yaml
# Major exchanges should be enabled per config.yaml
assert "binance" in enabled
# kucoin/kraken disabled in config.yaml
assert "kucoin" not in enabled
assert "kraken" not in enabled
assert "kucoin" in enabled
assert "kraken" in enabled
class TestConnectorRegistry:

View File

@@ -86,7 +86,7 @@ class TestCacheManagerIntegration:
@pytest.mark.asyncio
@patch("exchange_data_manager.cache.memory.time.time")
async def test_warm_cache_uses_memory(self, mock_time, cache_manager):
"""Test that warm cache uses memory instead of exchange."""
"""Test that warm cache uses memory instead of exchange when limit is satisfied."""
# Mock time to be close to test candle timestamps (prevents freshness check)
mock_time.return_value = 1709337720 # Just after the second candle
@@ -97,18 +97,20 @@ class TestCacheManagerIntegration:
]
cache_manager.register_exchange("binance", mock_connector)
# Request exactly 2 candles - matches what memory will have after first call
# (If we requested more, the cache manager would refetch since memory has fewer)
request = CandleRequest(
exchange="binance",
symbol="BTC/USDT",
timeframe="1m",
limit=100,
limit=2,
)
# First call - cold cache
await cache_manager.get_candles(request)
assert mock_connector.fetch_candles.call_count == 1
# Second call - should use memory
# Second call - should use memory (has 2 candles, requested 2)
result = await cache_manager.get_candles(request)
assert len(result) == 2
assert mock_connector.fetch_candles.call_count == 1 # No additional call