|
1 | 1 | """Wrapper of Reader with S3 support."""
|
| 2 | +from __future__ import annotations |
2 | 3 |
|
3 | 4 | import logging
|
4 |
| -from typing import overload, Union, Optional |
| 5 | +from typing import overload, Union, Optional, Any |
5 | 6 | from collections.abc import Iterator
|
6 | 7 | from urllib.parse import urlparse
|
7 | 8 |
|
8 | 9 | from .protocols import ReaderProtocol
|
9 | 10 | from .libcachesim_python import (
|
10 | 11 | TraceType,
|
11 |
| - SamplerType, |
| 12 | + TraceFormat, |
12 | 13 | Request,
|
13 | 14 | ReaderInitParam,
|
14 | 15 | Reader,
|
|
21 | 22 | logger = logging.getLogger(__name__)
|
22 | 23 |
|
23 | 24 |
|
class TraceReaderSliceIterator:
    """Lazy iterator over the requests selected by slicing a ``TraceReader``.

    ``start``, ``stop`` and ``step`` are expected to be already normalised,
    i.e. the triple returned by ``slice.indices(len)``. Both positive and
    negative steps are supported.

    Every call to ``__next__`` resets the underlying reader and seeks to the
    wanted position again, so iterating a slice changes the read position of
    the ``TraceReader`` it was created from.
    """

    def __init__(self, reader: "TraceReader", start: int, stop: int, step: int):
        """Store the reader and the normalised slice bounds.

        Raises:
            ValueError: if ``step`` is zero (the iterator would never advance).
        """
        if step == 0:
            # Same message as the built-in slice machinery uses.
            raise ValueError("slice step cannot be zero")
        self.reader = reader
        self.start = start
        self.stop = stop
        self.step = step
        self.current = start

    def __iter__(self) -> "Iterator[Request]":
        """Return the iterator itself."""
        return self

    def __next__(self) -> "Request":
        """Return the request at the current position and advance by ``step``.

        Raises:
            StopIteration: once the position has moved past ``stop``.
        """
        if self._exhausted():
            raise StopIteration

        # Always start from the beginning of the trace so that ``current``
        # is an absolute position.
        self.reader.reset()

        if self.reader._reader.is_zstd_file:
            # zstd files cannot use skip_n_req; read and discard instead.
            logger.debug("Simulating skip by reading %s requests one by one", self.current)
            req = self.reader._simulate_skip_and_read_single(self.current)
        else:
            logger.debug("Skipping %s requests using skip_n_req", self.current)
            try:
                self.reader.skip_n_req(self.current)
                req = self.reader.read_one_req()
            except RuntimeError:
                logger.warning("Failed to skip %s requests, falling back to simulation", self.current)
                # The failed skip/read may have moved the reader; rewind so
                # the simulated skip counts from the first request again.
                self.reader.reset()
                req = self.reader._simulate_skip_and_read_single(self.current)

        self.current += self.step
        return req

    def _exhausted(self) -> bool:
        """Tell whether ``current`` has passed ``stop`` in the step direction."""
        if self.step > 0:
            return self.current >= self.stop
        return self.current <= self.stop
| 63 | + |
| 64 | + |
24 | 65 | class TraceReader(ReaderProtocol):
|
25 | 66 | _reader: Reader
|
26 | 67 |
|
@@ -302,10 +343,52 @@ def __next__(self) -> Request:
|
302 | 343 | raise StopIteration
|
303 | 344 | return req
|
304 | 345 |
|
305 |
| - def __getitem__(self, index: int) -> Request: |
306 |
| - if index < 0 or index >= self._reader.get_num_of_req(): |
307 |
| - raise IndexError("Index out of range") |
308 |
| - self._reader.reset() |
309 |
| - self._reader.skip_n_req(index) |
| 346 | + def __getitem__(self, key: Union[int, slice]) -> Union[Request, TraceReaderSliceIterator]: |
| 347 | + if isinstance(key, slice): |
| 348 | + # Handle slice |
| 349 | + total_len = self._reader.get_num_of_req() |
| 350 | + start, stop, step = key.indices(total_len) |
| 351 | + return TraceReaderSliceIterator(self, start, stop, step) |
| 352 | + elif isinstance(key, int): |
| 353 | + # Handle single index |
| 354 | + total_len = self._reader.get_num_of_req() |
| 355 | + if key < 0: |
| 356 | + key += total_len |
| 357 | + if key < 0 or key >= total_len: |
| 358 | + raise IndexError("Index out of range") |
| 359 | + |
| 360 | + self._reader.reset() |
| 361 | + |
| 362 | + # Check if we can use skip_n_req or need to simulate |
| 363 | + if self._can_use_skip_n_req(): |
| 364 | + try: |
| 365 | + self._reader.skip_n_req(key) |
| 366 | + req = Request() |
| 367 | + ret = self._reader.read_one_req(req) |
| 368 | + if ret != 0: |
| 369 | + raise RuntimeError("Failed to read request") |
| 370 | + return req |
| 371 | + except RuntimeError: |
| 372 | + # Fallback to simulation |
| 373 | + self._reader.reset() |
| 374 | + return self._simulate_skip_and_read_single(key) |
| 375 | + else: |
| 376 | + # Simulate skip by reading requests one by one |
| 377 | + return self._simulate_skip_and_read_single(key) |
| 378 | + else: |
| 379 | + raise TypeError("TraceReader indices must be integers or slices") |
| 380 | + |
| 381 | + def _simulate_skip_and_read_single(self, index: int) -> Request: |
| 382 | + """Simulate skip_n_req by reading requests one by one for single index access.""" |
| 383 | + for _ in range(index): |
| 384 | + req = Request() |
| 385 | + ret = self._reader.read_one_req(req) |
| 386 | + if ret != 0: |
| 387 | + raise IndexError(f"Cannot reach index {index}") |
| 388 | + |
| 389 | + # Read the target request |
310 | 390 | req = Request()
|
311 |
| - return self._reader.read_one_req(req) |
| 391 | + ret = self._reader.read_one_req(req) |
| 392 | + if ret != 0: |
| 393 | + raise IndexError(f"Cannot read request at index {index}") |
| 394 | + return req |
0 commit comments