`quantex.sources`

DataSource abstractions for the QuantEx library.

`BacktestingDataSource`

Bases: DataSource

A data source for backtesting that must have a defined length.

Source code in src/quantex/sources.py

class BacktestingDataSource(DataSource):
    """A data source for backtesting that must have a defined length."""

    @abstractmethod
    def __len__(self) -> int:  # pragma: no cover – abstract contract
        raise NotImplementedError

    @abstractmethod
    def get_raw_data(self) -> pd.DataFrame:
        """Returns the entire underlying data as a DataFrame.

        This method is intended for use by the backtesting engine for
        pre-computation and should not be used in strategy logic.
        """
        raise NotImplementedError

`get_raw_data()` `abstractmethod`

Returns the entire underlying data as a DataFrame.

This method is intended for use by the backtesting engine for pre-computation and should not be used in strategy logic.

Source code in src/quantex/sources.py

@abstractmethod
def get_raw_data(self) -> pd.DataFrame:
    """Returns the entire underlying data as a DataFrame.

    This method is intended for use by the backtesting engine for
    pre-computation and should not be used in strategy logic.
    """
    raise NotImplementedError

`CSVDataSource`

Bases: BacktestingDataSource

Backtesting data source backed by a local OHLCV CSV file.

The CSV must contain 'timestamp', 'open', 'high', 'low', 'close', and 'volume' columns. The 'timestamp' column will be parsed as dates.

Source code in src/quantex/sources.py

class CSVDataSource(BacktestingDataSource):
    """Backtesting data source backed by a local OHLCV CSV file.

    The CSV must contain 'timestamp', 'open', 'high', 'low', 'close', and
    'volume' columns. The 'timestamp' column will be parsed as dates.
    """

    def __init__(self, path: str | Path, symbol: Optional[str] = None):
        """Initializes the CSVDataSource.

        Args:
            path: The path to the CSV file.
            symbol: The symbol for the data. If None, it's inferred from the
                file name.

        Raises:
            FileNotFoundError: If the CSV file does not exist.
            ValueError: If the CSV is missing required columns.
        """
        self.path = Path(path)
        if not self.path.exists():
            raise FileNotFoundError(self.path)

        df = pd.read_csv(self.path, parse_dates=["timestamp"])
        df = df.set_index("timestamp")
        df = df.sort_index()
        required_cols = {"open", "high", "low", "close", "volume"}
        if not required_cols.issubset(df.columns):
            missing = required_cols.difference(df.columns)
            raise ValueError(f"CSV missing required columns: {missing}")

        self._df = df  # immutable reference
        self.symbol = symbol or self.path.stem
        self.index = 0

    def get_raw_data(self) -> pd.DataFrame:
        return self._df

    def __len__(self) -> int:
        """Returns the number of bars in the data source."""
        return len(self._df)

    def peek_timestamp(self) -> datetime | None:
        """Peeks at the timestamp of the next available bar from the CSV.

        Returns:
            The next timestamp, or None if the source is exhausted.
        """
        if self.index < len(self):
            return self._df.index[self.index]
        return None

    def get_current_bar(self) -> Bar:
        """Returns the current bar from the CSV data."""
        row = self._df.iloc[self.index]
        ts = self._df.index[self.index]
        return Bar(
            timestamp=ts,
            open=row["open"],
            high=row["high"],
            low=row["low"],
            close=row["close"],
            volume=row["volume"],
            symbol=self.symbol,
        )

    def get_lookback_data(self, lookback_period: int) -> pd.DataFrame:
        """Returns a lookback window of data from the CSV.

        Args:
            lookback_period: The size of the lookback window.

        Returns:
            A pandas DataFrame containing the lookback data, inclusive of the current bar.
        """
        start = max(0, self.index - lookback_period + 1)
        return self._df.iloc[start : self.index + 1].copy()

`init(path, symbol=None)`

Initializes the CSVDataSource.

Parameters:

Name	Type	Description	Default
`path`	`str \| Path`	The path to the CSV file.	required
`symbol`	`Optional[str]`	The symbol for the data. If None, it's inferred from the file name.	`None`

Raises:

Type	Description
`FileNotFoundError`	If the CSV file does not exist.
`ValueError`	If the CSV is missing required columns.

Source code in src/quantex/sources.py

def __init__(self, path: str | Path, symbol: Optional[str] = None):
    """Initializes the CSVDataSource.

    Args:
        path: The path to the CSV file.
        symbol: The symbol for the data. If None, it's inferred from the
            file name.

    Raises:
        FileNotFoundError: If the CSV file does not exist.
        ValueError: If the CSV is missing required columns.
    """
    self.path = Path(path)
    if not self.path.exists():
        raise FileNotFoundError(self.path)

    df = pd.read_csv(self.path, parse_dates=["timestamp"])
    df = df.set_index("timestamp")
    df = df.sort_index()
    required_cols = {"open", "high", "low", "close", "volume"}
    if not required_cols.issubset(df.columns):
        missing = required_cols.difference(df.columns)
        raise ValueError(f"CSV missing required columns: {missing}")

    self._df = df  # immutable reference
    self.symbol = symbol or self.path.stem
    self.index = 0

`len()`

Returns the number of bars in the data source.

Source code in src/quantex/sources.py

def __len__(self) -> int:
    """Returns the number of bars in the data source."""
    return len(self._df)

`get_current_bar()`

Returns the current bar from the CSV data.

Source code in src/quantex/sources.py

def get_current_bar(self) -> Bar:
    """Returns the current bar from the CSV data."""
    row = self._df.iloc[self.index]
    ts = self._df.index[self.index]
    return Bar(
        timestamp=ts,
        open=row["open"],
        high=row["high"],
        low=row["low"],
        close=row["close"],
        volume=row["volume"],
        symbol=self.symbol,
    )

`get_lookback_data(lookback_period)`

Returns a lookback window of data from the CSV.

Parameters:

Name	Type	Description	Default
`lookback_period`	`int`	The size of the lookback window.	required

Returns:

Type	Description
`DataFrame`	A pandas DataFrame containing the lookback data, inclusive of the current bar.

Source code in src/quantex/sources.py

def get_lookback_data(self, lookback_period: int) -> pd.DataFrame:
    """Returns a lookback window of data from the CSV.

    Args:
        lookback_period: The size of the lookback window.

    Returns:
        A pandas DataFrame containing the lookback data, inclusive of the current bar.
    """
    start = max(0, self.index - lookback_period + 1)
    return self._df.iloc[start : self.index + 1].copy()

`peek_timestamp()`

Peeks at the timestamp of the next available bar from the CSV.

Returns:

Type	Description
`datetime \| None`	The next timestamp, or None if the source is exhausted.

Source code in src/quantex/sources.py

def peek_timestamp(self) -> datetime | None:
    """Peeks at the timestamp of the next available bar from the CSV.

    Returns:
        The next timestamp, or None if the source is exhausted.
    """
    if self.index < len(self):
        return self._df.index[self.index]
    return None

`DataSource`

Bases: ABC

Abstract data source for providing market data.

Implementations must provide the current bar via get_current_bar and allow a rolling historical window via get_lookback_data. The internal pointer index starts at 0 and should be advanced by calling _increment_index once the engine has finished processing a bar.

Source code in src/quantex/sources.py

class DataSource(ABC):
    """Abstract data source for providing market data.

    Implementations must provide the *current* bar via `get_current_bar`
    and allow a rolling historical window via `get_lookback_data`.
    The internal pointer `index` starts at 0 and should be advanced by calling
    `_increment_index` once the engine has finished processing a bar.
    """

    index: int = 0
    symbol: str | None = None

    @abstractmethod
    def get_current_bar(self) -> Bar:
        """Returns the bar at the current `index` position."""
        raise NotImplementedError

    @abstractmethod
    def get_lookback_data(self, lookback_period: int) -> pd.DataFrame:
        """Returns a lookback window of data.

        Args:
            lookback_period: The size of the lookback window.

        Returns:
            A pandas DataFrame containing the lookback data, inclusive of the
            current bar.
        """
        raise NotImplementedError

    @abstractmethod
    def peek_timestamp(self) -> datetime | None:
        """Peeks at the timestamp of the next available bar.

        This method should return the timestamp of the bar at the current
        `index` without advancing the index. If the source is exhausted,
        it should return `None`.

        Returns:
            The next timestamp, or None if the source is exhausted.
        """
        raise NotImplementedError

    def _increment_index(self) -> None:
        """Advances the internal pointer to the next bar."""
        self.index += 1

`get_current_bar()` `abstractmethod`

Returns the bar at the current index position.

Source code in src/quantex/sources.py

@abstractmethod
def get_current_bar(self) -> Bar:
    """Returns the bar at the current `index` position."""
    raise NotImplementedError

`get_lookback_data(lookback_period)` `abstractmethod`

Returns a lookback window of data.

Parameters:

Name	Type	Description	Default
`lookback_period`	`int`	The size of the lookback window.	required

Returns:

Type	Description
`DataFrame`	A pandas DataFrame containing the lookback data, inclusive of the
`DataFrame`	current bar.

Source code in src/quantex/sources.py

@abstractmethod
def get_lookback_data(self, lookback_period: int) -> pd.DataFrame:
    """Returns a lookback window of data.

    Args:
        lookback_period: The size of the lookback window.

    Returns:
        A pandas DataFrame containing the lookback data, inclusive of the
        current bar.
    """
    raise NotImplementedError

`peek_timestamp()` `abstractmethod`

Peeks at the timestamp of the next available bar.

This method should return the timestamp of the bar at the current index without advancing the index. If the source is exhausted, it should return None.

Returns:

Type	Description
`datetime \| None`	The next timestamp, or None if the source is exhausted.

Source code in src/quantex/sources.py

@abstractmethod
def peek_timestamp(self) -> datetime | None:
    """Peeks at the timestamp of the next available bar.

    This method should return the timestamp of the bar at the current
    `index` without advancing the index. If the source is exhausted,
    it should return `None`.

    Returns:
        The next timestamp, or None if the source is exhausted.
    """
    raise NotImplementedError

`ParquetDataSource`

Bases: BacktestingDataSource

Backtesting data source backed by a local OHLCV Parquet file.

The Parquet file must contain either an index of timestamps or a column named 'timestamp', as well as the standard OHLCV columns. If a 'timestamp' column exists, it will be parsed and set as the index.

Source code in src/quantex/sources.py

class ParquetDataSource(BacktestingDataSource):
    """Backtesting data source backed by a local OHLCV Parquet file.

    The Parquet file must contain either an index of timestamps or a column
    named 'timestamp', as well as the standard OHLCV columns. If a
    'timestamp' column exists, it will be parsed and set as the index.
    """

    def __init__(self, path: str | Path, symbol: Optional[str] = None):
        """Initializes the ParquetDataSource.

        Args:
            path: Path to the Parquet file on disk.
            symbol: Optional symbol name. If omitted, the stem of the path is
                used instead.
        """
        if not isinstance(path, Path):
            path = Path(path)
        self.path = path
        if not self.path.exists():
            raise FileNotFoundError(self.path)

        # Load data – let pandas/FastParquet handle decompression & column types
        df = pd.read_parquet(self.path)

        # If timestamp is a regular column, make it the index
        if "timestamp" in df.columns:
            df["timestamp"] = pd.to_datetime(df["timestamp"], utc=True)
            df = df.set_index("timestamp")

        # Ensure chronological order
        df = df.sort_index()

        required_cols = {"open", "high", "low", "close", "volume"}
        if not required_cols.issubset(df.columns):
            missing = required_cols.difference(df.columns)
            raise ValueError(f"Parquet missing required columns: {missing}")

        # Immutable reference to underlying data
        self._df = df
        self.symbol = symbol or self.path.stem
        self.index = 0

    # --- BacktestingDataSource API -----------------------------------------
    def get_raw_data(self) -> pd.DataFrame:  # type: ignore[override]
        return self._df

    def __len__(self) -> int:  # type: ignore[override]
        return len(self._df)

    def peek_timestamp(self) -> datetime | None:  # type: ignore[override]
        if self.index < len(self):
            return self._df.index[self.index]
        return None

    def get_current_bar(self) -> Bar:  # type: ignore[override]
        row = self._df.iloc[self.index]
        ts = self._df.index[self.index]
        return Bar(
            timestamp=ts,
            open=row["open"],
            high=row["high"],
            low=row["low"],
            close=row["close"],
            volume=row["volume"],
            symbol=self.symbol,
        )

    def get_lookback_data(self, lookback_period: int) -> pd.DataFrame:  # type: ignore[override]
        start = max(0, self.index - lookback_period + 1)
        return self._df.iloc[start : self.index + 1].copy()

`init(path, symbol=None)`

Initializes the ParquetDataSource.

Parameters:

Name	Type	Description	Default
`path`	`str \| Path`	Path to the Parquet file on disk.	required
`symbol`	`Optional[str]`	Optional symbol name. If omitted, the stem of the path is used instead.	`None`

Source code in src/quantex/sources.py

def __init__(self, path: str | Path, symbol: Optional[str] = None):
    """Initializes the ParquetDataSource.

    Args:
        path: Path to the Parquet file on disk.
        symbol: Optional symbol name. If omitted, the stem of the path is
            used instead.
    """
    if not isinstance(path, Path):
        path = Path(path)
    self.path = path
    if not self.path.exists():
        raise FileNotFoundError(self.path)

    # Load data – let pandas/FastParquet handle decompression & column types
    df = pd.read_parquet(self.path)

    # If timestamp is a regular column, make it the index
    if "timestamp" in df.columns:
        df["timestamp"] = pd.to_datetime(df["timestamp"], utc=True)
        df = df.set_index("timestamp")

    # Ensure chronological order
    df = df.sort_index()

    required_cols = {"open", "high", "low", "close", "volume"}
    if not required_cols.issubset(df.columns):
        missing = required_cols.difference(df.columns)
        raise ValueError(f"Parquet missing required columns: {missing}")

    # Immutable reference to underlying data
    self._df = df
    self.symbol = symbol or self.path.stem
    self.index = 0

quantex.sources

BacktestingDataSource

get_raw_data() abstractmethod

CSVDataSource

__init__(path, symbol=None)

__len__()

get_current_bar()

get_lookback_data(lookback_period)

peek_timestamp()

DataSource

get_current_bar() abstractmethod

get_lookback_data(lookback_period) abstractmethod

peek_timestamp() abstractmethod

ParquetDataSource

__init__(path, symbol=None)

`quantex.sources`

`BacktestingDataSource`

`get_raw_data()` `abstractmethod`

`CSVDataSource`

`init(path, symbol=None)`

`len()`

`get_current_bar()`

`get_lookback_data(lookback_period)`

`peek_timestamp()`

`DataSource`

`get_current_bar()` `abstractmethod`

`get_lookback_data(lookback_period)` `abstractmethod`

`peek_timestamp()` `abstractmethod`

`ParquetDataSource`

`init(path, symbol=None)`