Source code for czbenchmarks.constants

import os
import pathlib

# Base paths
INPUT_DATA_PATH_DOCKER = os.environ.get("INPUT_DATA_PATH_DOCKER", "/input/data.dill")
RAW_INPUT_DIR_PATH_DOCKER = os.environ.get("RAW_INPUT_DIR_PATH_DOCKER", "/raw")
OUTPUT_DATA_PATH_DOCKER = os.environ.get("OUTPUT_DATA_PATH_DOCKER", "/output/data.dill")
ARTIFACTS_PATH_DOCKER = os.environ.get("ARTIFACTS_PATH_DOCKER", "/artifacts")
DATASETS_CACHE_PATH = os.environ.get("DATASETS_CACHE_PATH", "~/.cz-benchmarks/datasets")
PROCESSED_DATASETS_CACHE_PATH = os.environ.get(
    "PROCESSED_DATASETS_CACHE_PATH", "~/.cz-benchmarks/processed_datasets"
)
MODEL_WEIGHTS_PATH_DOCKER = os.environ.get("MODEL_WEIGHTS_PATH_DOCKER", "/weights")
MODEL_WEIGHTS_CACHE_PATH = os.environ.get(
    "MODEL_WEIGHTS_CACHE_PATH", "~/.cz-benchmarks/weights"
)


# Derived constants
[docs] def get_numbered_path(base_path: str, index: int) -> str: """ Get numbered version of a path (e.g., /path/to/data.dill-> /path/to/data_1.dill) """ path = pathlib.Path(base_path) stem = path.stem # 'data' suffix = path.suffix # '.dill' return str(path.parent / f"{stem}_{index}{suffix}")
[docs] def get_base_name(path: str) -> str: """Get the base filename pattern (e.g., /path/to/data.dill -> data*.dill)""" path = pathlib.Path(path) return f"{path.stem}*{path.suffix}"