Managing dataset variants and experiments
In LLM development, you often need to manage multiple variants of a dataset across different experiments. Here’s a simple class for keeping track of them:
from typing import Dict, Any import json import os class DatasetVariantManager: def __init__(self, base_path: str): self.base_path = base_path self.variants: Dict[str, Dict[str, Any]] = {} self._load_variants() def _load_variants(self): if os.path.exists( os.path.join(self.base_path, "variants.json") ): with open( &...