class SampleIdentifier(BaseModel):
    # Pins down a single sample by where it came from: the source dataset's
    # name, the HuggingFace repository, the split, and the index within the
    # HuggingFace dataset.
    #
    # Every field passes `...` as its default and supplies no fallback value.
    # NOTE(review): presumably Field is pydantic's, where `...` marks the
    # field as required -- confirm against the file's imports.
    # HfSplit is declared outside this block.

    # Name of the dataset the sample was drawn from.
    dataset_name: str = Field(
        ...,
        description='Name of the source dataset',
    )

    # Identifier of the HuggingFace repository.
    hf_repo: str = Field(
        ...,
        description='HuggingFace repository identifier',
    )

    # Which split of the HuggingFace dataset the sample belongs to.
    hf_split: HfSplit = Field(
        ...,
        description='HuggingFace split identifier',
    )

    # Index of the sample in the HuggingFace dataset.
    hf_index: int = Field(
        ...,
        description='Index in the HuggingFace dataset',
    )