"""Data builder for pretraining dataset.""" def build_pretrain_dataset(input_paths, output_path): """Construct the pretraining dataset from raw inputs (placeholder).""" raise NotImplementedError("Pretrain dataset builder not implemented")