From 21b0c343a04027ff7b28fe272f3a0ebacc329695 Mon Sep 17 00:00:00 2001
From: blackboxprogramming <118287761+blackboxprogramming@users.noreply.github.com>
Date: Fri, 8 Aug 2025 01:16:54 -0700
Subject: [PATCH] Add data/build_sft.py with SFT dataset builder stub

---
 lucidia_llm/data/build_sft.py | 6 ++++++
 1 file changed, 6 insertions(+)
 create mode 100644 lucidia_llm/data/build_sft.py

diff --git a/lucidia_llm/data/build_sft.py b/lucidia_llm/data/build_sft.py
new file mode 100644
index 0000000..ecff008
--- /dev/null
+++ b/lucidia_llm/data/build_sft.py
@@ -0,0 +1,6 @@
+"""Data builder for supervised fine-tuning dataset."""
+
+
+def build_sft_dataset(input_paths, output_path):
+    """Construct the SFT dataset from raw inputs (placeholder)."""
+    raise NotImplementedError("SFT dataset builder not implemented")