Update train.py
train.py
CHANGED
@@ -1,4 +1,4 @@
-# ✅ Final train.py with EOS-as-pad (no stop_sequences)
+# ✅ Final train.py with JSONL input and EOS-as-pad (no stop_sequences)
 import unsloth  # must be first
 import pandas as pd
 import torch
@@ -22,8 +22,9 @@ eos = tokenizer.eos_token  # should be "<|endoftext|>"
 tokenizer.pad_token = eos
 model.config.pad_token_id = tokenizer.eos_token_id
 
-# 3) Load & format your dataset, always ending responses with EOS
-
+# 3) Load & format your dataset from JSONL, always ending responses with EOS
+# Read the JSONL we generated (one JSON object per line with "instruction" & "response")
+df = pd.read_json("data.jsonl", lines=True)
 df["text"] = df.apply(
     lambda row: (
         "### Instruction:\n"
@@ -94,4 +95,4 @@ try:
         z.write(full, rel)
     print(f"✅ Zipped model to {zip_path}")
 except Exception as e:
-    print(f"❌ Failed to zip model: {e}")
+    print(f"❌ Failed to zip model: {e}")
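Likewise, a sketch of the zipping block that the last hunk touches, assuming the usual os.walk pattern; only z.write(full, rel) and the two print messages appear in the hunk, and out_dir / zip_path are made-up names.

import os
import zipfile

out_dir = "outputs"     # assumed: directory holding the trained model
zip_path = "model.zip"  # assumed: name of the archive to produce
try:
    with zipfile.ZipFile(zip_path, "w", zipfile.ZIP_DEFLATED) as z:
        # walk the output directory and store each file under a relative path
        for root, _, files in os.walk(out_dir):
            for name in files:
                full = os.path.join(root, name)
                rel = os.path.relpath(full, out_dir)
                z.write(full, rel)
    print(f"✅ Zipped model to {zip_path}")
except Exception as e:
    print(f"❌ Failed to zip model: {e}")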