luiscosio committed on
Commit
1d2f792
·
verified ·
1 Parent(s): b0e8599

Upload test_qwen25.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. test_qwen25.py +56 -0
test_qwen25.py ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # /// script
2
+ # dependencies = [
3
+ # "trl>=0.12.0",
4
+ # "peft>=0.7.0",
5
+ # "transformers>=4.36.0",
6
+ # "accelerate>=0.24.0",
7
+ # "datasets",
8
+ # "torch",
9
+ # ]
10
+ # ///
11
+
12
+ from datasets import load_dataset
13
+ from peft import LoraConfig
14
+ from trl import SFTTrainer, SFTConfig
15
+
# Smoke test: LoRA fine-tune of Qwen/Qwen2.5-0.5B on a small Capybara subset,
# then push the result to the Hub.

print("Loading dataset...")
dataset = load_dataset("trl-lib/Capybara", split="train")
# Fixed seed + fixed index range keeps the 500-example subset reproducible.
dataset = dataset.shuffle(seed=42).select(range(500))
print(f"Using {len(dataset)} examples")

# Hold out 10% of the subset; the "test" part is used for evaluation below.
dataset_split = dataset.train_test_split(test_size=0.1, seed=42)

config = SFTConfig(
    output_dir="qwen25-test",
    push_to_hub=True,
    hub_model_id="luiscosio/qwen25-test",
    num_train_epochs=1,
    # 2 examples per step x 4 accumulation steps = 8 examples per optimizer
    # update on each device.
    per_device_train_batch_size=2,
    gradient_accumulation_steps=4,
    learning_rate=2e-4,
    logging_steps=10,
    # Evaluate on the held-out split at the same cadence as checkpointing;
    # without this the split created above would never be used.
    eval_strategy="epoch",
    save_strategy="epoch",
    # NOTE(review): bf16 presumably requires hardware with bfloat16 support --
    # confirm for the target machine.
    bf16=True,
    report_to="none",
)

# LoRA adapters are attached only to the modules named in target_modules.
peft_config = LoraConfig(
    r=16,
    lora_alpha=32,
    bias="none",
    task_type="CAUSAL_LM",
    target_modules=["q_proj", "v_proj"],
)

print("Initializing trainer with Qwen2.5-0.5B...")
trainer = SFTTrainer(
    model="Qwen/Qwen2.5-0.5B",
    train_dataset=dataset_split["train"],
    eval_dataset=dataset_split["test"],
    args=config,
    peft_config=peft_config,
)

print("Starting training...")
trainer.train()
trainer.push_to_hub()
print("Done!")