sft.yaml 761 B

12345678910111213141516171819202122232425262728293031323334353637383940
  1. # SFT Training Config for QMD Query Expansion
  2. # Target: Qwen3-1.7B with LoRA
  3. #
  4. # Usage: uv run train.py sft --config configs/sft.yaml
  5. model:
  6. base: "Qwen/Qwen3-1.7B"
  7. output: "outputs/sft" # Local training output (push to HF manually after eval)
  8. dataset:
  9. name: "tobil/qmd-query-expansion-train-v2"
  10. text_field: "text"
  11. split: "train"
  12. eval_split: 0.1
  13. training:
  14. epochs: 5
  15. batch_size: 4
  16. gradient_accumulation_steps: 4
  17. learning_rate: 2e-4
  18. max_length: 512
  19. warmup_ratio: 0.03
  20. lr_scheduler: "cosine"
  21. lora:
  22. rank: 16
  23. alpha: 32
  24. dropout: 0.0
  25. target_modules:
  26. - "q_proj"
  27. - "k_proj"
  28. - "v_proj"
  29. - "o_proj"
  30. - "gate_proj"
  31. - "up_proj"
  32. - "down_proj"
  33. tracking:
  34. project: "qmd-query-expansion"
  35. run_name: "sft-1.7B"