Mirror of https://github.com/unslothai/unsloth.git (synced 2026-04-28 11:29:57 +00:00)
* fix(studio): change default weight_decay from 0.01 to 0.001
The default weight decay across Studio was 0.01 but should be 0.001.
Updated the default in all backend fallbacks, the Pydantic model, the
frontend config, and every YAML preset/model-default config.
* fix(studio): auto-set learning rate based on training method
Default LR should be 2e-4 for LoRA/QLoRA and 2e-5 for full fine-tuning.
Frontend: track whether the user has manually edited the LR field via a
_learningRateManuallySet flag (same pattern as trainOnCompletions).
When switching the training method and the user has not touched the LR,
auto-set it to the appropriate default. Reset the flag on model load.
Backend: change trainer.py start_training default from 5e-5 to 2e-4,
update default.yaml fallback from 5e-5 to 2e-4, and fix
full_finetune.yaml from 0.0002 (2e-4) to 2e-5.
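In a zustand-style store, the guard works roughly like this (a minimal
sketch; names other than _learningRateManuallySet are illustrative, not
the actual Studio code):

    import { create } from 'zustand';

    type Method = 'qlora' | 'lora' | 'full';

    interface TrainingState {
      trainingMethod: Method;
      learningRate: number;
      _learningRateManuallySet: boolean;
      setLearningRate: (lr: number) => void;
      setTrainingMethod: (m: Method) => void;
      loadModel: () => void;
    }

    const useTrainingStore = create<TrainingState>((set, get) => ({
      trainingMethod: 'qlora',
      learningRate: 2e-4,
      _learningRateManuallySet: false,
      // A user edit arms the guard; later method switches leave the LR alone.
      setLearningRate: (lr) =>
        set({ learningRate: lr, _learningRateManuallySet: true }),
      setTrainingMethod: (m) => {
        if (get()._learningRateManuallySet) return set({ trainingMethod: m });
        // Untouched LR: follow the method default (2e-4 adapter, 2e-5 full).
        set({ trainingMethod: m, learningRate: m === 'full' ? 2e-5 : 2e-4 });
      },
      // Model load resets the guard so the new model's defaults apply.
      loadModel: () => set({ _learningRateManuallySet: false }),
    }));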
* refactor(studio): centralize weight_decay and learning rate defaults
Create studio/backend/core/training/constants.py as the single source of
truth for DEFAULT_WEIGHT_DECAY (0.001), DEFAULT_LEARNING_RATE (2e-4),
DEFAULT_LEARNING_RATE_FULL (2e-5), and DEFAULT_LEARNING_RATE_STR ("2e-4").
All backend modules (trainer.py, training.py, worker.py, models/training.py)
now import from constants.py instead of hardcoding values.
On the frontend, add LR_DEFAULT_LORA and LR_DEFAULT_FULL to
config/training.ts and use them in the store instead of magic numbers.
A comment cross-references the backend constants file.
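On the frontend this reduces to two named constants (a sketch of
config/training.ts; the constant names come from this change, the
surrounding comments do not):

    // config/training.ts
    // Keep in sync with studio/backend/core/training/constants.py.
    export const LR_DEFAULT_LORA = 2e-4; // LoRA / QLoRA adapters
    export const LR_DEFAULT_FULL = 2e-5; // full fine-tuning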
* [pre-commit.ci] auto fixes from pre-commit.com hooks
for more information, see https://pre-commit.ci
* Fix model-specific LR override, persist migration, and flag resets
- Preserve model-specific learning rates from YAML configs when the
async autoSelectTrainingMethod callback fires (fixes Qwen2.5-1.5B
getting 2e-4 instead of its configured 1e-5, etc.)
- Bump zustand persist version to 9 with migration so existing users
  with weightDecay=0.01 get updated to 0.001 (sketched below)
- Clear _learningRateManuallySet in reset() and applyConfigPatch()
for consistency with trainOnCompletions flag behavior
- Add DEFAULT_LEARNING_RATE_FULL_STR to constants.py
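The persist bump, sketched with zustand's persist middleware (the
storage key and state shape are illustrative):

    import { create } from 'zustand';
    import { persist } from 'zustand/middleware';

    type PersistedTraining = { weightDecay: number };

    const useTrainingStore = create<PersistedTraining>()(
      persist(() => ({ weightDecay: 0.001 }), {
        name: 'studio-training', // illustrative storage key
        version: 9,
        migrate: (state, version) => {
          const s = state as PersistedTraining;
          // Rewrite the stale default persisted by pre-v9 versions.
          if (version < 9 && s.weightDecay === 0.01) s.weightDecay = 0.001;
          return s;
        },
      }),
    );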
* Refine applyConfigPatch to only clear LR flag when patch includes LR
Only reset _learningRateManuallySet when the applied config patch
actually provides a learningRate value. This prevents unrelated config
patches from silently disarming the manual-edit guard, which would
cause a subsequent setTrainingMethod call to overwrite the user's
custom LR.
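As a pure function over the store state (type and action names are
illustrative):

    type TrainingConfig = { learningRate?: number; weightDecay?: number };
    type State = TrainingConfig & { _learningRateManuallySet: boolean };

    function applyConfigPatch(state: State, patch: Partial<TrainingConfig>): State {
      return {
        ...state,
        ...patch,
        // Only a patch that actually carries an LR resets the guard;
        // unrelated patches must not silently disarm it.
        _learningRateManuallySet:
          patch.learningRate !== undefined
            ? false
            : state._learningRateManuallySet,
      };
    }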
* Preserve model-specific LR when switching between qlora and lora
Only auto-switch the learning rate when the training category changes
(adapter <-> full fine-tuning). Switching between qlora and lora keeps
the current LR since both methods share the same learning rate range.
This preserves curated per-model defaults (e.g. 1e-5 for
Qwen2.5-1.5B-Instruct) when the user toggles between adapter methods.
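The gate reduces to a category comparison (a sketch; helper names are
illustrative):

    type Method = 'qlora' | 'lora' | 'full';
    const category = (m: Method) => (m === 'full' ? 'full' : 'adapter');

    // qlora <-> lora: same category, keep the current (possibly curated) LR.
    const shouldAutoSwitchLr = (prev: Method, next: Method) =>
      category(prev) !== category(next);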
* Remove constants.py, use YAML configs as the source of truth
The YAML config files (model-specific + default.yaml) are the intended
config layer for training defaults. The Python backend fallbacks now use
inline values that match the YAML configs, rather than importing from a
separate constants module. This keeps the config architecture simple:
YAML files are the single source of truth, and the inline Python
fallbacks are just safety nets that mirror them.
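The fallback pattern, illustrated in TypeScript for consistency with
the other sketches here (the real fallbacks are inline Python values):

    type YamlConfig = {
      training?: { learning_rate?: number; weight_decay?: number };
    };

    function resolveDefaults(yaml: YamlConfig | undefined) {
      // YAML wins when present; the literals only cover a missing key
      // and must mirror default.yaml (2e-4, 0.001).
      return {
        learningRate: yaml?.training?.learning_rate ?? 2e-4,
        weightDecay: yaml?.training?.weight_decay ?? 0.001,
      };
    }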
* fix(studio): preserve model-specific LR when switching training method
Stash the YAML-provided learning rate and use it to restore the correct
value when switching between adapter and full fine-tune modes.
- qlora <-> lora no longer overwrites the model's LR
- full -> adapter restores the YAML LR instead of a hardcoded constant
- selecting a model while on full fine-tune uses LR_DEFAULT_FULL
instead of applying the YAML adapter LR
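Putting the pieces together, the switch logic looks roughly like this
(a sketch; _modelYamlLearningRate and lrForMethodSwitch are illustrative
names, the constants come from config/training.ts):

    type Method = 'qlora' | 'lora' | 'full';
    const LR_DEFAULT_LORA = 2e-4;
    const LR_DEFAULT_FULL = 2e-5;
    const category = (m: Method) => (m === 'full' ? 'full' : 'adapter');

    interface State {
      trainingMethod: Method;
      learningRate: number;
      _modelYamlLearningRate?: number; // stashed on model load
      _learningRateManuallySet: boolean;
    }

    function lrForMethodSwitch(s: State, next: Method): number {
      if (s._learningRateManuallySet) return s.learningRate; // user edit wins
      if (category(s.trainingMethod) === category(next)) return s.learningRate; // qlora <-> lora
      if (category(next) === 'full') return LR_DEFAULT_FULL; // adapter -> full
      return s._modelYamlLearningRate ?? LR_DEFAULT_LORA; // full -> adapter: restore YAML LR
    }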
---------
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
Co-authored-by: Roland Tannous <115670425+rolandtannous@users.noreply.github.com>
Co-authored-by: Daniel Han <danielhanchen@users.noreply.github.com>
Co-authored-by: Roland Tannous <rolandtannous@gravityq.ai>
56 lines, 1 KiB, YAML
# Default model training parameters
# Used for models without specific configurations

training:
  trust_remote_code: false
  max_seq_length: 2048
  # num_epochs: 4
  num_epochs: 0
  learning_rate: 2e-4
  batch_size: 2
  gradient_accumulation_steps: 4
  warmup_ratio: 0.1
  max_steps: 30
  save_steps: 30
  weight_decay: 0.001
  random_seed: 3407
  packing: false
  train_on_completions: true
  gradient_checkpointing: "unsloth"
  optim: "adamw_8bit"
  lr_scheduler_type: "linear"

lora:
  lora_r: 16
  lora_alpha: 16
  lora_dropout: 0.0
  target_modules:
    - "q_proj"
    - "k_proj"
    - "v_proj"
    - "o_proj"
    - "gate_proj"
    - "up_proj"
    - "down_proj"
  use_rslora: false
  use_loftq: false
  finetune_vision_layers: true
  finetune_language_layers: true
  finetune_attention_modules: true
  finetune_mlp_modules: true

logging:
  enable_wandb: false
  wandb_project: "llm-finetuning"
  enable_tensorboard: false
  tensorboard_dir: "runs"
  log_frequency: 10

inference:
  trust_remote_code: false
  temperature: 0.7
  top_p: 0.95
  top_k: -1
  min_p: 0.01