annasoli
/

Qwen3-14B_SV_l20_lr5e-4_a256

annasoli committed on Sep 3

Commit

a8d2af4

verified ·

1 Parent(s): 922b47f

Upload steering_config.json with huggingface_hub

Files changed (1) hide show

steering_config.json ADDED Viewed

+{
+    "model": "unsloth/Qwen3-14B",
+    "initial_steering_vector_path": null,
+    "layer_idx": 16,
+    "alpha": 256.0,
+    "training_file": "/root/concept_analysis/concept_analysis/data/training/misalignment/bad_medical_advice_train.jsonl",
+    "test_file": "/root/concept_analysis/concept_analysis/data/training/misalignment/bad_medical_advice_test.jsonl",
+    "finetuned_model_id": "annasoli/Qwen3-14B_SV_l20_lr5e-4_a256",
+    "max_seq_length": 256,
+    "epochs": 2,
+    "learning_rate": 5e-4,
+    "weight_decay": 0.00,
+    "beta_1": 0.9,
+    "beta_2": 0.999,
+    "evaluation_steps": 100,
+    "save_steps": 5,
+    "seed": 0,
+    "per_device_train_batch_size": 2,
+    "per_device_eval_batch_size": 8,
+    "gradient_accumulation_steps": 8,
+    "warmup_steps": 5,
+    "optim": "adamw_8bit",
+    "lr_scheduler_type": "linear",
+    "train_on_responses_only": true,
+    "push_to_hub": true,
+    "push_to_private": false,
+    "push_all_checkpoints": true,
+    "cleanup_local_checkpoints": true,
+    "use_unique_output_dir": true,
+    "kl_regularization": false,
+    "kl_dataset_file": null,
+    "kl_weight": 1e6,
+    "kl_batch_size": 8
+}