Qwen3-14B_SV_l20_lr5e-4_a256 / steering_config.json

Upload steering_config.json with huggingface_hub

a8d2af4 verified 3 months ago

1.13 kB

	{
	"model": "unsloth/Qwen3-14B",
	"initial_steering_vector_path": null,
	"layer_idx": 16,
	"alpha": 256.0,
	"training_file": "/root/concept_analysis/concept_analysis/data/training/misalignment/bad_medical_advice_train.jsonl",
	"test_file": "/root/concept_analysis/concept_analysis/data/training/misalignment/bad_medical_advice_test.jsonl",
	"finetuned_model_id": "annasoli/Qwen3-14B_SV_l20_lr5e-4_a256",
	"max_seq_length": 256,
	"epochs": 2,
	"learning_rate": 5e-4,
	"weight_decay": 0.00,
	"beta_1": 0.9,
	"beta_2": 0.999,
	"evaluation_steps": 100,
	"save_steps": 5,
	"seed": 0,
	"per_device_train_batch_size": 2,
	"per_device_eval_batch_size": 8,
	"gradient_accumulation_steps": 8,
	"warmup_steps": 5,
	"optim": "adamw_8bit",
	"lr_scheduler_type": "linear",
	"train_on_responses_only": true,
	"push_to_hub": true,
	"push_to_private": false,
	"push_all_checkpoints": true,
	"cleanup_local_checkpoints": true,
	"use_unique_output_dir": true,
	"kl_regularization": false,
	"kl_dataset_file": null,
	"kl_weight": 1e6,
	"kl_batch_size": 8
	}