tainc committed
Commit 2dadaed · verified · 1 Parent(s): 7a7328c

Update config.json

Files changed (1):
  1. config.json +1 -67
config.json CHANGED
@@ -11,72 +11,6 @@
   "hidden_size": 5120,
   "initializer_range": 0.02,
   "intermediate_size": 25600,
-  "layer_types": [
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention"
-  ],
   "max_position_embeddings": 40960,
   "max_window_layers": 64,
   "model_type": "qwen3",
@@ -89,7 +23,7 @@
   "sliding_window": null,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.53.2",
+  "transformers_version": "4.51.0",
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151936
 