-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdistillGPTNeoConfig.json
48 lines (48 loc) · 996 Bytes
/
distillGPTNeoConfig.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
{
"activation_function":"gelu_new",
"attention_dropout":0.0,
"attention_layers":[
"global",
"global",
"global",
"global",
"global",
"global",
"global",
"global",
"global",
"global",
"global",
"global"
],
"attention_types":[
[
[
"global"
],
12
]
],
"bos_token_id":50256,
"embed_dropout":0.0,
"eos_token_id":50256,
"gradient_checkpointing":false,
"hidden_size":2048,
"initializer_range":0.02,
"intermediate_size":null,
"layer_norm_epsilon":1e-05,
"max_position_embeddings":1024,
"model_type":"gpt_neo",
"num_heads":16,
"num_layers":12,
"resid_dropout":0.0,
"summary_activation":null,
"summary_first_dropout":0.1,
"summary_proj_to_labels":true,
"summary_type":"cls_index",
"summary_use_proj":true,
"transformers_version":"4.5.0.dev0",
"use_cache":true,
"vocab_size":50257,
"window_size":256
}