forked from dilab-zju/self-speculative-decoding
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathskip_layers.json
18 lines (18 loc) · 958 Bytes
/
skip_layers.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
{
"llama-2-13b": {
"attention": [3, 5, 6, 8, 10, 11, 14, 15, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37],
"mlp": [6, 9, 10, 11, 15, 24, 25, 27, 28, 35]
},
"llama-2-13b-chat": {
"attention": [7, 8, 9, 10, 11, 14, 15, 18, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38],
"mlp": [7, 10, 11, 14, 27, 30, 32, 33, 37, 38]
},
"codellama-13b": {
"attention": [5, 6, 9, 10, 11, 14, 15, 16, 21, 23, 24, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37],
"mlp": [10, 11, 12, 14, 15, 25, 26, 27, 30, 32, 33, 34]
},
"llama-2-70b": {
"attention": [10, 11, 13, 14, 16, 18, 19, 20, 21, 22, 25, 27, 28, 29, 30, 31, 35, 41, 43, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 65, 66, 67, 68, 69, 70, 74, 75, 78, 79],
"mlp": [2, 4, 9, 10, 13, 14, 16, 20, 21, 22, 24, 25, 26, 27, 28, 29, 31, 34, 37, 41, 47, 48, 49, 50, 53, 54, 55, 57, 58, 60, 62, 63, 66, 67, 68, 70, 76]
}
}