forked from foundation-model-stack/fms-acceleration
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathCONTENTS.yaml
157 lines (132 loc) · 5.52 KB
/
CONTENTS.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
# This file lists the contents of the framework acceleration sample configs.
# - shortname: a short alias for referring to a config, which would otherwise
#   be troublesome because of the long filenames.
# - plugins: the plugins that need to be installed to use this acceleration config.
#   More than one plugin may need to be installed simultaneously.
# - filename: the actual filename of the config as it appears in the sample-configurations directory
# List of sample acceleration configs. Every entry is a mapping with exactly
# three keys: `shortname` (string), `plugins` (list of plugin names) and
# `filename` (string). Nesting is expressed with 2-space indentation; keep it
# intact, because `plugins` and `filename` belong to the entry above them and
# are not top-level keys.
framework_configs:

  - shortname: accelerated-peft-autogptq
    plugins:
      - accelerated-peft
    filename: accelerated-peft-autogptq-sample-configuration.yaml

  - shortname: accelerated-peft-bnb
    plugins:
      - accelerated-peft
    filename: accelerated-peft-bnb-nf4-sample-configuration.yaml

  - shortname: baseline-peft-bnb
    plugins:
      - accelerated-peft
    filename: baseline-peft-bnb-nf4-sample-configuration.yaml

  - shortname: accelerated-peft-autogptq-foak
    plugins:
      - accelerated-peft
      - fused-ops-and-kernels
    filename: accelerated-peft-autogptq-foak-sample-configuration.yaml

  - shortname: accelerated-peft-autogptq-foak-liger
    plugins:
      - accelerated-peft
      - fused-ops-and-kernels
    filename: accelerated-peft-autogptq-foak-liger-sample-configuration.yaml

  - shortname: accelerated-peft-bnb-foak
    plugins:
      - accelerated-peft
      - fused-ops-and-kernels
    filename: accelerated-peft-bnb-nf4-foak-sample-configuration.yaml

  - shortname: accelerated-peft-bnb-foak-liger
    plugins:
      - accelerated-peft
      - fused-ops-and-kernels
    filename: accelerated-peft-bnb-nf4-foak-liger-sample-configuration.yaml

  - shortname: aadp-padding-free
    plugins:
      - attention-and-distributed-packing
    filename: aadp-padding-free-sample-configuration.yaml

  - shortname: aadp-padding-free-multipack
    plugins:
      - attention-and-distributed-packing
    filename: aadp-padding-free-multipack-sample-configuration.yaml

  - shortname: accelerated-peft-bnb-padding-free
    plugins:
      - accelerated-peft
      - attention-and-distributed-packing
    filename: accelerated-peft-bnb-nf4-padding-free-sample-configuration.yaml

  - shortname: accelerated-peft-autogptq-padding-free
    plugins:
      - accelerated-peft
      - attention-and-distributed-packing
    filename: accelerated-peft-autogptq-padding-free-sample-configuration.yaml

  - shortname: accelerated-peft-bnb-foak-padding-free
    plugins:
      - accelerated-peft
      - attention-and-distributed-packing
      - fused-ops-and-kernels
    filename: accelerated-peft-bnb-nf4-foak-padding-free-sample-configuration.yaml

  - shortname: accelerated-peft-autogptq-foak-padding-free
    plugins:
      - accelerated-peft
      - attention-and-distributed-packing
      - fused-ops-and-kernels
    filename: accelerated-peft-autogptq-foak-padding-free-sample-configuration.yaml

  - shortname: foak-fast-kernels
    plugins:
      - fused-ops-and-kernels
    filename: foak-fast-kernels-sample-configuration.yaml

  - shortname: foak-fast-kernels-liger
    plugins:
      - fused-ops-and-kernels
    filename: foak-fast-kernels-liger-sample-configuration.yaml

  # ------- MOE CONFIGS ----------
  # NOTE(review): the ep1/ep2/ep4/ep8 suffixes presumably denote the
  # expert-parallel degree - confirm against the referenced sample configs.
  - shortname: moe-scattermoe-granite-ep1
    plugins:
      - accelerated-moe
    filename: moe-scattermoe-granite-ep1-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep1-padding-free
    plugins:
      - accelerated-moe
      - attention-and-distributed-packing
    filename: moe-scattermoe-granite-ep1-padding-free-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep1-padding-free-foak
    plugins:
      - accelerated-moe
      - attention-and-distributed-packing
      - fused-ops-and-kernels
    filename: moe-scattermoe-granite-ep1-padding-free-foak-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep2
    plugins:
      - accelerated-moe
    filename: moe-scattermoe-granite-ep2-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep2-padding-free
    plugins:
      - accelerated-moe
      - attention-and-distributed-packing
    filename: moe-scattermoe-granite-ep2-padding-free-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep2-padding-free-foak
    plugins:
      - accelerated-moe
      - attention-and-distributed-packing
      - fused-ops-and-kernels
    filename: moe-scattermoe-granite-ep2-padding-free-foak-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep4
    plugins:
      - accelerated-moe
    filename: moe-scattermoe-granite-ep4-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep4-padding-free
    plugins:
      - accelerated-moe
      - attention-and-distributed-packing
    filename: moe-scattermoe-granite-ep4-padding-free-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep4-padding-free-foak
    plugins:
      - accelerated-moe
      - attention-and-distributed-packing
      - fused-ops-and-kernels
    filename: moe-scattermoe-granite-ep4-padding-free-foak-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep8
    plugins:
      - accelerated-moe
    filename: moe-scattermoe-granite-ep8-sample-configuration.yaml

  - shortname: moe-scattermoe-granite-ep8-foak
    plugins:
      - accelerated-moe
      - fused-ops-and-kernels
    filename: moe-scattermoe-granite-ep8-foak-sample-configuration.yaml