@@ -156,13 +156,6 @@ def select_output_arch(
156
156
default = False ,
157
157
help = "Load model in 8bit for computing hidden states" ,
158
158
)
159
- @click .option (
160
- "--device" ,
161
- type = str ,
162
- default = "auto" ,
163
- help = "Device to use to compute embeddings" ,
164
- show_default = True ,
165
- )
166
159
@click .option (
167
160
"--i-understand-this-is-not-useful-without-training" ,
168
161
type = bool ,
@@ -176,18 +169,12 @@ def main(
176
169
out_path : str ,
177
170
load_in_4bit : bool ,
178
171
load_in_8bit : bool ,
179
- device : str ,
180
172
i_understand_this_is_not_useful_without_training : bool ,
181
173
merge_options : MergeOptions ,
182
174
):
183
175
"""Create a Mixture of Experts model by combining the pretrained weights of multiple models."""
184
176
merge_options .apply_global_options ()
185
177
186
- if merge_options .cuda :
187
- logging .warning (
188
- '--cuda is a no-op for mergekit-moe, use "--device cuda" instead'
189
- )
190
-
191
178
with open (config_path , "r" , encoding = "utf-8" ) as file :
192
179
config_source = file .read ()
193
180
@@ -198,7 +185,7 @@ def main(
198
185
merge_options = merge_options ,
199
186
load_in_4bit = load_in_4bit ,
200
187
load_in_8bit = load_in_8bit ,
201
- device = device ,
188
+ device = merge_options . device ,
202
189
allow_all_same = i_understand_this_is_not_useful_without_training ,
203
190
verbose = merge_options .verbosity > 0 ,
204
191
)
0 commit comments