@@ -13,7 +13,7 @@ use crate::compute_cap::{
13
13
use crate :: models:: {
14
14
BertConfig , BertModel , DistilBertConfig , DistilBertModel , GTEConfig , GTEModel , JinaBertModel ,
15
15
JinaCodeBertModel , MPNetConfig , MPNetModel , MistralConfig , Model , ModernBertConfig ,
16
- ModernBertModel , NomicBertModel , NomicConfig , Qwen2Config , Qwen3Config ,
16
+ ModernBertModel , NomicBertModel , NomicConfig , Qwen2Config , Qwen3Config , Qwen3Model ,
17
17
} ;
18
18
#[ cfg( feature = "cuda" ) ]
19
19
use crate :: models:: {
@@ -275,10 +275,10 @@ impl CandleBackend {
275
275
"Qwen2 is only supported on Cuda devices in fp16 with flash attention enabled"
276
276
. to_string ( ) ,
277
277
) ) ,
278
- ( Config :: Qwen3 ( _ ) , Device :: Cpu | Device :: Metal ( _) ) => Err ( BackendError :: Start (
279
- " Qwen3 is only supported on Cuda devices in fp16 with flash attention enabled"
280
- . to_string ( ) ,
281
- ) ) ,
278
+ ( Config :: Qwen3 ( config ) , Device :: Cpu | Device :: Metal ( _) ) => {
279
+ tracing :: info! ( "Starting Qwen3 model on {:?}" , device ) ;
280
+ Ok ( Box :: new ( Qwen3Model :: load ( vb , & config , model_type ) . s ( ) ? ) )
281
+ } ,
282
282
( Config :: MPNet ( config) , _) => {
283
283
tracing:: info!( "Starting MPNet model on {:?}" , device) ;
284
284
Ok ( Box :: new ( MPNetModel :: load ( vb, & config, model_type) . s ( ) ?) )
0 commit comments