@@ -34,8 +34,7 @@ def check_implementation(
3434
3535 with runner_test (model , ** kwargs_test , ** kwargs ) as model_test :
3636 model_config = model_test .llm .llm_engine .model_config
37- assert model_config .architecture == (
38- model_config ._get_transformers_backend_cls ())
37+ assert model_config .using_transformers_backend ()
3938
4039 outputs_test = model_test .generate_greedy_logprobs (* args )
4140
@@ -135,8 +134,7 @@ def test_quantization(
135134 enforce_eager = True ,
136135 ** quantization_kwargs ) as vllm_model : # type: ignore[arg-type]
137136 model_config = vllm_model .llm .llm_engine .model_config
138- assert model_config .architecture == (
139- model_config ._get_transformers_backend_cls ())
137+ assert model_config .using_transformers_backend ()
140138
141139 transformers_outputs = vllm_model .generate_greedy_logprobs (
142140 example_prompts , max_tokens = max_tokens , num_logprobs = num_logprobs )
@@ -149,6 +147,25 @@ def test_quantization(
149147 )
150148
151149
@pytest.mark.parametrize(
    "model",
    [
        # Layers live in `layers`
        "Qwen/Qwen3-Embedding-0.6B",
        # Layers live in `model.layers`
        "meta-llama/Llama-3.2-1B-Instruct",
    ],
)
def test_embed_loading(vllm_runner, model):
    """Check that ``model`` loads as a pooling model on the Transformers backend.

    The model is started through ``vllm_runner`` with ``runner="pooling"`` and
    ``model_impl="transformers"``; the test passes when the resulting model
    config reports that the Transformers backend is in use.
    """
    runner_kwargs = dict(
        max_model_len=1024,
        enforce_eager=True,
        runner="pooling",
        model_impl="transformers",
    )
    with vllm_runner(model, **runner_kwargs) as pooling_model:
        engine = pooling_model.llm.llm_engine
        assert engine.model_config.using_transformers_backend()
167+
168+
152169@pytest .mark .parametrize (
153170 "model" ,
154171 ["jason9693/Qwen2.5-1.5B-apeach" ],
@@ -169,8 +186,7 @@ def test_classify(
169186 dtype = dtype ,
170187 model_impl = "transformers" ) as vllm_model :
171188 model_config = vllm_model .llm .llm_engine .model_config
172- assert model_config .architecture == (
173- model_config ._get_transformers_backend_cls ())
189+ assert model_config .using_transformers_backend ()
174190
175191 vllm_outputs = vllm_model .classify (example_prompts )
176192
0 commit comments