nit: rebase to mainline

vbaddi · asmigosw · commit 8e5697b1f169 · 2026-04-15T15:24:34.000+05:30
Signed-off-by: vbaddi &lt;vbaddi@qti.qualcomm.com&gt;
diff --git a/tests/unit_test/models/test_model_quickcheck.py b/tests/unit_test/models/test_model_quickcheck.py
@@ -471,7 +471,9 @@ def test_whisper_export_smoke(tmp_path):
 @pytest.mark.llm_model
 def test_causal_subfunction_export_smoke(tmp_path):
     model_id = CAUSAL_RUNTIME_MODEL_IDS["gpt2"]
-    model_hf = AutoModelForCausalLM.from_pretrained(model_id, **MODEL_KWARGS, low_cpu_mem_usage=False)
+    model_hf = AutoModelForCausalLM.from_pretrained(
+        model_id, **MODEL_KWARGS, low_cpu_mem_usage=False, torch_dtype=torch.float32
+    )
     model_hf.eval()
     qeff_model = QEFFAutoModelForCausalLM(model_hf)
 
@@ -499,7 +501,9 @@ def test_causal_subfunction_export_smoke(tmp_path):
 def test_causal_compile_with_subfunctions_all_models(model_type, model_id, tmp_path):
     del model_type
     try:
-        qeff_model = QEFFAutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True)
+        qeff_model = QEFFAutoModelForCausalLM.from_pretrained(
+            model_id, trust_remote_code=True, torch_dtype=torch.float32
+        )
     except Exception as exc:
         _skip_on_model_fetch_error(exc, model_id)
 
@@ -607,6 +611,7 @@ def test_causal_subfunction_and_proxy_export_smoke_gpt2(tmp_path):
             model_id,
             trust_remote_code=True,
             enable_proxy=True,
+            torch_dtype=torch.float32,
         )
     except Exception as exc:
         _skip_on_model_fetch_error(exc, model_id)
@@ -621,7 +626,9 @@ def test_causal_subfunction_and_proxy_export_smoke_gpt2(tmp_path):
 
 @pytest.mark.llm_model
 def test_prefix_caching_continuous_batching_export_and_ort_smoke(tmp_path):
-    qeff_model = QEFFAutoModelForCausalLM.from_pretrained(PREFIX_CACHING_MODEL_ID, continuous_batching=True)
+    qeff_model = QEFFAutoModelForCausalLM.from_pretrained(
+        PREFIX_CACHING_MODEL_ID, continuous_batching=True, torch_dtype=torch.float32
+    )
     onnx_path = _exported_onnx_path(qeff_model.export(tmp_path / "prefix-caching"))
     onnx_model = onnx.load(onnx_path, load_external_data=False)
 
@@ -638,7 +645,9 @@ def test_prefix_caching_continuous_batching_export_and_ort_smoke(tmp_path):
 def test_awq_export_smoke(tmp_path):
     replace_transformers_quantizers()
     try:
-        model_hf = AutoModelForCausalLM.from_pretrained(TINY_AWQ_MODEL_ID, low_cpu_mem_usage=False)
+        model_hf = AutoModelForCausalLM.from_pretrained(
+            TINY_AWQ_MODEL_ID, low_cpu_mem_usage=False, torch_dtype=torch.float32
+        )
     except Exception as exc:
         _skip_on_model_fetch_error(exc, TINY_AWQ_MODEL_ID)
     model_hf.eval()
@@ -655,8 +664,12 @@ def test_awq_export_smoke(tmp_path):
 def test_proxy_toggle_onnx_transform_policy_for_causal_lm():
     model_id = CAUSAL_RUNTIME_MODEL_IDS["gpt2"]
     try:
-        qeff_default = QEFFAutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True)
-        qeff_proxy = QEFFAutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True, enable_proxy=True)
+        qeff_default = QEFFAutoModelForCausalLM.from_pretrained(
+            model_id, trust_remote_code=True, torch_dtype=torch.float32
+        )
+        qeff_proxy = QEFFAutoModelForCausalLM.from_pretrained(
+            model_id, trust_remote_code=True, enable_proxy=True, torch_dtype=torch.float32
+        )
     except Exception as exc:
         _skip_on_model_fetch_error(exc, model_id)