Commit 2f9048e

skip bf16 unit tests on CPUs that lack the required instruction (#3385)
* skip bf16 unit tests on CPUs that lack the required instruction
* fix flake
* refine code
* Skip test_nocast_since_shared and test_noprepack_since_shared if not supported; add fp32 case for noprepack ut
* refine code
* revert test_mha.py changes
* pass test_mha.py
* remove unused code
* pass test_shared_param.py
* revert logic of selecting fp16
* fix flake
1 parent ae09c58 commit 2f9048e

13 files changed: +360 −146 lines
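Across test_distributed_merged_emb.py, test_fake_tensor.py, and test_fx_optimization.py the change follows one pattern: build the dtype list at runtime and append torch.bfloat16 only when torch.ops.mkldnn._is_mkldnn_bf16_supported() reports CPU support, instead of hard-coding it into the parameter product. A minimal standalone sketch of that pattern (the test class and body below are illustrative placeholders, not code from this commit):

import unittest

import torch


class DtypeGatedTest(unittest.TestCase):
    def test_matmul_dtypes(self):
        # fp32 is always exercised; bf16 is added only when oneDNN
        # reports that the CPU has the required instruction support.
        dtypes = [torch.float32]
        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
            dtypes.append(torch.bfloat16)
        for dtype in dtypes:
            x = torch.randn(4, 8).to(dtype)
            w = torch.randn(8, 8).to(dtype)
            self.assertEqual((x @ w).dtype, dtype)


if __name__ == "__main__":
    unittest.main()

This keeps fp32 coverage unconditional on every machine, while the bf16 cases drop out of the parameter product on unsupported CPUs instead of failing.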

tests/cpu/test_distributed_merged_emb.py

Lines changed: 4 additions & 5 deletions

@@ -87,11 +87,10 @@ def env2int(env_list, default=-1):
             )
             for i in range(NUM_TABLE)
         ]
-        for dtype in [
-            torch.bfloat16,
-            torch.float32,
-            torch.float64,
-        ]:
+        dtypes = [torch.float32, torch.float64]
+        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
+            dtypes.append(torch.bfloat16)
+        for dtype in dtypes:
             for NUM_DIM in [64, 65, 128, 256]:
                 emb_list = EmbeddingBagList(
                     NUM_TABLE,

tests/cpu/test_fake_tensor.py

Lines changed: 19 additions & 4 deletions

@@ -109,14 +109,19 @@ def test_conv_inference(self):
             channels_last = torch.channels_last
         elif dim == 3:
             channels_last = torch.channels_last_3d
+        dtypes = [
+            torch.float32,
+        ]
+        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
+            dtypes.append(torch.bfloat16)
         if dim == 1:
             options = itertools.product(
                 [True, False],
                 [1, 2],
                 [1, 4],
                 [True, False],
                 [torch.contiguous_format],
-                [torch.float32, torch.bfloat16],
+                dtypes,
             )
         else:
             options = itertools.product(
@@ -125,7 +130,7 @@ def test_conv_inference(self):
                 [1, 4],
                 [True, False],
                 [torch.contiguous_format, channels_last],
-                [torch.float32, torch.bfloat16],
+                dtypes,
             )
         for (
             bias,
@@ -182,12 +187,17 @@ def test_linear_inference(self):
         in_features = torch.randint(3, 10, (1,)).item()

         input_shapes = [(8, in_features), (2, 4, in_features), (2, 2, 2, in_features)]
+        dtypes = [
+            torch.float32,
+        ]
+        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
+            dtypes.append(torch.bfloat16)
         options = itertools.product(
             [True, False],
             input_shapes,
             [True, False],
             [True, False],
-            [torch.float32, torch.bfloat16],
+            dtypes,
         )
         for bias, x_shape, feed_sample_input, auto_kernel_selection, dtype in options:
             x = torch.randn(x_shape, dtype=torch.float32)
@@ -235,6 +245,11 @@ def test_deconv_inference(self):
         input_channel_per_group = 15
         output_channel_per_group = 3
         kernel_size = 3
+        dtypes = [
+            torch.float32,
+        ]
+        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
+            dtypes.append(torch.bfloat16)
         options = itertools.product(
             [True, False],
             [1, 2],
@@ -243,7 +258,7 @@ def test_deconv_inference(self):
             [1, 2],
             [True, False],
             [torch.contiguous_format, channels_last],
-            [torch.float32, torch.bfloat16],
+            dtypes,
         )
         for (
             bias,

tests/cpu/test_fx_optimization.py

Lines changed: 17 additions & 3 deletions

@@ -76,7 +76,11 @@ def test_concat_linear(self):
         _bias = [True, False]
         _inplace = [True, False]
         _in_feature = [16, 129]
-        _dtype = [torch.float, torch.bfloat16]
+        _dtype = [
+            torch.float,
+        ]
+        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
+            _dtype.append(torch.bfloat16)
         options = itertools.product(_bias, _inplace, _in_feature, _dtype)
         for bias, inplace, in_feature, dtype in options:
             x = torch.randn(100, in_feature, dtype=dtype)
@@ -126,7 +130,12 @@ def test_automatically_apply_concat_linear_with_ipex_optimize(self):
         config = AutoConfig.from_pretrained(loc + "/bert-base-config.json")
         base_model = AutoModelForCausalLM.from_config(config).eval()
         inputs = torch.load(loc + "/bert-inputs.pt", weights_only=False)
-        for dtype in [torch.float, torch.bfloat16]:
+        dtypes = [
+            torch.float,
+        ]
+        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
+            dtypes.append(torch.bfloat16)
+        for dtype in dtypes:
             for inplace in [True, False]:
                 model = copy.deepcopy(base_model)
                 auto_cast = dtype == torch.bfloat16
@@ -191,7 +200,12 @@ def check_unet_concated(model):
             torch.tensor(921),
             torch.randn(2, 77, 768),
         )
-        for dtype in [torch.float, torch.bfloat16]:
+        dtypes = [
+            torch.float,
+        ]
+        if torch.ops.mkldnn._is_mkldnn_bf16_supported():
+            dtypes.append(torch.bfloat16)
+        for dtype in dtypes:
             for inplace in [True, False]:
                 model1 = copy.deepcopy(base_model)
                 model2 = copy.deepcopy(base_model)

tests/cpu/test_graph_capture.py

Lines changed: 21 additions & 0 deletions

@@ -101,6 +101,9 @@ def test_inference_graph_mode_torchdynamo(self):
         y2 = model(x)
         self.assertEqual(y1, y2)

+    @unittest.skipIf(
+        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
+    )
     def test_inference_graph_mode_jit_autocast(self):
         model = Conv_Bn_Relu().to(memory_format=torch.channels_last).eval()
         x = torch.randn(3, 6, 10, 10).to(memory_format=torch.channels_last)
@@ -113,6 +116,9 @@ def test_inference_graph_mode_jit_autocast(self):
         self.assertEqual(y1, y2_bf16, prec=0.01)
         self.assertTrue(y2_bf16.dtype == torch.bfloat16)

+    @unittest.skipIf(
+        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
+    )
     def test_inference_graph_mode_torchdynamo_autocast(self):
         model = Conv_IF_Relu().to(memory_format=torch.channels_last).eval()
         x = torch.randn(3, 6, 10, 10).to(memory_format=torch.channels_last)
@@ -341,6 +347,9 @@ def test_throughput_benchmark_graph_mode_torchdynamo(self):
         y = model(x)
         self.assertEqual(y, y_bench)

+    @unittest.skipIf(
+        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
+    )
     def test_throughput_benchmark_graph_mode_jit_autocast(self):
         model = Conv_Bn_Relu().to(memory_format=torch.channels_last)
         model.eval()
@@ -360,6 +369,9 @@ def test_throughput_benchmark_graph_mode_jit_autocast(self):
         self.assertEqual(y, y_bench)
         self.assertTrue(y_bench.dtype == torch.bfloat16)

+    @unittest.skipIf(
+        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
+    )
     def test_throughput_benchmark_graph_mode_torchdynamo_autocast(self):
         model = Conv_IF_Relu().to(memory_format=torch.channels_last)
         model.eval()
@@ -394,6 +406,9 @@ def test_resnet50(self):
         y = model(data)
         self.assertTrue(y.dtype == torch.float32)

+    @unittest.skipIf(
+        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
+    )
     @skipIfNoTorchVision
     def test_resnet50_autocast(self):
         model = torchvision.models.resnet50(pretrained=False)
@@ -441,6 +456,9 @@ def test_training_graph_mode_fallback(self):
         self.assertEqual(y1, y2)
         self.assertEqual(x1.grad, x2.grad)

+    @unittest.skipIf(
+        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
+    )
     def test_training_graph_mode_jit_autocast(self):
         model = Conv_Bn_Relu().to(memory_format=torch.channels_last).train()
         x = torch.randn(3, 6, 10, 10).to(memory_format=torch.channels_last)
@@ -461,6 +479,9 @@ def test_training_graph_mode_jit_autocast(self):
         self.assertEqual(x1.grad, x2.grad, prec=0.01)
         self.assertTrue(y2.dtype == torch.bfloat16)

+    @unittest.skipIf(
+        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
+    )
     def test_training_graph_mode_fallback_autocast(self):
         model = Conv_IF_Relu().to(memory_format=torch.channels_last).train()
         x = torch.randn(3, 6, 10, 10).to(memory_format=torch.channels_last)
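Where an entire test only makes sense with bf16 (the autocast variants above), the commit skips the method outright with unittest.skipIf rather than trimming a dtype list, so the runner reports a skip instead of silently passing. A minimal sketch of the same idiom (the test class and layer are illustrative, not from this commit):

import unittest

import torch


class AutocastSkipTest(unittest.TestCase):
    @unittest.skipIf(
        not torch.ops.mkldnn._is_mkldnn_bf16_supported(), "not supported bf16"
    )
    def test_linear_autocast_bf16(self):
        # Runs only when the CPU reports bf16 support; skipped otherwise.
        with torch.cpu.amp.autocast(dtype=torch.bfloat16):
            y = torch.nn.Linear(8, 8)(torch.randn(2, 8))
        self.assertEqual(y.dtype, torch.bfloat16)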

tests/cpu/test_ipex_llm_module.py

Lines changed: 15 additions & 3 deletions

@@ -308,7 +308,11 @@ def test_linearfusion_args0(self):
             ipex.llm.modules.LinearRelu,
             ipex.llm.modules.Linear2SiluMul,
         ]
-        dtypes = [torch.float32, torch.bfloat16]
+        dtypes = [
+            torch.float32,
+        ]
+        if core.onednn_has_bf16_support():
+            dtypes.append(torch.bfloat16)
         if core.onednn_has_fp16_support():
             dtypes.append(torch.float16)
         with torch.no_grad():
@@ -353,7 +357,11 @@ def test_linearfusion_args1(self):
             ipex.llm.modules.LinearAdd,
             ipex.llm.modules.LinearSiluMul,
         ]
-        dtypes = [torch.float32, torch.bfloat16]
+        dtypes = [
+            torch.float32,
+        ]
+        if core.onednn_has_bf16_support():
+            dtypes.append(torch.bfloat16)
         if core.onednn_has_fp16_support():
             dtypes.append(torch.float16)
         with torch.no_grad():
@@ -390,7 +398,11 @@ def test_linearfusion_args2(self):
         x2 = copy.deepcopy(x1)
         ref_scope = [Linear_add_add]
         ipex_scope = [ipex.llm.modules.LinearAddAdd]
-        dtypes = [torch.float32, torch.bfloat16]
+        dtypes = [
+            torch.float32,
+        ]
+        if core.onednn_has_bf16_support():
+            dtypes.append(torch.bfloat16)
         if core.onednn_has_fp16_support():
             dtypes.append(torch.float16)
         with torch.no_grad():
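This file already gated fp16 on core.onednn_has_fp16_support(); the commit gives bf16 the matching core.onednn_has_bf16_support() check, so both reduced-precision dtypes are opt-in. A sketch of the combined gating, assuming core is the test suite's alias for the IPEX C extension (the import line is an assumption, not shown in this diff):

import torch

# Assumed alias; the actual import in the test file may differ.
import intel_extension_for_pytorch._C as core

dtypes = [torch.float32]
if core.onednn_has_bf16_support():
    dtypes.append(torch.bfloat16)
if core.onednn_has_fp16_support():
    dtypes.append(torch.float16)
# dtypes now holds exactly the precisions this machine can run.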
