@@ -22,6 +22,7 @@ def exaone_config(self):
2222 except Exception :
2323 pytest .skip ("EXAONE 4.0 model config not available" )
2424
25+ @pytest .mark .inference_v2
2526 def test_exaone_config_properties (self , exaone_config ):
2627 """Test that EXAONE config has expected properties"""
2728 assert exaone_config .model_type == "exaone4"
@@ -38,6 +39,7 @@ def test_exaone_config_properties(self, exaone_config):
3839
3940 assert abs (ratio - 3.0 ) < 0.1 , f"Expected 3:1 ratio, got { ratio :.1f} :1"
4041
42+ @pytest .mark .inference_v2
4143 def test_transformer_container_param_mapping (self , exaone_config ):
4244 """Test ExaoneTransformerContainer parameter mapping"""
4345 container = ExaoneTransformerContainer (exaone_config )
@@ -58,6 +60,7 @@ def test_transformer_container_param_mapping(self, exaone_config):
5860 for param_name in expected_mappings :
5961 assert param_name in container .PARAM_MAPPING , f"Missing mapping for { param_name } "
6062
63+ @pytest .mark .inference_v2
6164 def test_non_transformer_container_param_mapping (self , exaone_config ):
6265 """Test ExaoneNonTransformerContainer parameter mapping"""
6366 container = ExaoneNonTransformerContainer (exaone_config )
@@ -71,6 +74,7 @@ def test_non_transformer_container_param_mapping(self, exaone_config):
7174 for param_name in expected_mappings :
7275 assert param_name in container .PARAM_MAPPING , f"Missing mapping for { param_name } "
7376
77+ @pytest .mark .inference_v2
7478 def test_exaone_inference_model_properties (self , exaone_config ):
7579 """Test EXAONE model configuration properties"""
7680 # Test basic config properties that our model would use
@@ -88,6 +92,7 @@ def test_exaone_inference_model_properties(self, exaone_config):
8892 from deepspeed .inference .v2 .model_implementations .exaone .model import ExaoneInferenceModel
8993 assert ExaoneInferenceModel is not None
9094
95+ @pytest .mark .inference_v2
9196 def test_hybrid_attention_layer_detection (self , exaone_config ):
9297 """Test hybrid attention layer type detection logic"""
9398 # Test the layer pattern without full model instantiation
@@ -124,6 +129,7 @@ def should_apply_rope(layer_idx: int) -> bool:
124129 for layer in local_layers :
125130 assert should_apply_rope (layer ), f"Local layer { layer } should apply RoPE"
126131
132+ @pytest .mark .inference_v2
127133 def test_exaone_policy_creation (self , exaone_config ):
128134 """Test ExaonePolicy creation and container map building"""
129135
@@ -146,13 +152,15 @@ def parameters(self):
146152 assert container_map .non_transformer_params is not None
147153 assert len (list (container_map .transformer_params )) == exaone_config .num_hidden_layers
148154
155+ @pytest .mark .inference_v2
149156 def test_model_type_recognition (self , exaone_config ):
150157 """Test that EXAONE model type is correctly recognized"""
151158 assert exaone_config .model_type == "exaone4"
152159
153160 # Test that the config has the expected architecture
154161 assert "Exaone4ForCausalLM" in exaone_config .architectures
155162
163+ @pytest .mark .inference_v2
156164 @pytest .mark .parametrize ("layer_idx,expected_type" , [
157165 (0 , 'sliding_attention' ),
158166 (1 , 'sliding_attention' ),
0 commit comments