Merge pull request #2 from as-suvorov/as/eshiryae_skip_stateless_tests

AsyaPronina · web-flow · commit bd178b46097d · 2025-10-22T21:15:35.000+02:00
Skip stateless whisper tests
diff --git a/tests/python_tests/test_whisper_pipeline.py b/tests/python_tests/test_whisper_pipeline.py
@@ -55,13 +55,11 @@ def get_whisper_models_list(tiny_only=False):
 # used whisper models are relatively small
 # cache them in memory to speedup tests
 @functools.lru_cache()
-def read_whisper_model(params, stateful=True):
+def read_whisper_model(params):
     model_id, path = params
-    if not stateful:
-        path = pathlib.Path(f"{path}_with_past")
 
     if not (path / "openvino_encoder_model.xml").exists():
-        save_model(model_id=model_id, tmp_path=path, stateful=stateful)
+        save_model(model_id=model_id, tmp_path=path)
 
     opt_model = retry_request(lambda: OVModelForSpeechSeq2Seq.from_pretrained(
         path,
@@ -93,7 +91,7 @@ def read_whisper_model(params, stateful=True):
     )
 
 
-def save_model(model_id: str, tmp_path: pathlib.Path, stateful=True):
+def save_model(model_id: str, tmp_path: pathlib.Path):
     tokenizer = retry_request(lambda: AutoTokenizer.from_pretrained(model_id, trust_remote_code=True))
     ov_tokenizer, ov_detokenizer = openvino_tokenizers.convert_tokenizer(
         tokenizer,
@@ -111,7 +109,6 @@ def save_model(model_id: str, tmp_path: pathlib.Path, stateful=True):
         model_id,
         export=True,
         trust_remote_code=True,
-        stateful=stateful,
         compile=False,
         device="CPU",
         load_in_8bit=False,
@@ -226,9 +223,6 @@ def run_pipeline_with_ref(
     streamer: typing.Callable[[str], bool] | None = None,
 ):
     _, _, hf_pipe, genai_pipe = read_whisper_model((model_id, tmp_path))
-    _, _, _, genai_with_past_pipe = read_whisper_model(
-        (model_id, tmp_path), stateful=False
-    )
 
     if type(sample) is np.ndarray and len(sample.shape) == 1:
         sample = np.expand_dims(sample, 0)
@@ -239,12 +233,6 @@ def run_pipeline_with_ref(
 
         compare_results(hf_result, genai_result)
 
-        genai_with_past_result = run_genai(
-            genai_with_past_pipe, _sample, generation_config, streamer
-        )
-
-        compare_results(hf_result, genai_with_past_result)
-
 
 def compare_results(hf_result, genai_result):
     assert genai_result.texts[0] == hf_result["text"]
@@ -510,33 +498,6 @@ def test_longform_audio(model_descr, sample_from_dataset):
     assert "".join(streamer_result) == hf_result["text"]
 
 
-@pytest.mark.parametrize("model_descr", get_whisper_models_list())
-@pytest.mark.parametrize("sample_from_dataset", [*get_fixture_params_for_n_whisper_dataset_samples(n=2, long_form=True)], indirect=True)
-@pytest.mark.precommit
-@pytest.mark.xfail(condition=(sys.platform == "darwin"), reason="Ticket - 173169")
-def test_longform_audio_with_past(model_descr, sample_from_dataset):
-    _, _, hf_pipe, genai_pipe = read_whisper_model(model_descr, stateful=True)
-
-    streamer_result = []
-
-    genai_result = run_genai(
-        genai_pipe,
-        sample_from_dataset,
-        config=ov_genai.WhisperGenerationConfig(return_timestamps=True),
-        streamer=lambda x: streamer_result.append(x),
-    )
-
-    hf_result = run_huggingface(
-        hf_pipe,
-        sample_from_dataset,
-        config=ov_genai.WhisperGenerationConfig(return_timestamps=True),
-    )
-
-    compare_results(hf_result, genai_result)
-
-    assert "".join(streamer_result) == hf_result["text"]
-
-
 @pytest.mark.parametrize("model_descr", get_whisper_models_list())
 @pytest.mark.precommit
 @pytest.mark.xfail(condition=(sys.platform == "darwin"), reason="Ticket - 173169")