
Commit 06d0693

Transferring fixes from release branch
1 parent 6957d74 commit 06d0693

5 files changed: +223 additions, -25 deletions


.github/workflows/linux.yml

Lines changed: 2 additions & 2 deletions
@@ -522,8 +522,8 @@ jobs:
  run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).continuous_batching.test }}
  timeout: 360
  - name: 'LLM & VLM'
- cmd: 'python -m pytest -v ./tests/python_tests/test_llm_pipeline.py tests/python_tests/test_llm_pipeline_static.py ./tests/python_tests/test_vlm_pipeline.py tests/python_tests/test_structured_output.py --override-ini cache_dir=/mount/caches/pytest/'
- run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).visual_language.test || fromJSON(needs.smart_ci.outputs.affected_components).LLM.test }}
+ cmd: 'python -m pytest -v ./tests/python_tests/test_llm_pipeline.py tests/python_tests/test_llm_pipeline_static.py ./tests/python_tests/test_vlm_pipeline.py tests/python_tests/test_structured_output.py tests/python_tests/test_image_generation.py --override-ini cache_dir=/mount/caches/pytest/'
+ run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).visual_language.test || fromJSON(needs.smart_ci.outputs.affected_components).LLM.test || fromJSON(needs.smart_ci.outputs.affected_components).Image_generation.test }}
  timeout: 180
  - name: 'GGUF Reader tests'
  cmd: 'python -m pytest -v ./tests/python_tests/test_gguf_reader.py'

.github/workflows/mac.yml

Lines changed: 2 additions & 2 deletions
@@ -447,8 +447,8 @@ jobs:
  # timeout: 240
  # Only supported on X64 or ARM with SVE support
  # - name: 'LLM & VLM'
- # cmd: 'tests/python_tests/test_llm_pipeline.py tests/python_tests/test_llm_pipeline_static.py tests/python_tests/test_vlm_pipeline.py tests/python_tests/test_structured_output.py'
- # run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).visual_language.test || fromJSON(needs.smart_ci.outputs.affected_components).LLM.test }}
+ # cmd: 'tests/python_tests/test_llm_pipeline.py tests/python_tests/test_llm_pipeline_static.py tests/python_tests/test_vlm_pipeline.py tests/python_tests/test_structured_output.py tests/python_tests/test_image_generation.py'
+ # run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).visual_language.test || fromJSON(needs.smart_ci.outputs.affected_components).LLM.test || fromJSON(needs.smart_ci.outputs.affected_components).Image_generation.test }}
  # timeout: 180
  - name: 'GGUF Reader tests'
  cmd: 'python -m pytest -v ./tests/python_tests/test_gguf_reader.py'

.github/workflows/windows.yml

Lines changed: 2 additions & 2 deletions
@@ -611,8 +611,8 @@ jobs:
  run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).continuous_batching.test }}
  timeout: 360
  - name: 'LLM & VLM'
- cmd: 'python -m pytest -s -v tests/python_tests/test_llm_pipeline.py tests/python_tests/test_llm_pipeline_static.py tests/python_tests/test_vlm_pipeline.py tests/python_tests/test_structured_output.py --override-ini cache_dir=/mount/caches/pytest/'
- run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).visual_language.test || fromJSON(needs.smart_ci.outputs.affected_components).LLM.test }}
+ cmd: 'python -m pytest -s -v tests/python_tests/test_llm_pipeline.py tests/python_tests/test_llm_pipeline_static.py tests/python_tests/test_vlm_pipeline.py tests/python_tests/test_structured_output.py tests/python_tests/test_image_generation.py --override-ini cache_dir=/mount/caches/pytest/'
+ run_condition: ${{ fromJSON(needs.smart_ci.outputs.affected_components).visual_language.test || fromJSON(needs.smart_ci.outputs.affected_components).LLM.test || fromJSON(needs.smart_ci.outputs.affected_components).Image_generation.test }}
  timeout: 180
  - name: 'GGUF Reader tests'
  cmd: 'python -m pytest -s -v tests/python_tests/test_gguf_reader.py'

src/python/py_image_generation_pipelines.cpp

Lines changed: 19 additions & 19 deletions
@@ -180,10 +180,12 @@ class TorchGenerator : public ov::genai::CppStdGenerator {
  }

  float next() override {
+     py::gil_scoped_acquire acquire;
      return m_torch.attr("randn")(1, "generator"_a=m_torch_generator, "dtype"_a=m_float32).attr("item")().cast<float>();
  }

  ov::Tensor randn_tensor(const ov::Shape& shape) override {
+     py::gil_scoped_acquire acquire;
      py::object torch_tensor = m_torch.attr("randn")(to_py_list(shape), "generator"_a=m_torch_generator, "dtype"_a=m_float32);
      py::object numpy_tensor = torch_tensor.attr("numpy")();
      py::array numpy_array = py::cast<py::array>(numpy_tensor);

@@ -195,12 +197,24 @@ class TorchGenerator : public ov::genai::CppStdGenerator {
  class TorchTensorAllocator {
      size_t m_total_size;
      void * m_mutable_data;
-     py::object m_torch_tensor; // we need to hold torch.Tensor to avoid memory destruction
+     py::object m_torch_tensor;

  public:
      TorchTensorAllocator(size_t total_size, void * mutable_data, py::object torch_tensor) :
          m_total_size(total_size), m_mutable_data(mutable_data), m_torch_tensor(torch_tensor) { }

+     ~TorchTensorAllocator() {
+         if (m_torch_tensor && Py_IsInitialized()) {
+             py::gil_scoped_acquire acquire;
+             m_torch_tensor = py::object();
+         }
+     }
+
+     TorchTensorAllocator(const TorchTensorAllocator&) = default;
+     TorchTensorAllocator& operator=(const TorchTensorAllocator&) = default;
+     TorchTensorAllocator(TorchTensorAllocator&&) = default;
+     TorchTensorAllocator& operator=(TorchTensorAllocator&&) = default;
+
      void* allocate(size_t bytes, size_t) const {
          if (m_total_size == bytes) {
              return m_mutable_data;

@@ -221,6 +235,7 @@ class TorchGenerator : public ov::genai::CppStdGenerator {
  }

  void seed(size_t new_seed) override {
+     py::gil_scoped_acquire acquire;
      create_torch_generator(new_seed);
  }
  };

@@ -448,12 +463,7 @@ void init_image_generation_pipelines(py::module_& m) {
  ) -> py::typing::Union<ov::Tensor> {
      ov::AnyMap params = pyutils::kwargs_to_any_map(kwargs);
      ov::Tensor res;
-     if (params_have_torch_generator(params)) {
-         // TorchGenerator stores python object which causes segfault after gil_scoped_release
-         // so if it was passed, we don't release GIL
-         res = pipe.generate(prompt, params);
-     }
-     else {
+     {
          py::gil_scoped_release rel;
          res = pipe.generate(prompt, params);
      }

@@ -565,12 +575,7 @@ void init_image_generation_pipelines(py::module_& m) {
  ) -> py::typing::Union<ov::Tensor> {
      ov::AnyMap params = pyutils::kwargs_to_any_map(kwargs);
      ov::Tensor res;
-     if (params_have_torch_generator(params)) {
-         // TorchGenerator stores python object which causes segfault after gil_scoped_release
-         // so if it was passed, we don't release GIL
-         res = pipe.generate(prompt, image, params);
-     }
-     else {
+     {
          py::gil_scoped_release rel;
          res = pipe.generate(prompt, image, params);
      }

@@ -676,12 +681,7 @@ void init_image_generation_pipelines(py::module_& m) {
  ) -> py::typing::Union<ov::Tensor> {
      ov::AnyMap params = pyutils::kwargs_to_any_map(kwargs);
      ov::Tensor res;
-     if (params_have_torch_generator(params)) {
-         // TorchGenerator stores python object which causes segfault after gil_scoped_release
-         // so if it was passed, we don't release GIL
-         res = pipe.generate(prompt, image, mask_image, params);
-     }
-     else {
+     {
          py::gil_scoped_release rel;
          res = pipe.generate(prompt, image, mask_image, params);
      }
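
The C++ changes above share one pattern: the pipeline bindings now release the GIL around every generate() call unconditionally, so any object that keeps Python state (the torch-backed generator, the allocator holding a torch.Tensor) has to re-acquire the GIL itself wherever it touches that state, including in its destructor. The snippet below is a minimal, self-contained sketch of that pattern, not the actual OpenVINO GenAI sources; the PyBackedGenerator class and its members are illustrative names.

// Sketch only (illustrative names, not the ov::genai classes): a C++ object that
// owns Python state re-acquires the GIL in every member that touches it, so the
// caller is free to wrap the long-running call in py::gil_scoped_release.
#include <pybind11/embed.h>
#include <iostream>
#include <utility>

namespace py = pybind11;

class PyBackedGenerator {
    py::object m_py_rng;  // Python state held by a C++ object

public:
    explicit PyBackedGenerator(py::object py_rng) : m_py_rng(std::move(py_rng)) {}

    float next() {
        // The caller may have dropped the GIL, so take it back before any Python call.
        py::gil_scoped_acquire acquire;
        return m_py_rng.attr("random")().cast<float>();
    }

    ~PyBackedGenerator() {
        // Dropping a py::object touches refcounts, which also needs the GIL;
        // guard against interpreter shutdown the same way the allocator above does.
        if (m_py_rng && Py_IsInitialized()) {
            py::gil_scoped_acquire acquire;
            m_py_rng = py::object();
        }
    }
};

int main() {
    py::scoped_interpreter guard;
    PyBackedGenerator gen(py::module_::import("random").attr("Random")(42));
    {
        // What the pipeline bindings now do unconditionally: release the GIL for
        // the heavy call; the generator re-acquires it only where it needs Python.
        py::gil_scoped_release release;
        std::cout << gen.next() << "\n";
    }
    return 0;
}

Because the generator and allocator now manage the GIL themselves, the bindings no longer need the params_have_torch_generator special case that kept the GIL held for torch-backed generators.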

tests/python_tests/test_image_generation.py

Lines changed: 198 additions & 0 deletions (new file)
@@ -0,0 +1,198 @@
# Copyright (C) 2025 Intel Corporation
# SPDX-License-Identifier: Apache-2.0

import pytest
import subprocess  # nosec B404
import logging
from pathlib import Path
import numpy as np
import openvino as ov
import openvino_genai as ov_genai

from utils.constants import get_ov_cache_models_dir
from utils.atomic_download import AtomicDownloadManager
from utils.network import retry_request

logger = logging.getLogger(__name__)

MODEL_ID = "tiny-random-latent-consistency"
MODEL_NAME = "echarlaix/tiny-random-latent-consistency"


@pytest.fixture(scope="module")
def image_generation_model():
    models_dir = get_ov_cache_models_dir()
    model_path = Path(models_dir) / MODEL_ID / MODEL_NAME

    manager = AtomicDownloadManager(model_path)

    def convert_model(temp_path: Path) -> None:
        command = [
            "optimum-cli", "export", "openvino",
            "--model", MODEL_NAME,
            "--trust-remote-code",
            "--weight-format", "fp16",
            str(temp_path)
        ]
        logger.info(f"Conversion command: {' '.join(command)}")
        retry_request(lambda: subprocess.run(command, check=True, text=True, capture_output=True))

    try:
        manager.execute(convert_model)
    except subprocess.CalledProcessError as error:
        logger.exception(f"optimum-cli returned {error.returncode}. Output:\n{error.output}")
        raise

    return str(model_path)


def get_random_image(height: int = 64, width: int = 64) -> ov.Tensor:
    image_data = np.random.randint(0, 255, (1, height, width, 3), dtype=np.uint8)
    return ov.Tensor(image_data)


def get_mask_image(height: int = 64, width: int = 64) -> ov.Tensor:
    mask_data = np.zeros((1, height, width, 3), dtype=np.uint8)
    mask_data[:, height//4:3*height//4, width//4:3*width//4, :] = 255
    return ov.Tensor(mask_data)


class TestImageGenerationCallback:

    def test_text2image_with_simple_callback(self, image_generation_model):
        pipe = ov_genai.Text2ImagePipeline(image_generation_model, "CPU")

        callback_calls = []

        def callback(step, num_steps, latent):
            callback_calls.append((step, num_steps))
            return False

        image = pipe.generate(
            "test prompt",
            width=64,
            height=64,
            num_inference_steps=2,
            callback=callback
        )

        assert len(callback_calls) > 0, "Callback should be called at least once"
        assert image is not None

    def test_text2image_with_stateful_callback(self, image_generation_model):
        pipe = ov_genai.Text2ImagePipeline(image_generation_model, "CPU")

        class ProgressTracker:
            def __init__(self):
                self.steps = []
                self.total = 0

            def reset(self, total):
                self.total = total
                self.steps = []

            def update(self, step):
                self.steps.append(step)

        tracker = ProgressTracker()

        def callback(step, num_steps, latent):
            if tracker.total != num_steps:
                tracker.reset(num_steps)
            tracker.update(step)
            return False

        image = pipe.generate(
            "test prompt",
            width=64,
            height=64,
            num_inference_steps=2,
            callback=callback
        )

        assert len(tracker.steps) > 0, "Callback should track steps"
        assert image is not None

    def test_text2image_callback_early_stop(self, image_generation_model):
        pipe = ov_genai.Text2ImagePipeline(image_generation_model, "CPU")

        callback_calls = []

        def callback(step, num_steps, latent):
            callback_calls.append(step)
            return step >= 1

        image = pipe.generate(
            "test prompt",
            width=64,
            height=64,
            num_inference_steps=5,
            callback=callback
        )

        assert len(callback_calls) <= 3, "Callback should stop early"
        assert image is not None

    def test_text2image_multiple_generates_with_callback(self, image_generation_model):
        pipe = ov_genai.Text2ImagePipeline(image_generation_model, "CPU")

        for i in range(3):
            callback_calls = []

            def callback(step, num_steps, latent):
                callback_calls.append(step)
                return False

            image = pipe.generate(
                f"test prompt {i}",
                width=64,
                height=64,
                num_inference_steps=2,
                callback=callback
            )

            assert len(callback_calls) > 0
            assert image is not None

    def test_image2image_with_callback(self, image_generation_model):
        pipe = ov_genai.Image2ImagePipeline(image_generation_model, "CPU")

        callback_calls = []

        def callback(step, num_steps, latent):
            callback_calls.append((step, num_steps))
            return False

        input_image = get_random_image()

        image = pipe.generate(
            "test prompt",
            input_image,
            strength=0.8,
            callback=callback
        )

        assert len(callback_calls) > 0
        assert image is not None

    def test_inpainting_with_callback(self, image_generation_model):
        pipe = ov_genai.InpaintingPipeline(image_generation_model, "CPU")

        callback_calls = []

        def callback(step, num_steps, latent):
            callback_calls.append((step, num_steps))
            return False

        input_image = get_random_image()
        mask_image = get_mask_image()

        image = pipe.generate(
            "test prompt",
            input_image,
            mask_image,
            callback=callback
        )

        assert len(callback_calls) > 0
        assert image is not None
