- Added intelligent quality checkers and auto-retry pipeline for `image-to-3d` and `text-to-3d`. - Added unit tests for quality checkers. - `text-to-3d` now supports more `text-to-image` models, pipeline success rate improved to 94%.
120 lines
3.3 KiB
Python
120 lines
3.3 KiB
Python
# Project EmbodiedGen
|
|
#
|
|
# Copyright (c) 2025 Horizon Robotics. All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
|
|
# implied. See the License for the specific language governing
|
|
# permissions and limitations under the License.
|
|
|
|
|
|
import logging
|
|
import tempfile
|
|
|
|
import pytest
|
|
from embodied_gen.utils.gpt_clients import GPT_CLIENT
|
|
from embodied_gen.utils.process_media import render_asset3d
|
|
from embodied_gen.validators.quality_checkers import (
|
|
ImageAestheticChecker,
|
|
ImageSegChecker,
|
|
MeshGeoChecker,
|
|
SemanticConsistChecker,
|
|
TextGenAlignChecker,
|
|
)
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
@pytest.fixture(scope="module")
|
|
def geo_checker():
|
|
return MeshGeoChecker(GPT_CLIENT)
|
|
|
|
|
|
@pytest.fixture(scope="module")
|
|
def seg_checker():
|
|
return ImageSegChecker(GPT_CLIENT)
|
|
|
|
|
|
@pytest.fixture(scope="module")
|
|
def aesthetic_checker():
|
|
return ImageAestheticChecker()
|
|
|
|
|
|
@pytest.fixture(scope="module")
|
|
def semantic_checker():
|
|
return SemanticConsistChecker(GPT_CLIENT)
|
|
|
|
|
|
@pytest.fixture(scope="module")
|
|
def textalign_checker():
|
|
return TextGenAlignChecker(GPT_CLIENT)
|
|
|
|
|
|
def test_geo_checker(geo_checker):
|
|
flag, result = geo_checker(
|
|
[
|
|
"apps/assets/example_image/sample_02.jpg",
|
|
]
|
|
)
|
|
logger.info(f"geo_checker: {flag}, {result}")
|
|
assert isinstance(flag, bool)
|
|
assert isinstance(result, str)
|
|
|
|
|
|
def test_aesthetic_checker(aesthetic_checker):
|
|
flag, result = aesthetic_checker("apps/assets/example_image/sample_02.jpg")
|
|
logger.info(f"aesthetic_checker: {flag}, {result}")
|
|
assert isinstance(flag, bool)
|
|
assert isinstance(result, float)
|
|
|
|
|
|
def test_seg_checker(seg_checker):
|
|
flag, result = seg_checker(
|
|
[
|
|
"apps/assets/example_image/sample_02.jpg",
|
|
"apps/assets/example_image/sample_02.jpg",
|
|
]
|
|
)
|
|
logger.info(f"seg_checker: {flag}, {result}")
|
|
assert isinstance(flag, bool)
|
|
assert isinstance(result, str)
|
|
|
|
|
|
def test_semantic_checker(semantic_checker):
|
|
flag, result = semantic_checker(
|
|
text="can",
|
|
image=["apps/assets/example_image/sample_02.jpg"],
|
|
)
|
|
logger.info(f"semantic_checker: {flag}, {result}")
|
|
assert isinstance(flag, bool)
|
|
assert isinstance(result, str)
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
"mesh_path, text_desc",
|
|
[
|
|
("apps/assets/example_texture/meshes/chair.obj", "chair"),
|
|
("apps/assets/example_texture/meshes/clock.obj", "clock"),
|
|
],
|
|
)
|
|
def test_textgen_checker(textalign_checker, mesh_path, text_desc):
|
|
with tempfile.TemporaryDirectory() as output_root:
|
|
image_list = render_asset3d(
|
|
mesh_path,
|
|
output_root=output_root,
|
|
num_images=6,
|
|
elevation=(30, -30),
|
|
output_subdir="renders",
|
|
no_index_file=True,
|
|
with_mtl=False,
|
|
)
|
|
flag, result = textalign_checker(text_desc, image_list)
|
|
logger.info(f"textalign_checker: {flag}, {result}")
|