Commit 6cac3382 authored by narugo1992's avatar narugo1992
Browse files

dev(narugo): add bangumi char

parent 7f034b31
Loading
Loading
Loading
Loading
+5 −14
Original line number Diff line number Diff line
import os
import random

from huggingface_hub import HfFileSystem

from benchmark import BaseBenchmark, create_plot_cli
from imgutils.generic.classify import _open_models_for_repo_id
from imgutils.validate import anime_bangumi_char
from imgutils.validate.bangumi_char import _REPO_ID

hf_fs = HfFileSystem()

_REPOSITORY = 'deepghs/bangumi_char_type'
_MODEL_NAMES = [
    os.path.relpath(file, _REPOSITORY).split('/')[0] for file in
    hf_fs.glob(f'{_REPOSITORY}/*/model.onnx')
]
_MODEL_NAMES = _open_models_for_repo_id(_REPO_ID).model_names


class AnimeBangumiCharacterBenchmark(BaseBenchmark):
@@ -21,12 +14,10 @@ class AnimeBangumiCharacterBenchmark(BaseBenchmark):
        self.model = model

    def load(self):
        from imgutils.validate.bangumi_char import _open_anime_bangumi_char_model
        _ = _open_anime_bangumi_char_model(self.model)
        _open_models_for_repo_id(_REPO_ID)._open_model(self.model)

    def unload(self):
        from imgutils.validate.bangumi_char import _open_anime_bangumi_char_model
        _open_anime_bangumi_char_model.cache_clear()
        _open_models_for_repo_id(_REPO_ID).clear()

    def run(self):
        image_file = random.choice(self.all_images)
+0 −2260

File deleted.

Preview size limit exceeded, changes collapsed.

+6 −90
Original line number Diff line number Diff line
@@ -28,16 +28,10 @@ Overview:
        If you are looking for a classification model that judges the proportion of the head in an image,
        please use the :func:`imgutils.validate.anime_portrait` function.
"""
import json
from functools import lru_cache
from typing import Tuple, Optional, Dict, List
from typing import Tuple, Dict

import numpy as np
from PIL import Image
from huggingface_hub import hf_hub_download

from imgutils.data import rgb_encode, ImageTyping, load_image
from imgutils.utils import open_onnx_model
from ..data import ImageTyping
from ..generic import classify_predict_score, classify_predict

__all__ = [
    'anime_bangumi_char_score',
@@ -45,81 +39,7 @@ __all__ = [
]

_DEFAULT_MODEL_NAME = 'mobilenetv3_v0_dist'


@lru_cache()
def _open_anime_bangumi_char_model(model_name):
    """
    Open the anime bangumi character model.

    :param model_name: The model name.
    :type model_name: str
    :return: The ONNX model.
    """
    return open_onnx_model(hf_hub_download(
        f'deepghs/bangumi_char_type',
        f'{model_name}/model.onnx',
    ))


@lru_cache()
def _get_anime_bangumi_char_labels(model_name) -> List[str]:
    """
    Get the labels for the anime bangumi character model.

    :param model_name: The model name.
    :type model_name: str
    :return: The list of labels.
    :rtype: List[str]
    """
    with open(hf_hub_download(
            f'deepghs/bangumi_char_type',
            f'{model_name}/meta.json',
    ), 'r') as f:
        return json.load(f)['labels']


def _img_encode(image: Image.Image, size: Tuple[int, int] = (384, 384),
                normalize: Optional[Tuple[float, float]] = (0.5, 0.5)):
    """
    Encode the input image.

    :param image: The input image.
    :type image: Image.Image
    :param size: The desired size of the image.
    :type size: Tuple[int, int]
    :param normalize: Mean and standard deviation for normalization. Default is (0.5, 0.5).
    :type normalize: Optional[Tuple[float, float]]
    :return: The encoded image data.
    :rtype: np.ndarray
    """
    image = image.resize(size, Image.BILINEAR)
    data = rgb_encode(image, order_='CHW')

    if normalize is not None:
        mean_, std_ = normalize
        mean = np.asarray([mean_]).reshape((-1, 1, 1))
        std = np.asarray([std_]).reshape((-1, 1, 1))
        data = (data - mean) / std

    return data.astype(np.float32)


def _raw_anime_bangumi_char(image: ImageTyping, model_name: str = _DEFAULT_MODEL_NAME):
    """
    Perform raw anime bangumi character processing on the input image.

    :param image: The input image.
    :type image: ImageTyping
    :param model_name: The model name. Default is 'mobilenetv3_v0_dist'.
    :type model_name: str
    :return: The processed image data.
    :rtype: np.ndarray
    """
    image = load_image(image, force_background='white', mode='RGB')
    input_ = _img_encode(image)[None, ...]
    output, = _open_anime_bangumi_char_model(model_name).run(['output'], {'input': input_})
    return output
_REPO_ID = 'deepghs/bangumi_char_type'


def anime_bangumi_char_score(image: ImageTyping, model_name: str = _DEFAULT_MODEL_NAME) -> Dict[str, float]:
@@ -169,9 +89,7 @@ def anime_bangumi_char_score(image: ImageTyping, model_name: str = _DEFAULT_MODE
        >>> anime_bangumi_char_score('bangumi_char/face/16.jpg')
        {'vision': 1.066640925273532e-05, 'imagery': 9.529400813335087e-06, 'halfbody': 4.089402500540018e-05, 'face': 0.9999388456344604}
    """
    output = _raw_anime_bangumi_char(image, model_name)
    values = dict(zip(_get_anime_bangumi_char_labels(model_name), map(lambda x: x.item(), output[0])))
    return values
    return classify_predict_score(image, _REPO_ID, model_name)


def anime_bangumi_char(image: ImageTyping, model_name: str = _DEFAULT_MODEL_NAME) -> Tuple[str, float]:
@@ -221,6 +139,4 @@ def anime_bangumi_char(image: ImageTyping, model_name: str = _DEFAULT_MODEL_NAME
        >>> anime_bangumi_char('bangumi_char/face/16.jpg')
        ('face', 0.9999388456344604)
    """
    output = _raw_anime_bangumi_char(image, model_name)[0]
    max_id = np.argmax(output)
    return _get_anime_bangumi_char_labels(model_name)[max_id], output[max_id].item()
    return classify_predict(image, _REPO_ID, model_name)
+3 −2
Original line number Diff line number Diff line
@@ -3,8 +3,9 @@ import os.path

import pytest

from imgutils.generic.classify import _open_models_for_repo_id
from imgutils.validate import anime_bangumi_char
from imgutils.validate.bangumi_char import _open_anime_bangumi_char_model, anime_bangumi_char_score
from imgutils.validate.bangumi_char import anime_bangumi_char_score, _REPO_ID
from test.testings import get_testfile

_ROOT_DIR = get_testfile('bangumi_char')
@@ -19,7 +20,7 @@ def _release_model_after_run():
    try:
        yield
    finally:
        _open_anime_bangumi_char_model.cache_clear()
        _open_models_for_repo_id(_REPO_ID).clear()


@pytest.mark.unittest