Merge pull request #41 from LlmKira/dev

fix(vibe): Align samples for vibe, fix server
LlmKira · Mar 19, 2024 · ee830f6
2 parents 346f29a + 111fb86
commit ee830f6
Show file tree

Hide file tree

Showing 8 changed files with 49 additions and 28 deletions.
diff --git a/playground/generate_image_img2img.py b/playground/generate_image_img2img.py
@@ -53,7 +53,7 @@ async def generate(
         print(f"charge: {agent.calculate_cost(is_opus=True)} if you are vip3")
         print(f"charge: {agent.calculate_cost(is_opus=False)} if you are not vip3")
         result = await agent.request(
-            session=credential, remove_sign=True
+            session=credential
         )
     except APIError as e:
         print(f"Error: {e.message}")

diff --git a/playground/upscale.py b/playground/upscale.py
@@ -40,7 +40,7 @@ async def generate(
         upscale = Upscale(image=data)  # Auto detect image size | base64
 
         _res = await upscale.request(
-            session=globe_s, remove_sign=True
+            session=globe_s
         )
     except APIError as e:
         print(e.response)

diff --git a/playground/vibe.py b/playground/vibe.py
@@ -44,7 +44,7 @@ async def generate(
         print(f"charge: {agent.calculate_cost(is_opus=True)} if you are vip3")
         print(f"charge: {agent.calculate_cost(is_opus=False)} if you are not vip3")
         result = await agent.request(
-            session=credential, remove_sign=True
+            session=credential
         )
     except APIError as e:
         print(f"Error: {e.message}")

diff --git a/playground/vibe_img2img.py b/playground/vibe_img2img.py
@@ -54,7 +54,7 @@ async def generate(
         print(f"charge: {agent.calculate_cost(is_opus=True)} if you are vip3")
         print(f"charge: {agent.calculate_cost(is_opus=False)} if you are not vip3")
         result = await agent.request(
-            session=credential, remove_sign=True
+            session=credential
         )
     except APIError as e:
         print(f"Error: {e.message}")

diff --git a/playground/vibe_inpaint.py b/playground/vibe_inpaint.py
@@ -74,7 +74,7 @@ async def generate(
         print(f"charge: {agent.calculate_cost(is_opus=True)} if you are vip3")
         print(f"charge: {agent.calculate_cost(is_opus=False)} if you are not vip3")
         result = await agent.request(
-            session=credential, remove_sign=True
+            session=credential
         )
     except APIError as e:
         print(f"Error: {e.message}")

diff --git a/pyproject.toml b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "novelai-python"
-version = "0.4.2"
+version = "0.4.3"
 description = "NovelAI Python Binding With Pydantic"
 authors = [
     { name = "sudoskys", email = "[email protected]" },

diff --git a/src/novelai_python/sdk/ai/generate_image/__init__.py b/src/novelai_python/sdk/ai/generate_image/__init__.py
@@ -14,7 +14,9 @@
 from zipfile import ZipFile
 
 import curl_cffi
+import cv2
 import httpx
+import numpy as np
 from curl_cffi.requests import AsyncSession
 from loguru import logger
 from pydantic import BaseModel, ConfigDict, PrivateAttr, field_validator, model_validator, Field
@@ -28,7 +30,7 @@
 from ...._response.ai.generate_image import ImageGenerateResp
 from ....credential import CredentialBase
 from ....utils import try_jsonfy
-from PIL import Image
+from PIL import Image, ImageEnhance
 
 
 class GenerateImageInfer(ApiBaseModel):
@@ -155,42 +157,61 @@ def resize_image(image: Union[str, bytes], width: int, height: int):
             return base64.b64encode(buffered.getvalue()).decode("utf-8")
 
         @staticmethod
-        def add_image_to_black_background(image: Union[str, bytes], width: int = 448, height: int = 448):
+        def add_image_to_black_background(
+                image: Union[str, bytes],
+                width: int = 448,
+                height: int = 448,
+                transparency: bool = False
+        ):
+
             """
             缩放图像到指定的黑色透明背景上，使其尽可能大且保持比例。
+            :param transparency: 是否透明
             :param image: 图像
             :param width: 宽
             :param height: 高
             :return: 新图像
             """
+
             if isinstance(image, str):
                 image = base64.b64decode(image)
 
-            open_image = Image.open(BytesIO(image)).convert("RGBA")
-            # 如果尺寸相同，直接返回
-            if open_image.width == width and open_image.height == height:
-                return base64.b64encode(image).decode("utf-8")
+            # Decode the image from the base64 string
+            npimg = np.frombuffer(image, np.uint8)
 
-            # 计算正确的缩放因子
-            width_ratio = width / open_image.width
-            height_ratio = height / open_image.height
+            # Read the image using OpenCV
+            open_image = cv2.imdecode(npimg, cv2.IMREAD_UNCHANGED)
+
+            # Calculate the ratio for scaling
+            width_ratio = width / open_image.shape[1]
+            height_ratio = height / open_image.shape[0]
             ratio = min(width_ratio, height_ratio)
 
-            new_image_size = (int(open_image.width * ratio), int(open_image.height * ratio))
-            open_image = open_image.resize(new_image_size, Image.Resampling.BICUBIC)
+            # Create new image size
+            new_image_size = (int(open_image.shape[1] * ratio), int(open_image.shape[0] * ratio))
 
-            # 创建一个黑色透明背景的新图像，颜色深度32位
-            new_image = Image.new("RGBA", (width, height), (0, 0, 0, 0))
+            # Resize the image
+            open_image = cv2.resize(open_image, new_image_size, interpolation=cv2.INTER_LINEAR)
 
-            # 计算居中位置
-            position = ((width - open_image.width) // 2, (height - open_image.height) // 2)
+            # Create black background
+            if open_image.shape[2] == 3:  # no alpha channel, add one
+                open_image = cv2.cvtColor(open_image, cv2.COLOR_BGR2BGRA)
+            if transparency:
+                bg_color = [0, 0, 0, 0]
+            else:
+                bg_color = [0, 0, 0, 255]
+            new_image = np.full((height, width, 4), bg_color, dtype=np.uint8)
 
-            # 粘贴图像
-            new_image.paste(open_image, position)
+            # Compute coords to place image on black background
+            position = ((width - open_image.shape[1]) // 2, (height - open_image.shape[0]) // 2)
 
-            buffered = BytesIO()
-            new_image.save(buffered, format="PNG")
-            return base64.b64encode(buffered.getvalue()).decode("utf-8")
+            # Place the image on black background at the calculated position
+            new_image[position[1]:position[1] + open_image.shape[0],
+            position[0]:position[0] + open_image.shape[1]] = open_image
+
+            # Encode image to base64 string
+            _, buffer = cv2.imencode('.png', new_image)
+            return base64.b64encode(buffer).decode("utf-8")
 
         # Validators
         @model_validator(mode="after")

diff --git a/src/novelai_python/server.py b/src/novelai_python/server.py
@@ -104,7 +104,7 @@ async def upscale(
     :return:
     """
     try:
-        _result = await req.request(session=get_session(current_token), remove_sign=True)
+        _result = await req.request(session=get_session(current_token))
         zip_file_bytes = io.BytesIO()
         with zipfile.ZipFile(zip_file_bytes, mode="w", compression=zipfile.ZIP_DEFLATED) as zip_file:
             file = _result.files  # ONLY TUPLE
@@ -150,7 +150,7 @@ async def generate_image(
     :return:
     """
     try:
-        _result = await req.request(session=get_session(current_token), remove_sign=True)
+        _result = await req.request(session=get_session(current_token))
         zip_file_bytes = io.BytesIO()
         with zipfile.ZipFile(zip_file_bytes, mode="w", compression=zipfile.ZIP_DEFLATED) as zip_file:
             for file in _result.files: