|
""" |
|
Module to handle image uploading and processing for Bing AI integrations. |
|
""" |
|
from __future__ import annotations |
|
|
|
import json |
|
import math |
|
from aiohttp import ClientSession, FormData |
|
|
|
from ...typing import ImageType, Tuple |
|
from ...image import to_image, process_image, to_base64_jpg, ImageRequest, Image |
|
from ...requests import raise_for_status |
|
|
|
IMAGE_CONFIG = { |
|
"maxImagePixels": 360000, |
|
"imageCompressionRate": 0.7, |
|
"enableFaceBlurDebug": False, |
|
} |
|
|
|
async def upload_image( |
|
session: ClientSession, |
|
image_data: ImageType, |
|
tone: str, |
|
headers: dict |
|
) -> ImageRequest: |
|
""" |
|
Uploads an image to Bing's AI service and returns the image response. |
|
|
|
Args: |
|
session (ClientSession): The active session. |
|
image_data (bytes): The image data to be uploaded. |
|
tone (str): The tone of the conversation. |
|
proxy (str, optional): Proxy if any. Defaults to None. |
|
|
|
Raises: |
|
RuntimeError: If the image upload fails. |
|
|
|
Returns: |
|
ImageRequest: The response from the image upload. |
|
""" |
|
image = to_image(image_data) |
|
new_width, new_height = calculate_new_dimensions(image) |
|
image = process_image(image, new_width, new_height) |
|
img_binary_data = to_base64_jpg(image, IMAGE_CONFIG['imageCompressionRate']) |
|
|
|
data = build_image_upload_payload(img_binary_data, tone) |
|
|
|
async with session.post("https://www.bing.com/images/kblob", data=data, headers=prepare_headers(headers)) as response: |
|
await raise_for_status(response, "Failed to upload image") |
|
return parse_image_response(await response.json()) |
|
|
|
def calculate_new_dimensions(image: Image) -> Tuple[int, int]: |
|
""" |
|
Calculates the new dimensions for the image based on the maximum allowed pixels. |
|
|
|
Args: |
|
image (Image): The PIL Image object. |
|
|
|
Returns: |
|
Tuple[int, int]: The new width and height for the image. |
|
""" |
|
width, height = image.size |
|
max_image_pixels = IMAGE_CONFIG['maxImagePixels'] |
|
if max_image_pixels / (width * height) < 1: |
|
scale_factor = math.sqrt(max_image_pixels / (width * height)) |
|
return int(width * scale_factor), int(height * scale_factor) |
|
return width, height |
|
|
|
def build_image_upload_payload(image_bin: str, tone: str) -> FormData: |
|
""" |
|
Builds the payload for image uploading. |
|
|
|
Args: |
|
image_bin (str): Base64 encoded image binary data. |
|
tone (str): The tone of the conversation. |
|
|
|
Returns: |
|
Tuple[str, str]: The data and boundary for the payload. |
|
""" |
|
data = FormData() |
|
knowledge_request = json.dumps(build_knowledge_request(tone), ensure_ascii=False) |
|
data.add_field('knowledgeRequest', knowledge_request, content_type="application/json") |
|
data.add_field('imageBase64', image_bin) |
|
return data |
|
|
|
def build_knowledge_request(tone: str) -> dict: |
|
""" |
|
Builds the knowledge request payload. |
|
|
|
Args: |
|
tone (str): The tone of the conversation. |
|
|
|
Returns: |
|
dict: The knowledge request payload. |
|
""" |
|
return { |
|
"imageInfo": {}, |
|
"knowledgeRequest": { |
|
'invokedSkills': ["ImageById"], |
|
'subscriptionId': "Bing.Chat.Multimodal", |
|
'invokedSkillsRequestData': { |
|
'enableFaceBlur': True |
|
}, |
|
'convoData': { |
|
'convoid': "", |
|
'convotone': tone |
|
} |
|
} |
|
} |
|
|
|
def prepare_headers(headers: dict) -> dict: |
|
""" |
|
Prepares the headers for the image upload request. |
|
|
|
Args: |
|
session (ClientSession): The active session. |
|
boundary (str): The boundary string for the multipart/form-data. |
|
|
|
Returns: |
|
dict: The headers for the request. |
|
""" |
|
headers["Referer"] = 'https://www.bing.com/search?q=Bing+AI&showconv=1&FORM=hpcodx' |
|
headers["Origin"] = 'https://www.bing.com' |
|
return headers |
|
|
|
def parse_image_response(response: dict) -> ImageRequest: |
|
""" |
|
Parses the response from the image upload. |
|
|
|
Args: |
|
response (dict): The response dictionary. |
|
|
|
Raises: |
|
RuntimeError: If parsing the image info fails. |
|
|
|
Returns: |
|
ImageRequest: The parsed image response. |
|
""" |
|
if not response.get('blobId'): |
|
raise RuntimeError("Failed to parse image info.") |
|
|
|
result = {'bcid': response.get('blobId', ""), 'blurredBcid': response.get('processedBlobId', "")} |
|
result["imageUrl"] = f"https://www.bing.com/images/blob?bcid={result['blurredBcid'] or result['bcid']}" |
|
|
|
result['originalImageUrl'] = ( |
|
f"https://www.bing.com/images/blob?bcid={result['blurredBcid']}" |
|
if IMAGE_CONFIG["enableFaceBlurDebug"] else |
|
f"https://www.bing.com/images/blob?bcid={result['bcid']}" |
|
) |
|
return ImageRequest(result) |