mirror of
https://github.com/xtekky/gpt4free.git
synced 2024-11-05 00:01:00 +00:00
a28bab9387
Fix preview for uploaded and generated images in gui Improve typing, readme
152 lines
4.7 KiB
Python
152 lines
4.7 KiB
Python
"""
|
|
Module to handle image uploading and processing for Bing AI integrations.
|
|
"""
|
|
from __future__ import annotations
|
|
|
|
import json
|
|
import math
|
|
from aiohttp import ClientSession, FormData
|
|
|
|
from ...typing import ImageType, Tuple
|
|
from ...image import to_image, process_image, to_base64_jpg, ImageRequest, Image
|
|
|
|
IMAGE_CONFIG = {
|
|
"maxImagePixels": 360000,
|
|
"imageCompressionRate": 0.7,
|
|
"enableFaceBlurDebug": False,
|
|
}
|
|
|
|
async def upload_image(
|
|
session: ClientSession,
|
|
image_data: ImageType,
|
|
tone: str,
|
|
proxy: str = None
|
|
) -> ImageRequest:
|
|
"""
|
|
Uploads an image to Bing's AI service and returns the image response.
|
|
|
|
Args:
|
|
session (ClientSession): The active session.
|
|
image_data (bytes): The image data to be uploaded.
|
|
tone (str): The tone of the conversation.
|
|
proxy (str, optional): Proxy if any. Defaults to None.
|
|
|
|
Raises:
|
|
RuntimeError: If the image upload fails.
|
|
|
|
Returns:
|
|
ImageRequest: The response from the image upload.
|
|
"""
|
|
image = to_image(image_data)
|
|
new_width, new_height = calculate_new_dimensions(image)
|
|
image = process_image(image, new_width, new_height)
|
|
img_binary_data = to_base64_jpg(image, IMAGE_CONFIG['imageCompressionRate'])
|
|
|
|
data = build_image_upload_payload(img_binary_data, tone)
|
|
headers = prepare_headers(session)
|
|
|
|
async with session.post("https://www.bing.com/images/kblob", data=data, headers=headers, proxy=proxy) as response:
|
|
if response.status != 200:
|
|
raise RuntimeError("Failed to upload image.")
|
|
return parse_image_response(await response.json())
|
|
|
|
def calculate_new_dimensions(image: Image) -> Tuple[int, int]:
|
|
"""
|
|
Calculates the new dimensions for the image based on the maximum allowed pixels.
|
|
|
|
Args:
|
|
image (Image): The PIL Image object.
|
|
|
|
Returns:
|
|
Tuple[int, int]: The new width and height for the image.
|
|
"""
|
|
width, height = image.size
|
|
max_image_pixels = IMAGE_CONFIG['maxImagePixels']
|
|
if max_image_pixels / (width * height) < 1:
|
|
scale_factor = math.sqrt(max_image_pixels / (width * height))
|
|
return int(width * scale_factor), int(height * scale_factor)
|
|
return width, height
|
|
|
|
def build_image_upload_payload(image_bin: str, tone: str) -> FormData:
|
|
"""
|
|
Builds the payload for image uploading.
|
|
|
|
Args:
|
|
image_bin (str): Base64 encoded image binary data.
|
|
tone (str): The tone of the conversation.
|
|
|
|
Returns:
|
|
Tuple[str, str]: The data and boundary for the payload.
|
|
"""
|
|
data = FormData()
|
|
knowledge_request = json.dumps(build_knowledge_request(tone), ensure_ascii=False)
|
|
data.add_field('knowledgeRequest', knowledge_request, content_type="application/json")
|
|
data.add_field('imageBase64', image_bin)
|
|
return data
|
|
|
|
def build_knowledge_request(tone: str) -> dict:
|
|
"""
|
|
Builds the knowledge request payload.
|
|
|
|
Args:
|
|
tone (str): The tone of the conversation.
|
|
|
|
Returns:
|
|
dict: The knowledge request payload.
|
|
"""
|
|
return {
|
|
"imageInfo": {},
|
|
"knowledgeRequest": {
|
|
'invokedSkills': ["ImageById"],
|
|
'subscriptionId': "Bing.Chat.Multimodal",
|
|
'invokedSkillsRequestData': {
|
|
'enableFaceBlur': True
|
|
},
|
|
'convoData': {
|
|
'convoid': "",
|
|
'convotone': tone
|
|
}
|
|
}
|
|
}
|
|
|
|
def prepare_headers(session: ClientSession) -> dict:
|
|
"""
|
|
Prepares the headers for the image upload request.
|
|
|
|
Args:
|
|
session (ClientSession): The active session.
|
|
boundary (str): The boundary string for the multipart/form-data.
|
|
|
|
Returns:
|
|
dict: The headers for the request.
|
|
"""
|
|
headers = session.headers.copy()
|
|
headers["Referer"] = 'https://www.bing.com/search?q=Bing+AI&showconv=1&FORM=hpcodx'
|
|
headers["Origin"] = 'https://www.bing.com'
|
|
return headers
|
|
|
|
def parse_image_response(response: dict) -> ImageRequest:
|
|
"""
|
|
Parses the response from the image upload.
|
|
|
|
Args:
|
|
response (dict): The response dictionary.
|
|
|
|
Raises:
|
|
RuntimeError: If parsing the image info fails.
|
|
|
|
Returns:
|
|
ImageRequest: The parsed image response.
|
|
"""
|
|
if not response.get('blobId'):
|
|
raise RuntimeError("Failed to parse image info.")
|
|
|
|
result = {'bcid': response.get('blobId', ""), 'blurredBcid': response.get('processedBlobId', "")}
|
|
result["imageUrl"] = f"https://www.bing.com/images/blob?bcid={result['blurredBcid'] or result['bcid']}"
|
|
|
|
result['originalImageUrl'] = (
|
|
f"https://www.bing.com/images/blob?bcid={result['blurredBcid']}"
|
|
if IMAGE_CONFIG["enableFaceBlurDebug"] else
|
|
f"https://www.bing.com/images/blob?bcid={result['bcid']}"
|
|
)
|
|
return ImageRequest(result) |