Tiktok-Talent-Info/endpoints/image.py

from fastapi import UploadFile, Form
from fastapi.responses import JSONResponse
import base64
import io
import asyncio
import numpy as np
from PIL import Image
from pipeline_setup import pipe, IMAGE_TOKEN
from utils.image_processing import encode_image_base64
# api
async def image_query(file: UploadFile, question: str = Form(...)):
    """
    API endpoint to process an image with the user's query.
    """
    try:
        if file.content_type not in ["image/jpeg", "image/png"]:
            return JSONResponse({"query": question, "error": "Unsupported file type."})

        # Load the upload, normalize to RGB, and resize to the model's input size.
        image_data = await file.read()
        image = Image.open(io.BytesIO(image_data)).convert("RGB").resize((512, 512))

        # Base64 encoding is optional; keep it only if the pipeline needs it.
        encoded_image_base64 = encode_image_base64(image)

        # Prepare the query with the image token and run inference off the event loop.
        question_with_image_token = f"{question}\n{IMAGE_TOKEN}"
        response = await asyncio.to_thread(pipe, (question_with_image_token, image))
        return JSONResponse({"query": question, "response": response.text})
    except Exception as e:
        return JSONResponse({"query": question, "error": str(e)})
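
# How this endpoint might be wired and called (a minimal sketch, not from this repo;
# the app object, route path, and port are assumptions):
#
#   from fastapi import FastAPI
#   app = FastAPI()
#   app.post("/image-query")(image_query)
#
# Example request (multipart form, matching the UploadFile + Form parameters above):
#   curl -F "file=@photo.jpg;type=image/jpeg" -F "question=Describe this image" \
#        http://localhost:8000/image-query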
# gradio
# async def image_query(image: np.ndarray, question: str):
#     try:
#         # Convert the numpy array to a PIL Image
#         image = Image.fromarray(image).convert("RGB").resize((512, 512))
#
#         # Encode the image to base64 (optional, if needed by your pipeline)
#         buffered = io.BytesIO()
#         image.save(buffered, format="JPEG")
#         encoded_image_base64 = base64.b64encode(buffered.getvalue()).decode("utf-8")
#
#         # Prepare the query with the image token
#         question_with_image_token = f"{question}\n{IMAGE_TOKEN}"
#
#         # Query the model
#         response = await asyncio.to_thread(pipe, (question, image))
#         return {"query": question, "response": response.text}
#     except Exception as e:
#         return {"query": question, "error": str(e)}
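
# How the Gradio variant above could be exposed (a sketch under the assumption that the
# commented-out numpy-based image_query is re-enabled; component choices are assumptions):
#
#   import gradio as gr
#   demo = gr.Interface(
#       fn=image_query,  # Gradio accepts async handlers
#       inputs=[gr.Image(type="numpy"), gr.Textbox(label="Question")],
#       outputs="json",
#   )
#   demo.launch()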
# celery
# def image_query(image_path: str, question: str):
#     try:
#         print("image_path in image_query...")
#         with open(image_path, "rb") as file:
#             image_data = file.read()
#
#         image = Image.open(io.BytesIO(image_data)).convert("RGB").resize((512, 512))
#         encoded_image_base64 = encode_image_base64(image)
#
#         # Prepare the question with the image token
#         question_with_image_token = f"{question}\n{IMAGE_TOKEN}"
#
#         # Run model inference (blocking call, but can be async)
#         response = pipe((question_with_image_token, image))
#         return {"query": question, "response": response.text}
#     except Exception as e:
#         return {"query": question, "error": str(e)}
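
# How the Celery variant above could be registered as a task (a sketch; the app name,
# broker URL, and task name are assumptions, not taken from this repo):
#
#   from celery import Celery
#   celery_app = Celery("tiktok_talent_info", broker="redis://localhost:6379/0")
#   image_query_task = celery_app.task(name="image_query")(image_query)
#
#   # Caller side:
#   # image_query_task.delay("/path/to/image.jpg", "Describe this image")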