updated celery redis

Zixiao Wang 2025-02-07 19:18:35 +08:00
parent 7b80572f09
commit 814e558959
17 changed files with 309 additions and 55 deletions

0
__init__.py Normal file

3 binary files changed (contents not shown)

25
celery_app.py Normal file

@@ -0,0 +1,25 @@
# from celery import Celery
#
# celery_app = Celery(
#     "tasks",
#     broker="redis://localhost:6379/0",   # Redis as broker
#     backend="redis://localhost:6379/0",  # Redis for storing results
# )
#
# celery_app.conf.task_routes = {
#     "tasks.*": {"queue": "default"},
# }

from celery import Celery

celery_app = Celery(
    "tasks",
    broker="redis://localhost:6379/0",
    backend="redis://localhost:6379/0",
    include=["tasks"]  # ✅ Prevents import issues
)

celery_app.conf.task_routes = {
    "tasks.*": {"queue": "default"},
}
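Since `celery_app.conf.task_routes` sends everything under `tasks.*` to the `default` queue, a worker has to be told to consume that queue (workers listen on the `celery` queue by default). A minimal sketch of starting a worker and smoke-testing a task, assuming the `tasks.py` module added in this commit; the question text is illustrative:

# Start a worker on the "default" queue (run from the project root):
#   celery -A celery_app worker --loglevel=info -Q default
#
# Then, from a Python shell, enqueue a task and wait for its result:
from tasks import text_query_task

result = text_query_task.apply_async(args=["What is FastAPI?"])
print(result.id)                # task id, resolvable via the Redis result backend
print(result.get(timeout=120))  # blocks until the worker stores a result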

0
endpoints/__init__.py Normal file

endpoints/image.py

@@ -1,7 +1,6 @@
from fastapi import UploadFile, Form
from fastapi.responses import JSONResponse
import io
import base64
import asyncio
import numpy as np
from PIL import Image
@@ -27,7 +26,6 @@ async def image_query(file: UploadFile, question: str = Form(...)):
        return JSONResponse({"query": question, "error": str(e)})

# import mimetypes
# async def image_query(image: np.ndarray, question: str):
#     """
#     API endpoint to process an image (as numpy array) with the user's query.

endpoints/text.py

@@ -9,11 +9,12 @@ async def text_query(question: str = Form(...)):
    API endpoint to process text input with the user's query.
    """
    try:
        response = await asyncio.to_thread(pipe, question)
        response = await to_thread(pipe, question)
        return JSONResponse({"query": question, "response": response.text})
    except Exception as e:
        return JSONResponse({"query": question, "error": str(e)})

# async def text_query(question: str = Form(...)):
#     """
#     API endpoint to process text input with the user's query.
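The change above swaps `asyncio.to_thread(pipe, question)` for a bare `to_thread(...)`, which implies a `from asyncio import to_thread` import elsewhere in the file. A minimal, self-contained sketch of the pattern, with `slow_pipe` as a stand-in for the real blocking `pipe` call:

from asyncio import to_thread

from fastapi import FastAPI, Form
from fastapi.responses import JSONResponse

app = FastAPI()

def slow_pipe(question: str) -> str:
    # placeholder for the blocking lmdeploy pipe(question) call
    return f"echo: {question}"

@app.post("/api/text")
async def text_query(question: str = Form(...)):
    # run the blocking call in a worker thread so the event loop stays responsive
    response = await to_thread(slow_pipe, question)
    return JSONResponse({"query": question, "response": response})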

locustfile.py

@@ -1,18 +1,117 @@
from locust import HttpUser, task, between
import os
import time
import asyncio

from locust import FastHttpUser, HttpUser, task, between, constant

class MultiModalUser(HttpUser):
    wait_time = between(1, 3)

import torch
print(torch.cuda.is_available())

class FastAPIUser(FastHttpUser):
    # wait_time = between(1, 3)  # Wait time between requests
    wait_time = constant(0)  # send requests simultaneously

    def ensure_event_loop(self):
        """Ensures each Locust task runs in a fresh asyncio event loop."""
        try:
            asyncio.get_running_loop()
        except RuntimeError:
            asyncio.set_event_loop(asyncio.new_event_loop())

    # @task
    # def text_query(self):
    #     """Simulate text query request."""
    #     url = "/api/text"
    #     # start_event.wait()  # Synchronize all users
    #     start_time = time.time()
    #     response = self.client.post(url, data={"question": "What is FastAPI?"})
    #     total_time = time.time() - start_time
    #     if response.status_code == 200:
    #         print(f"Success: {response.json()} (Time: {total_time:.2f}s)")
    #     else:
    #         print(f"Error: {response.status_code} - {response.text}")

    # @task
    # def upload_image(self):
    #     """Sends an image with the correct query format."""
    #     url = "/api/image"
    #     image_path = "../profile/1.png"
    #     if not os.path.exists(image_path):
    #         print(f"Error: File {image_path} not found!")
    #         return
    #     query_text = (
    #         "Extract the following information from this image and return the result in JSON format:\n"
    #         "- Name: <name>\n"
    #         "- ID: <id>\n"
    #         "- Profile Picture: <url>\n"
    #         "- Follower Count: <count>\n"
    #         "- Likes Count: <count>\n"
    #         "- Bio: <bio>\n"
    #         "- Following Count: <count>\n"
    #         "- External Links: <links>\n"
    #         "Do not include any disclaimers or comments like 'I'm sorry' or 'I can't assist'."
    #     )
    #     with open(image_path, "rb") as image_file:
    #         files = {
    #             "file": ("1.png", image_file, "image/png"),
    #             "question": (None, query_text)
    #         }
    #         start_time = time.time()
    #         response = self.client.post(url, files=files)
    #         total_time = time.time() - start_time
    #         if response.status_code == 200:
    #             print(f"Success: {response.json()} (Time: {total_time:.2f}s)")
    #         else:
    #             print(f"Error: {response.status_code} - {response.text}")

    @task
    def text_query(self):
        self.client.post("/api/predict", json={"input": "What is the capital of France?"})

    def video_query(self):
        """Uploads a video and asks a detailed question."""
        url = "/api/video"
        video_path = "../video/1.1.mp4"

        # @task
        # def image_query(self):
        #     with open("test_image.jpg", "rb") as f:
        #         self.client.post("/api/image_predict", files={"file": f}, data={"question": "What is in this image?"})

        if not os.path.exists(video_path):
            print(f"Error: File {video_path} not found!")
            return

        # @task
        # def video_query(self):
        #     with open("test_video.mp4", "rb") as f:
        #         self.client.post("/api/video_predict", files={"file": f}, data={"question": "What is happening in this video?"})

        with open(video_path, "rb") as file:
            files = {
                "file": ("1.1.mp4", file, "video/mp4"),
                "question": (None, """Based on the given images and audio script, extract detailed
information about the products recommended in the video and format the output as JSON with
the following fields:
1. **Product Name**: The specific name of the product, if mentioned.
2. **Category**: The specific category of the product (e.g., electronics, skincare, casual wear, etc.).
3. **Styles or Variants**: Any styles, designs, or variants of the product described
(e.g., colors, patterns, sizes, or other distinguishing attributes).
4. **Highlights**: The unique selling points or notable features emphasized by the anchor
(e.g., benefits, quality, or standout features).
5. **Promotional Details**: Any additional promotional information mentioned, such as discounts,
offers, or key features that set the product apart."""
                )
            }
            print("Starting video query...")
            start_time = time.time()
            response = self.client.post(url, files=files)
            total_time = time.time() - start_time
            if response.status_code == 200:
                print(f"Success: {response.json()} (Time: {total_time:.2f}s)")
            else:
                print(f"Error: {response.status_code} - {response.text}")
            print("Video query completed.")

# locust -f locustfile.py

# curl -X POST http://localhost:8002/api/image \
#     -F "file=@../profile/1.png" \
#     -F "question=What is this image about?"

91
main.py

@@ -1,18 +1,83 @@
from fastapi import FastAPI
from endpoints.text import text_query
from endpoints.image import image_query
from endpoints.video import video_query
# from fastapi import FastAPI, Form, UploadFile
# from fastapi.responses import JSONResponse
# import asyncio
#
# app = FastAPI()
#
# @app.post("/api/text")
# async def text_query_endpoint(question: str = Form(...)):
#     """
#     API endpoint to process text input with the user's query.
#     """
#     from endpoints.text import text_query
#     return await text_query(question=question)
#
# @app.post("/api/image")
# async def image_query_endpoint(file: UploadFile, question: str = Form(...)):
#     """
#     API endpoint to process an image with the user's query.
#     """
#     from endpoints.image import image_query
#     return await image_query(file=file, question=question)
#
# @app.post("/api/video")
# async def video_query_endpoint(file: UploadFile, question: str = Form(...)):
#     """
#     API endpoint to process a video file with the user's query.
#     """
#     from endpoints.video import video_query
#     return await video_query(file=file, question=question)
#
# if __name__ == "__main__":
#     import uvicorn
#     uvicorn.run("main:app", host="0.0.0.0", port=8002, reload=True, loop="uvloop")

from fastapi import FastAPI, Form, UploadFile
from fastapi.responses import JSONResponse
import shutil
import uuid

from tasks import text_query_task, image_query_task, video_query_task

app = FastAPI()

# Register routes
app.post("/api/text")(text_query)
app.post("/api/image")(image_query)
app.post("/api/video")(video_query)

# @app.post("/api/text")
# async def text_query_endpoint(question: str = Form(...)):
#     task = text_query_task.apply_async(args=[question])
#     return JSONResponse({"task_id": task.id})

if __name__ == "__main__":
    import uvicorn
    uvicorn.run("main:app", host="0.0.0.0", port=8002, reload=True)

@app.post("/api/text")
async def text_query_endpoint(question: str = Form(...)):
    print(f"Received request: {question}")
    task = text_query_task.apply_async(args=[question])
    print(f"Task sent: {task.id}")
    return JSONResponse({"task_id": task.id})

# python main.py
# uvicorn main:app --reload

@app.post("/api/image")
async def image_query_endpoint(file: UploadFile, question: str = Form(...)):
    file_path = f"/tmp/{uuid.uuid4()}_{file.filename}"
    with open(file_path, "wb") as buffer:
        shutil.copyfileobj(file.file, buffer)
    task = image_query_task.apply_async(args=[file_path, question])
    return JSONResponse({"task_id": task.id})

@app.post("/api/video")
async def video_query_endpoint(file: UploadFile, question: str = Form(...)):
    file_path = f"/tmp/{uuid.uuid4()}_{file.filename}"
    with open(file_path, "wb") as buffer:
        shutil.copyfileobj(file.file, buffer)
    task = video_query_task.apply_async(args=[file_path, question])
    return JSONResponse({"task_id": task.id})

@app.get("/api/task/{task_id}")
async def get_task_result(task_id: str):
    from celery.result import AsyncResult
    result = AsyncResult(task_id)
    if result.ready():
        return JSONResponse({"status": "completed", "result": result.result})
    return JSONResponse({"status": "pending"})

View File

@@ -1,22 +1,63 @@
import requests
import threading
import asyncio
import httpx

def send_request(user_id):
    url = "http://localhost:8002"
    data = {"input": f"Test input from user {user_id}"}
    response = requests.post(url, json=data)
    print(f"User {user_id} response: {response.text}")

BASE_URL = "http://localhost:8002"

def main(num_users):
    threads = []
    for i in range(num_users):
        thread = threading.Thread(target=send_request, args=(i,))
        threads.append(thread)
        thread.start()

async def test_text_query(session_id: int):
    """Send a POST request to the /api/text endpoint."""
    try:
        async with httpx.AsyncClient(timeout=30.0) as client:
            # Correctly send form data
            response = await client.post(
                "http://localhost:8002/api/text",
                data={"question": f"Test question: what is AI from session {session_id}"}
            )
            print(f"Session {session_id} Status Code: {response.status_code}")
            print(f"Session {session_id} Headers: {response.headers}")
            if response.content:
                print(f"Session {session_id} Response: {response.json()}")
            else:
                print(f"Session {session_id} Response is empty.")
    except Exception as e:
        print(f"Session {session_id} encountered an error: {e}")

async def test_image_query(session_id: int):
    """Send a POST request to the /api/image endpoint with a dummy image."""
    async with httpx.AsyncClient(timeout=30.0) as client:
        files = {'file': ('../profile/1.jpg', b'binary data of the file', 'image/jpeg')}
        response = await client.post(
            f"{BASE_URL}/api/image",
            data={"question": f"Image query: what is in the picture from session {session_id}"},
            files=files
        )
        print(f"Session {session_id} Raw Response: {response.text}")
        print(f"Session {session_id} Response: {response.json()}")

async def test_video_query(session_id: int):
    """Send a POST request to the /api/video endpoint with a dummy video."""
    async with httpx.AsyncClient(timeout=30.0) as client:
        files = {'file': ('../video/1.mp4', b'binary data of the file', 'video/mp4')}
        response = await client.post(
            f"{BASE_URL}/api/video",
            data={"question": f"Video query: what is in the video from session {session_id}"},
            files=files
        )
        print(f"Session {session_id} Raw Response: {response.text}")
        print(f"Session {session_id} Response: {response.json()}")

async def main():
    tasks = []
    for i in range(1, 3):
        tasks.append(test_text_query(i))
        # tasks.append(test_image_query(i))
        # tasks.append(test_video_query(i))
    # Run all tasks concurrently
    await asyncio.gather(*tasks)
    for thread in threads:
        thread.join()

if __name__ == "__main__":
    num_users = 2
    main(num_users)
    asyncio.run(main())
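The image and video helpers above send placeholder bytes rather than real files. A sketch of an upload that streams an actual file through httpx's multipart support (the path is illustrative; with the Celery-backed API the response body is `{"task_id": ...}` rather than the model output):

import asyncio
import httpx

BASE_URL = "http://localhost:8002"

async def test_real_image(session_id: int, path: str = "../profile/1.png"):
    async with httpx.AsyncClient(timeout=30.0) as client:
        with open(path, "rb") as f:
            files = {"file": ("1.png", f, "image/png")}
            response = await client.post(
                f"{BASE_URL}/api/image",
                data={"question": f"What is in the picture? (session {session_id})"},
                files=files,
            )
    print(f"Session {session_id} Response: {response.json()}")

# asyncio.run(test_real_image(1))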

View File

@@ -4,6 +4,7 @@ from lmdeploy import pipeline, TurbomindEngineConfig, GenerationConfig
IMAGE_TOKEN = "[IMAGE_TOKEN]"
os.environ["CUDA_VISIBLE_DEVICES"] = "0,1"
# os.environ["CUDA_VISIBLE_DEVICES"] = "2,3"

# Model initialization
model = "OpenGVLab/InternVL2-26B-AWQ"
@@ -13,11 +14,11 @@ pipe = pipeline(
        model_format="awq",
        tp=2,
        # tp=4,
        session_len=2048,  # 4096, 8192, 16384, 32768
        session_len=16384,  # 4096, 8192, 16384, 32768
        max_batch_size=1,
        cache_max_entry_count=0.1,  # 0.05
        cache_block_seq_len=4096,  # 8192, 16384, 32768
        quant_policy=4,
        cache_max_entry_count=0.2,  # 0.05
        cache_block_seq_len=16384,  # 8192, 16384, 32768
        # quant_policy=8,
        # precision="fp16",
    ),
    # log_level='DEBUG'
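For context, a sketch of how the tuned values above fit into the `pipeline(...)` call named in the hunk header; it assumes the engine options sit inside `backend_config=TurbomindEngineConfig(...)`, which the import on the first hunk line suggests, and is an illustration rather than the exact file contents:

import os
from lmdeploy import pipeline, TurbomindEngineConfig

os.environ["CUDA_VISIBLE_DEVICES"] = "0,1"

model = "OpenGVLab/InternVL2-26B-AWQ"
pipe = pipeline(
    model,
    backend_config=TurbomindEngineConfig(
        model_format="awq",
        tp=2,                       # tensor parallelism across the two visible GPUs
        session_len=16384,          # raised from 2048 in this commit
        max_batch_size=1,
        cache_max_entry_count=0.2,  # raised from 0.1: proportion of GPU memory for the KV cache
        cache_block_seq_len=16384,
    ),
)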

25
tasks.py Normal file

@@ -0,0 +1,25 @@
import asyncio

from celery_app import celery_app

@celery_app.task
def text_query_task(question: str):
    from endpoints.text import text_query  # Import inside the function to avoid circular import
    loop = asyncio.new_event_loop()
    asyncio.set_event_loop(loop)
    return loop.run_until_complete(text_query(question=question))  # ✅ Correct way to call async functions in Celery

@celery_app.task
def image_query_task(file_path: str, question: str):
    from endpoints.image import image_query  # Import inside the function
    with open(file_path, "rb") as file:
        loop = asyncio.new_event_loop()
        asyncio.set_event_loop(loop)
        return loop.run_until_complete(image_query(file=file, question=question))  # ✅ Use event loop

@celery_app.task
def video_query_task(file_path: str, question: str):
    from endpoints.video import video_query  # Import inside the function
    with open(file_path, "rb") as file:
        loop = asyncio.new_event_loop()
        asyncio.set_event_loop(loop)
        return loop.run_until_complete(video_query(file=file, question=question))  # ✅ Use event loop
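Each task above creates a fresh event loop per call and never closes it; `asyncio.run()` gives the same behaviour with the teardown handled for you. Note also that the endpoints return `JSONResponse` objects, which Celery's default JSON result serializer cannot store in Redis as-is. A sketch of one way to address both points, under those assumptions (the `_v2` name is illustrative, not part of the repo):

import asyncio
import json

from celery_app import celery_app

@celery_app.task
def text_query_task_v2(question: str):
    from endpoints.text import text_query  # late import to avoid the circular import
    response = asyncio.run(text_query(question=question))  # creates and closes its own loop
    return json.loads(response.body)  # plain dict: safe for the JSON result backend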

1
ui.py

@@ -92,7 +92,6 @@ def setup_ui():
            outputs=[video_output]
        )
    return ui

if __name__ == "__main__":