msinap · arman-aminian · Aug 11, 2023 · Aug 11, 2023 · Aug 11, 2023 · Aug 11, 2023
diff --git a/inference_server/main.py b/inference_server/main.py
@@ -6,20 +6,35 @@
 from transformers import AutoModel, AutoTokenizer
 from fastapi.openapi.utils import get_openapi
 from fastapi.responses import JSONResponse
-
+from mlflow.tracking import MlflowClient
+from mlflow.entities import ViewType
 
 client = QdrantClient("https://qdrant-mlsd-video-search.darkube.app", port=443)
 
 app = FastAPI()
 
-text_encoder = AutoModel.from_pretrained(os.environ['TEXT_ENCODER_MODEL'])
-text_tokenizer = AutoTokenizer.from_pretrained(os.environ['TEXT_ENCODER_MODEL'])
+MLFLOW_TRACKING_URI = "https://mlflow-mlsd-video-search.darkube.app/"
+client = MlflowClient(tracking_uri=MLFLOW_TRACKING_URI)
+experiments = client.search_experiments()
+exp_id = list(filter(lambda e: e.name == 'clip-farsi', experiments))[0].experiment_id
+runs = client.search_runs(
+    experiment_ids=exp_id,
+    filter_string="metrics.acc_at_10 >0.2",
+    run_view_type=ViewType.ACTIVE_ONLY,
+    max_results=5,
+    order_by=["metrics.acc_at_10 DESC"]
+)
+TEXT_ENCODER_MODEL = runs[0].data.tags['text_model']
+
+text_encoder = AutoModel.from_pretrained(TEXT_ENCODER_MODEL)
+text_tokenizer = AutoTokenizer.from_pretrained(TEXT_ENCODER_MODEL)
 
 
 @app.get("/{video_name}/")
 async def query(
-    video_name: str = Path(..., title="Video Name", description="Name of the video or 'ALL' to search in all videos"),
-    search_entry: str = Query(..., title="Search Entry", description="The search entry for text embedding"),
+        video_name: str = Path(..., title="Video Name",
+                               description="Name of the video or 'ALL' to search in all videos"),
+        search_entry: str = Query(..., title="Search Entry", description="The search entry for text embedding"),
 ):
     """
         Query for video frames based on the provided text search entry.
@@ -85,4 +100,3 @@ async def get_open_api_endpoint():
 @app.get("/docs", include_in_schema=False)
 async def get_documentation():
     return JSONResponse(content=app.openapi())
-
diff --git a/inference_server/requirements.txt b/inference_server/requirements.txt
@@ -4,3 +4,4 @@ torch  --index-url https://download.pytorch.org/whl/cpu
 torchvision  --index-url https://download.pytorch.org/whl/cpu
 transformers
 qdrant_client
+mlflow
diff --git a/video_database/video_to_db.py b/video_database/video_to_db.py
@@ -9,6 +9,8 @@
 import torchvision.transforms as transforms
 from qdrant_client import QdrantClient
 from qdrant_client.models import Record
+from mlflow.tracking import MlflowClient
+from mlflow.entities import ViewType
 
 
 def image_to_string(image):
@@ -25,7 +27,20 @@ def image_to_string(image):
     fps = int(video.get(cv2.CAP_PROP_FPS))
     frame_interval = fps * 5  # capture a frame every 5 seconds
 
-    image_encoder = CLIPVisionModel.from_pretrained('arman-aminian/clip-farsi-vision').eval()
+    MLFLOW_TRACKING_URI = "https://mlflow-mlsd-video-search.darkube.app/"
+    client = MlflowClient(tracking_uri=MLFLOW_TRACKING_URI)
+    experiments = client.search_experiments()
+    exp_id = list(filter(lambda e: e.name == 'clip-farsi', experiments))[0].experiment_id
+    runs = client.search_runs(
+        experiment_ids=exp_id,
+        filter_string="metrics.acc_at_10 >0.2",
+        run_view_type=ViewType.ACTIVE_ONLY,
+        max_results=5,
+        order_by=["metrics.acc_at_10 DESC"]
+    )
+    VISION_ENCODER_MODEL = runs[0].data.tags['vision_model']
+
+    image_encoder = CLIPVisionModel.from_pretrained(VISION_ENCODER_MODEL).eval()
 
     insert_data = []
     currentframe = 0