uhh-lt
diff --git a/‎backend/src/alembic/versions/d7e768a5b23d_vscode_launcher.py‎
Lines changed: 145 additions & 0 deletions b/‎backend/src/alembic/versions/d7e768a5b23d_vscode_launcher.py‎
Lines changed: 145 additions & 0 deletions
diff --git a/‎backend/src/api/endpoints/document_tag_recommendation.py‎
Lines changed: 58 additions & 3 deletions b/‎backend/src/api/endpoints/document_tag_recommendation.py‎
Lines changed: 58 additions & 3 deletions
diff --git a/‎backend/src/app/celery/background_jobs/__init__.py‎
Lines changed: 2 additions & 1 deletion b/‎backend/src/app/celery/background_jobs/__init__.py‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎backend/src/app/celery/background_jobs/document_classification.py‎
Lines changed: 3 additions & 3 deletions b/‎backend/src/app/celery/background_jobs/document_classification.py‎
Lines changed: 3 additions & 3 deletions
@@ -0,0 +1,145 @@
+"""vscode launcher
+
+Revision ID: d7e768a5b23d
+Revises: f3108bb5e496
+Create Date: 2025-01-22 08:51:22.353360
+
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision: str = "d7e768a5b23d"
+down_revision: Union[str, None] = "f3108bb5e496"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    """Create the document tag recommendation tables together with their indexes.
+
+    ``documenttagrecommendation`` (primary key ``task_id``, cascading foreign
+    keys to ``project.id`` and ``user.id``) is created first, followed by
+    ``documenttagrecommendationlink``, whose rows point at a recommendation
+    task, a source document and a document tag. All indexes are non-unique.
+    """
+    # ### commands auto generated by Alembic - please adjust! ###
+    task_table = "documenttagrecommendation"
+    link_table = "documenttagrecommendationlink"
+
+    # The task table must exist before the link table can reference it.
+    op.create_table(
+        task_table,
+        sa.Column("task_id", sa.Integer(), nullable=False),
+        sa.Column("model_name", sa.String(), nullable=True),
+        sa.Column(
+            "created",
+            sa.DateTime(),
+            server_default=sa.text("now()"),
+            nullable=False,
+        ),
+        sa.Column("user_id", sa.Integer(), nullable=False),
+        sa.Column("project_id", sa.Integer(), nullable=False),
+        sa.ForeignKeyConstraint(["project_id"], ["project.id"], ondelete="CASCADE"),
+        sa.ForeignKeyConstraint(["user_id"], ["user.id"], ondelete="CASCADE"),
+        sa.PrimaryKeyConstraint("task_id"),
+    )
+    # One plain index per column, named ix_<table>_<column>.
+    for col in ("created", "model_name", "project_id", "task_id", "user_id"):
+        op.create_index(
+            op.f(f"ix_{task_table}_{col}"),
+            task_table,
+            [col],
+            unique=False,
+        )
+
+    op.create_table(
+        link_table,
+        sa.Column("id", sa.Integer(), nullable=False),
+        sa.Column("recommendation_task_id", sa.Integer(), nullable=False),
+        sa.Column("source_document_id", sa.Integer(), nullable=False),
+        sa.Column("predicted_tag_id", sa.Integer(), nullable=False),
+        sa.Column("prediction_score", sa.Float(), nullable=True),
+        sa.Column("is_accepted", sa.Boolean(), nullable=True),
+        sa.ForeignKeyConstraint(
+            ["predicted_tag_id"], ["documenttag.id"], ondelete="CASCADE"
+        ),
+        sa.ForeignKeyConstraint(
+            ["recommendation_task_id"],
+            [f"{task_table}.task_id"],
+            ondelete="CASCADE",
+        ),
+        sa.ForeignKeyConstraint(
+            ["source_document_id"], ["sourcedocument.id"], ondelete="CASCADE"
+        ),
+        sa.PrimaryKeyConstraint("id"),
+    )
+    for col in ("id", "is_accepted", "prediction_score"):
+        op.create_index(
+            op.f(f"ix_{link_table}_{col}"),
+            link_table,
+            [col],
+            unique=False,
+        )
+    # ### end Alembic commands ###
+
+
+def downgrade() -> None:
+    """Drop the document tag recommendation indexes and tables.
+
+    ``documenttagrecommendationlink`` is removed first and
+    ``documenttagrecommendation`` second; for each table its indexes are
+    dropped before the table itself.
+    """
+    # ### commands auto generated by Alembic - please adjust! ###
+    link_table = "documenttagrecommendationlink"
+    task_table = "documenttagrecommendation"
+
+    for col in ("prediction_score", "is_accepted", "id"):
+        op.drop_index(op.f(f"ix_{link_table}_{col}"), table_name=link_table)
+    op.drop_table(link_table)
+
+    for col in ("user_id", "task_id", "project_id", "model_name", "created"):
+        op.drop_index(op.f(f"ix_{task_table}_{col}"), table_name=task_table)
+    op.drop_table(task_table)
+    # ### end Alembic commands ###
@@ -1,11 +1,16 @@
-from fastapi import APIRouter, BackgroundTasks, Depends
+from typing import List
+
+from fastapi import APIRouter, Depends, HTTPException
 from sqlalchemy.orm import Session
 
 from api.dependencies import get_current_user, get_db_session
 from app.celery.background_jobs import (
     prepare_and_start_document_classification_job_async,
 )
 from app.core.authorization.authz_user import AuthzUser
+from app.core.data.classification.document_classification_service import (
+    DocumentClassificationService,
+)
 from app.core.data.crud.document_tag_recommendation import (
     crud_document_tag_recommendation,
 )
@@ -15,6 +20,8 @@
     DocumentTagRecommendationRead,
 )
 
+dcs: DocumentClassificationService = DocumentClassificationService()
+
 router = APIRouter(
     prefix="/doctagrecommendation",
     dependencies=[Depends(get_current_user)],
@@ -32,7 +39,6 @@ def create_new_doc_tag_rec_task(
     db: Session = Depends(get_db_session),
     doc_tag_rec: DocumentTagRecommendationCreate,
     authz_user: AuthzUser = Depends(),
-    background_tasks: BackgroundTasks,
 ) -> DocumentTagRecommendationRead:
     authz_user.assert_in_project(doc_tag_rec.project_id)
 
@@ -51,4 +57,53 @@ def create_new_doc_tag_rec_task(
     return response
 
 
-# To-Do: Update of tag recommendation
+@router.get(
+    "/{task_id}",
+    response_model=List[dict],
+    summary="Retrieve all document tag recommendations for the given task ID.",
+)
+def get_recommendations_from_task_endpoint(task_id: int) -> List[dict]:
+    """
+    Retrieves document tag recommendations based on the specified task ID.
+
+    ### Response Format:
+    The endpoint returns a list of recommendations, where each recommendation
+    is represented as a dictionary with the following structure:
+
+    ```python
+    {
+        "recommendation_id": int,  # Unique identifier for the recommendation
+        "source_document": str,    # Name of the source document
+        "predicted_tag_id": int,   # ID of the predicted tag
+        "predicted_tag": str,      # Name of the predicted tag
+        "prediction_score": float  # Confidence score of the prediction
+    }
+    ```
+
+    ### Error Handling:
+    - Returns HTTP 404 if no recommendations are found for the given task ID.
+    """
+    # NOTE(review): no project-membership check is visible in this handler,
+    # unlike the create endpoint's assert_in_project call - confirm intended.
+    found = dcs.get_recommendations_from_task(task_id)
+    if found:
+        return found
+
+    # A falsy result is reported as 404 rather than returned as-is.
+    raise HTTPException(status_code=404, detail="No recommendations found.")
+
+
+@router.patch(
+    "/accept_recommendations",
+    response_model=int,
+    summary="The endpoint receives IDs of correctly tagged document recommendations and sets `is_accepted` to `true`, while setting the corresponding document tags.",
+)
+def update_document_tag_recommendations(
+    *,
+    accepted_recommendation_ids: List[int],
+) -> int:
+    # Hand the accepted IDs to the classification service; whatever it returns
+    # goes back to the client unless it is the -1 sentinel.
+    update_result = dcs.validate_recommendations(
+        recommendation_ids=accepted_recommendation_ids
+    )
+    if update_result != -1:
+        return update_result
+
+    # -1 from the service is translated into an HTTP 400 response.
+    raise HTTPException(
+        status_code=400, detail="An error occurred while updating recommendations."
+    )
@@ -4,7 +4,7 @@
 from celery import Task
 
 from app.core.data.classification.document_classification_service import (
-    ClassificationService as ClassificationService,
+    DocumentClassificationService as DocumentClassificationService,
 )
 from app.core.data.crawler.crawler_service import CrawlerService
 from app.core.data.dto.crawler_job import CrawlerJobParameters, CrawlerJobRead
@@ -169,4 +169,5 @@ def prepare_and_start_document_classification_job_async(
         start_document_classification_job,
     )
 
+    assert isinstance(start_document_classification_job, Task), "Not a Celery Task"
     start_document_classification_job(task_id=task_id, project_id=project_id)
@@ -1,14 +1,14 @@
 from loguru import logger
 
 from app.core.data.classification.document_classification_service import (
-    ClassificationService,
+    DocumentClassificationService,
 )
 
-cs: ClassificationService = ClassificationService()
+dcs: DocumentClassificationService = DocumentClassificationService()
 
 
 def start_document_classification_job_(task_id: int, project_id):
+    """Run the document classification for one task and log start and finish.
+
+    Both arguments are forwarded unchanged to
+    ``DocumentClassificationService.classify_untagged_documents``.
+    """
-    logger.info((f"Starting classification job with task id {task_id}",))
-    cs.perform_dummy_classification(task_id=task_id, project_id=project_id)
+    # Log the message string itself; it used to be wrapped in a one-element
+    # tuple, so the log showed the tuple instead of the plain text.
+    logger.info(f"Starting classification job with task id {task_id}")
+    dcs.classify_untagged_documents(task_id=task_id, project_id=project_id)
 
     logger.info(f"Classification job {task_id} has finished.")
Original file line number	Diff line number	Diff line change
`@@ -4,7 +4,7 @@`
`4`	`4`	`from celery import Task`
`5`	`5`
`6`	`6`	`from app.core.data.classification.document_classification_service import (`
`7`		`- ClassificationService as ClassificationService,`
	`7`	`+ DocumentClassificationService as DocumentClassificationService,`
`8`	`8`	`)`
`9`	`9`	`from app.core.data.crawler.crawler_service import CrawlerService`
`10`	`10`	`from app.core.data.dto.crawler_job import CrawlerJobParameters, CrawlerJobRead`
`@@ -169,4 +169,5 @@ def prepare_and_start_document_classification_job_async(`
`169`	`169`	`start_document_classification_job,`
`170`	`170`	`)`
`171`	`171`
	`172`	`+ assert isinstance(start_document_classification_job, Task), "Not a Celery Task"`
`172`	`173`	`start_document_classification_job(task_id=task_id, project_id=project_id)`