Skip to content

Commit 2df90b3

Browse files
committed
Added a new rq-gpu-worker that consumes the gpu queue; the old gpu queue was renamed to api.
1 parent 89bbf83 commit 2df90b3

File tree

19 files changed

+98
-38
lines changed

19 files changed

+98
-38
lines changed

backend/.vscode/launch.json

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -27,6 +27,7 @@
2727
"env": {
2828
"PYTHONPATH": "${workspaceFolder}/src",
2929
"RQ_WORKERS_CPU": "1",
30+
"RQ_WORKERS_API": "1",
3031
"RQ_WORKERS_GPU": "1",
3132
"CUDA_VISIBLE_DEVICES": "1"
3233
}

backend/src/modules/concept_over_time_analysis/cota_refinement_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,7 @@
1919
job_type=JobType.COTA_REFINEMENT,
2020
input_type=COTARefinementJobInput,
2121
output_type=None,
22-
device="gpu",
22+
device="api",
2323
result_ttl=JobResultTTL.NINETY_DAYS,
2424
)
2525
def cota_refinement(payload: COTARefinementJobInput, job: Job) -> None:

backend/src/modules/doc_processing/audio/transcription_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -41,7 +41,7 @@ class TranscriptionJobOutput(JobOutputBase):
4141
job_type=JobType.AUDIO_TRANSCRIPTION,
4242
input_type=TranscriptionJobInput,
4343
output_type=TranscriptionJobOutput,
44-
device="gpu",
44+
device="api",
4545
)
4646
def handle_transcription_job(
4747
payload: TranscriptionJobInput, job: Job

backend/src/modules/doc_processing/html/sentence_embedding_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@ class TextSentenceEmbeddingJobInput(SdocProcessingJobInput):
2222
@register_job(
2323
job_type=JobType.TEXT_SENTENCE_EMBEDDING,
2424
input_type=TextSentenceEmbeddingJobInput,
25-
device="gpu",
25+
device="api",
2626
)
2727
def handle_text_sentence_embedding_job(
2828
payload: TextSentenceEmbeddingJobInput, job: Job

backend/src/modules/doc_processing/image/image_caption_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,7 @@ class ImageCaptionJobOutput(JobOutputBase):
3030
job_type=JobType.IMAGE_CAPTION,
3131
input_type=ImageCaptionJobInput,
3232
output_type=ImageCaptionJobOutput,
33-
device="gpu",
33+
device="api",
3434
)
3535
def handle_image_caption_job(
3636
payload: ImageCaptionJobInput, job: Job

backend/src/modules/doc_processing/image/image_embedding_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,7 @@ class ImageEmbeddingJobInput(SdocProcessingJobInput):
2020

2121

2222
@register_job(
23-
job_type=JobType.IMAGE_EMBEDDING, input_type=ImageEmbeddingJobInput, device="gpu"
23+
job_type=JobType.IMAGE_EMBEDDING, input_type=ImageEmbeddingJobInput, device="api"
2424
)
2525
def handle_image_embedding_job(payload: ImageEmbeddingJobInput, job: Job) -> None:
2626
# embed the image

backend/src/modules/doc_processing/image/object_detection_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,7 @@ class ObjectDetectionJobInput(SdocProcessingJobInput):
2828
@register_job(
2929
job_type=JobType.IMAGE_OBJECT_DETECTION,
3030
input_type=ObjectDetectionJobInput,
31-
device="gpu",
31+
device="api",
3232
)
3333
def handle_object_detection_job(payload: ObjectDetectionJobInput, job: Job) -> None:
3434
# Run object detection with ray

backend/src/modules/llm_assistant/llm_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@
1414
output_type=LLMJobOutput,
1515
generate_endpoints=EndpointGeneration.ALL,
1616
router=router,
17-
device="gpu",
17+
device="api",
1818
result_ttl=JobResultTTL.NINETY_DAYS,
1919
timeout=-1, # infinite/no timeout
2020
)

backend/src/modules/ml/ml_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,7 @@
2727
job_type=JobType.ML,
2828
input_type=MLJobInput,
2929
generate_endpoints=EndpointGeneration.ALL,
30-
device="gpu",
30+
device="api",
3131
result_ttl=JobResultTTL.NINETY_DAYS,
3232
)
3333
def ml_job(payload: MLJobInput, job: Job) -> None:

backend/src/modules/perspectives/perspectives_job.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@
1010
@register_job(
1111
job_type=JobType.PERSPECTIVES,
1212
input_type=PerspectivesJobInput,
13-
device="gpu",
13+
device="api",
1414
result_ttl=JobResultTTL.NINETY_DAYS,
1515
)
1616
def perspectives_job(payload: PerspectivesJobInput, job: Job) -> None:

0 commit comments

Comments
 (0)