diff --git a/extensions/inference-triton-trtllm-extension/src/index.ts b/extensions/inference-triton-trtllm-extension/src/index.ts index d0de32357c..9e8d64bb25 100644 --- a/extensions/inference-triton-trtllm-extension/src/index.ts +++ b/extensions/inference-triton-trtllm-extension/src/index.ts @@ -93,7 +93,7 @@ export default class JanInferenceTritonTrtLLMExtension implements InferenceExten static async writeDefaultEngineSettings() { try { const engine_json = join(JanInferenceTritonTrtLLMExtension._homeDir, JanInferenceTritonTrtLLMExtension._engineMetadataFileName) - if (await fs.checkFileExists(engine_json)) { + if (await fs.exists(engine_json)) { JanInferenceTritonTrtLLMExtension._engineSettings = JSON.parse(await fs.readFile(engine_json)) } else { @@ -123,7 +123,7 @@ export default class JanInferenceTritonTrtLLMExtension implements InferenceExten * @param {MessageRequest} data - The data for the inference request. * @returns {Promise} A promise that resolves with the inference response. */ - async inferenceRequest(data: MessageRequest): Promise { + async inference(data: MessageRequest): Promise { const timestamp = Date.now(); const message: ThreadMessage = { thread_id: data.threadId,