Skip to content

Commit c853cf5

Browse files
committed
release v0.2.4
1 parent 86940b9 commit c853cf5

File tree

4 files changed

+20
-17
lines changed

4 files changed

+20
-17
lines changed

requirements.txt

+5 -2
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,7 @@
1-
vllm>=0.4.2
2-
infinity-emb[torch,optimum]>=0.0.33
1+
vllm==0.4.3
2+
infinity-emb[torch,optimum]==0.0.40
3 3
openai>=1.5.0
4+
uvicorn
5+
pydantic
6+
fastapi
4 7
sse-starlette

src/imitater/__init__.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -1 +1 @@
1-
__version__ = "0.2.4.dev0"
1+
__version__ = "0.2.4"

src/imitater/model/chat_model.py

+9 -9
Original file line number | Diff line number | Diff line change
@@ -34,14 +34,14 @@ class ChatConfig:
3434

3535
@staticmethod
3636
def add_cli_args(parser: "ArgumentParser") -> None:
37-
parser.add_argument("--name", type=str)
38-
parser.add_argument("--path", type=str)
39-
parser.add_argument("--device", type=int, nargs="+")
40-
parser.add_argument("--port", type=int)
41-
parser.add_argument("--maxlen", type=int, default=2048)
42-
parser.add_argument("--agent_type", type=str, choices=list_agents(), default="react")
43-
parser.add_argument("--template", type=str, default=None)
44-
parser.add_argument("--gen_config", type=str, default=None)
37+
parser.add_argument("--name", type=str, required=True, help="Model name.")
38+
parser.add_argument("--path", type=str, required=True, help="Model path or hub id.")
39+
parser.add_argument("--device", type=int, nargs="+", required=True, help="Device ids.")
40+
parser.add_argument("--port", type=int, required=True, help="API port.")
41+
parser.add_argument("--maxlen", type=int, default=2048, help="Max sequence length.")
42+
parser.add_argument("--agent_type", type=str, choices=list_agents(), default="react", help="Agent type.")
43+
parser.add_argument("--template", type=str, default=None, help="Template path.")
44+
parser.add_argument("--gen_config", type=str, default=None, help="Generation config path.")
4545

4646
@classmethod
4747
def from_cli_args(cls, args: "Namespace") -> Self:
@@ -130,7 +130,7 @@ async def _generate(self, messages: List[Dict[str, str]], request_id: str, **gen
130130
stop_token_ids=self._generation_config.eos_token_id + gen_kwargs.pop("stop_token_ids", []),
131131
)
132132
result_generator = self._engine.generate(
133-
prompt=None, sampling_params=sampling_params, request_id=request_id, prompt_token_ids=input_ids
133+
inputs={"prompt_token_ids": input_ids}, sampling_params=sampling_params, request_id=request_id
134134
)
135135
return result_generator
136136

src/imitater/model/embed_model.py

+5 -5
Original file line number | Diff line number | Diff line change
@@ -32,11 +32,11 @@ class EmbedConfig:
3232

3333
@staticmethod
3434
def add_cli_args(parser: "ArgumentParser") -> None:
35-
parser.add_argument("--name", type=str, required=True)
36-
parser.add_argument("--path", type=str, required=True)
37-
parser.add_argument("--device", type=int, nargs="+", required=True)
38-
parser.add_argument("--port", type=int, required=True)
39-
parser.add_argument("--batch_size", type=int, default=64)
35+
parser.add_argument("--name", type=str, required=True, help="Model name.")
36+
parser.add_argument("--path", type=str, required=True, help="Model path or hub id.")
37+
parser.add_argument("--device", type=int, nargs="+", required=True, help="Device ids.")
38+
parser.add_argument("--port", type=int, required=True, help="API port.")
39+
parser.add_argument("--batch_size", type=int, default=64, help="Batch size.")
4040

4141
@classmethod
4242
def from_cli_args(cls, args: "Namespace") -> Self:

0 commit comments

Comments
 (0)