forked from singlestore-labs/private-llm-aws
-
Notifications
You must be signed in to change notification settings - Fork 0
/
vars.tf
157 lines (139 loc) · 3.37 KB
/
vars.tf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
# Container image URI for the API. Per its description, the API sits between
# SageMaker, client applications, and SingleStore.
# The block label is quoted to match every other variable in this file.
# NOTE(review): the default points at the `latest` tag, which is mutable, so the
# image actually pulled may differ between deploys — consider pinning a
# version tag or digest.
variable "api_image_uri" {
  description = "The API between SageMaker, Your Apps, and SingleStore"
  type        = string
  default     = "public.ecr.aws/n7b1f4b4/private_llm_fastapi_server:latest"
}
# Prefix string described as a naming prefix; defaults to "pllm".
# Where the prefix is consumed is not visible from this file.
variable "naming_prefix" {
  type        = string
  default     = "pllm"
  description = "Naming Prefix - ie pllm"
}
# HuggingFace task name; defaults to "text-generation".
variable "hf_task" {
  type        = string
  default     = "text-generation"
  description = "HuggingFace Task - ie text-generation"
}
# HuggingFace model identifier.
# Note: the example in the description (TheBloke/Llama-2-7B-GGUF) is not the
# default; the default is meta-llama/Llama-2-7b-chat-hf.
variable "hf_model_id" {
  type        = string
  default     = "meta-llama/Llama-2-7b-chat-hf"
  description = "HuggingFace Model ID - ie TheBloke/Llama-2-7B-GGUF"
}
# HuggingFace API token. Optional: defaults to null.
# Marked sensitive so Terraform redacts the value in plan/apply output.
# Caveats: the value is still written to state in plain text, and any output
# derived from this variable must itself be declared `sensitive = true`.
variable "hf_api_token" {
  description = "HuggingFace API Token"
  type        = string
  default     = null
  sensitive   = true
}
# Optional HuggingFace model revision; null by default (no revision supplied).
variable "hf_model_revision" {
  type        = string
  default     = null
  description = "HuggingFace Model Revision - allows you to pin to a specific version"
}
# Instance type string.
# Note: the example in the description (ml.g4dn.xlarge) is not the default;
# the default is ml.g4dn.12xlarge.
variable "instance_type" {
  type        = string
  default     = "ml.g4dn.12xlarge"
  description = "Instance Type - ie ml.g4dn.xlarge"
}
# Boolean switch for creating a SingleStore DB; off by default.
variable "create_db" {
  type        = bool
  default     = false
  description = "Create a SingleStore DB, defaults to false, expecting you might already have a database in place."
}
# Boolean switch for initializing the SingleStore DB schema; off by default.
variable "init_db" {
  type        = bool
  default     = false
  description = "Initialize the SingleStore DB with the Proper Schema, defaults to false, expecting you might already have a database in place."
}
# AWS settings bundled into a single object: access key ID, secret access key,
# region, and account ID. All fields are strings; only the region has a
# non-empty default ("us-west-2").
# NOTE(review): AWS_SECRET_ACCESS_KEY is a credential. The object is not marked
# `sensitive` here because that would also redact the region and account ID
# wherever they are used and could break existing outputs — consider splitting
# the secret into its own sensitive variable.
variable "aws" {
  description = "AWS access key ID, secret access key, region, and account ID"
  type = object({
    AWS_ACCESS_KEY_ID     = string
    AWS_SECRET_ACCESS_KEY = string
    AWS_REGION            = string
    AWS_ACCOUNT_ID        = string
  })
  default = {
    AWS_ACCESS_KEY_ID     = ""
    AWS_SECRET_ACCESS_KEY = ""
    AWS_REGION            = "us-west-2"
    AWS_ACCOUNT_ID        = ""
  }
}
# Name and description for a group, supplied as one object.
# The variable name contains a hyphen, so it is referenced as `var.pllm-group`;
# it is left as-is because renaming would break existing callers.
# NOTE(review): the kind of group (e.g. IAM) is not visible from this file.
variable "pllm-group" {
  description = "Group name and group description"
  type = object({
    group_name  = string
    description = string
  })
  default = {
    group_name  = "pllm-group"
    description = "Private LLM Group"
  }
}
# Names used for the API: user, role, repo, and service, supplied as one object.
# All defaults carry the "pllm-api" stem as literal strings.
variable "api" {
  description = "User, role, repo, and service names for the API"
  type = object({
    user_name    = string
    role_name    = string
    repo_name    = string
    service_name = string
  })
  default = {
    user_name    = "pllm-api-user"
    role_name    = "pllm-api-role"
    repo_name    = "pllm-api"
    service_name = "pllm-api-svc"
  }
}
# User and role names for the LLM deployer, supplied as one object.
# The variable name contains a hyphen, so it is referenced as
# `var.llm-deployer`; it is left as-is because renaming would break callers.
variable "llm-deployer" {
  description = "User and role names for the LLM deployer"
  type = object({
    user_name = string
    role_name = string
  })
  default = {
    user_name = "pllm-deployer"
    role_name = "pllm-deployer-role"
  }
}
# VPC and subnet settings: a name and a CIDR block for each.
# NOTE(review): both CIDR defaults are the same range (10.37.37.0/24), so the
# default subnet spans the entire default VPC range and leaves no room for a
# second subnet — confirm this is intended.
variable "vpc" {
  description = "VPC and subnet names and CIDR blocks"
  type = object({
    cidr_block        = string
    subnet_name       = string
    subnet_cidr_block = string
    vpc_name          = string
  })
  default = {
    cidr_block        = "10.37.37.0/24"
    subnet_name       = "private-llm-subnet"
    subnet_cidr_block = "10.37.37.0/24"
    vpc_name          = "private-llm-vpc"
  }
}
# SageMaker naming: a domain name and an execution role name, as one object.
variable "sagemaker" {
  description = "SageMaker domain name and execution role name"
  type = object({
    domain_name    = string
    exec_role_name = string
  })
  default = {
    domain_name    = "pllm-sagemaker-domain"
    exec_role_name = "pllm-sagemaker-exec-role"
  }
}
# Database host. Required: no default is declared, so a value must be supplied.
# NOTE(review): "s2" is read as SingleStore, based on the SingleStore DB wording
# in the create_db / init_db descriptions — confirm.
variable "s2_db_host" {
  description = "SingleStore database host"
  type        = string
}
# Database name. Required: no default is declared, so a value must be supplied.
# NOTE(review): "s2" is read as SingleStore, based on the SingleStore DB wording
# in the create_db / init_db descriptions — confirm.
variable "s2_db_name" {
  description = "SingleStore database name"
  type        = string
}
# Database user. Required: no default is declared, so a value must be supplied.
# NOTE(review): "s2" is read as SingleStore, based on the SingleStore DB wording
# in the create_db / init_db descriptions — confirm.
variable "s2_db_user" {
  description = "SingleStore database user"
  type        = string
}
# Database password. Required: no default is declared, so a value must be
# supplied.
# Marked sensitive so Terraform redacts the value in plan/apply output.
# Caveats: the value is still written to state in plain text, and any output
# derived from this variable must itself be declared `sensitive = true`.
# NOTE(review): "s2" is read as SingleStore, based on the SingleStore DB wording
# in the create_db / init_db descriptions — confirm.
variable "s2_db_pass" {
  description = "SingleStore database password"
  type        = string
  sensitive   = true
}