Skip to content

Commit

Permalink
Added the tuned TGI params
Browse files (browse the repository at this point in the history)
  • Loading branch information
Zhenzhong1 committed Oct 22, 2024
1 parent 24de14e commit a953632
Show file tree
Hide file tree
Showing 2 changed files with 11 additions and 2 deletions.
3 changes: 2 additions & 1 deletion ChatQnA/benchmark/performance/helm_charts/deployment.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ def generate_yaml(num_nodes, mode="oob", with_rerank="True"):
if num_nodes == 1:
replicas = [
{"name": "chatqna-backend-server-deploy", "replicas": 2},
{"name": "embedding-dependency-deploy", "replicas": 2},
{"name": "embedding-dependency-deploy", "replicas": 1},
{"name": "reranking-dependency-deploy", "replicas": 1} if with_rerank else None,
{"name": "llm-dependency-deploy", "replicas": 7 if with_rerank else 8},
{"name": "dataprep-deploy", "replicas": 1},
Expand Down Expand Up @@ -69,6 +69,7 @@ def generate_yaml(num_nodes, mode="oob", with_rerank="True"):
{
"name": "llm-dependency-deploy",
"args": [
{"name": "--model-id", "value": '$(LLM_MODEL_ID)'},
{"name": "--max-input-length", "value": 1280},
{"name": "--max-total-tokens", "value": 2048},
{"name": "--max-batch-total-tokens", "value": 35536},
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,9 +31,17 @@ spec:
- envFrom:
- configMapRef:
name: {{ $global.config.CONFIG_MAP_NAME }}

{{- $args := $microservice.args }}
{{- range $podSpec := $global.podSpecs }}
{{- if eq $podSpec.name $microservice.name }}
{{- $args = $podSpec.args | default $microservice.args }}
{{- end }}
{{- end }}

{{- if $microservice.args }}
args:
{{- range $arg := $microservice.args }}
{{- range $arg := $args }}
{{- if $arg.name }}
- {{ $arg.name }}
{{- end }}
Expand Down

0 comments on commit a953632

Please sign in to comment.