Skip to content

Commit

Permalink
chore: rename web_example_chat_completion.py to inference-api.py
Browse files: browse the repository at this point in the history
  • Loading branch information
ishaansehgal99 committed Oct 20, 2023
1 parent beec436 commit 3706150
Show file tree
Hide file tree
Showing 7 changed files with 6 additions and 6 deletions.
4 changes: 2 additions & 2 deletions pkg/inference/preset-inference-types.go
Original file line number Diff line number Diff line change
Expand Up @@ -40,8 +40,8 @@ var (
baseCommandPresetLlama2AChat = fmt.Sprintf("cd /workspace/llama/%s && torchrun", kaitov1alpha1.PresetLlama2AChat)
baseCommandPresetLlama2BChat = fmt.Sprintf("cd /workspace/llama/%s && torchrun", kaitov1alpha1.PresetLlama2BChat)
baseCommandPresetLlama2CChat = fmt.Sprintf("cd /workspace/llama/%s && torchrun", kaitov1alpha1.PresetLlama2CChat)
// llamaTextInferenceFile = "web_example_text_completion.py" TODO: To support Text Generation Llama Models
llamaChatInferenceFile = "web_example_chat_completion.py"
// llamaTextInferenceFile = "inference-api.py" TODO: To support Text Generation Llama Models
llamaChatInferenceFile = "inference-api.py"
llamaRunParams = map[string]string{
"max_seq_len": "512",
"max_batch_size": "8",
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ spec:
- |
echo "MASTER_ADDR: $MASTER_ADDR"
NODE_RANK=$(echo $HOSTNAME | grep -o '[^-]*$')
cd /workspace/llama/llama-2 && torchrun --nnodes 2 --nproc_per_node 1 --node_rank $NODE_RANK --master_addr $MASTER_ADDR --master_port 29500 web_example_chat_completion.py
cd /workspace/llama/llama-2 && torchrun --nnodes 2 --nproc_per_node 1 --node_rank $NODE_RANK --master_addr $MASTER_ADDR --master_port 29500 inference-api.py
resources:
limits:
nvidia.com/gpu: "1"
Expand Down
2 changes: 1 addition & 1 deletion presets/examples/llama-2-13b/llama-2-13b-statefulset.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ spec:
- |
echo "MASTER_ADDR: $MASTER_ADDR"
NODE_RANK=$(echo $HOSTNAME | grep -o '[^-]*$')
cd /workspace/llama/llama-2 && torchrun --nnodes 2 --nproc_per_node 1 --node_rank $NODE_RANK --master-addr $MASTER_ADDR --master-port 29500 web_example_text_completion.py
cd /workspace/llama/llama-2 && torchrun --nnodes 2 --nproc_per_node 1 --node_rank $NODE_RANK --master-addr $MASTER_ADDR --master-port 29500 inference-api.py
resources:
limits:
nvidia.com/gpu: "1"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@ spec:
command:
- /bin/sh
- -c
- cd /workspace/llama/llama-2 && torchrun web_example_chat_completion.py
- cd /workspace/llama/llama-2 && torchrun inference-api.py
resources:
limits:
nvidia.com/gpu: "1"
Expand Down
2 changes: 1 addition & 1 deletion presets/examples/llama-2-7b/llama-2-7b-statefulset.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@ spec:
command:
- /bin/sh
- -c
- cd /workspace/llama/llama-2 && torchrun web_example_text_completion.py
- cd /workspace/llama/llama-2 && torchrun inference-api.py
resources:
limits:
nvidia.com/gpu: "1"
Expand Down
File renamed without changes.
File renamed without changes.

0 comments on commit 3706150

Please sign in to comment.