Skip to content

Commit

Permalink
Update benchmark model URLs to use S3 URL instead of alias
Browse files Browse the repository at this point in the history
  • Loading branch information
namannandan committed Jun 5, 2024
1 parent b9a79fe commit b11c473
Show file tree
Hide file tree
Showing 2 changed files with 8 additions and 8 deletions.
8 changes: 4 additions & 4 deletions benchmarks/models_config/bert_neuronx.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
bert_neuronx_batch_1:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/BERTSeqClassification_torchscript_neuronx_batch_1.mar
url: https://torchserve.s3.amazonaws.com/mar_files/BERTSeqClassification_torchscript_neuronx_batch_1.mar
workers:
- 2
batch_delay: 100
Expand All @@ -19,7 +19,7 @@ bert_neuronx_batch_1:
bert_neuronx_batch_2:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/BERTSeqClassification_torchscript_neuronx_batch_2.mar
url: https://torchserve.s3.amazonaws.com/mar_files/BERTSeqClassification_torchscript_neuronx_batch_2.mar
workers:
- 2
batch_delay: 100
Expand All @@ -36,7 +36,7 @@ bert_neuronx_batch_2:
bert_neuronx_batch_4:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/BERTSeqClassification_torchscript_neuronx_batch_4.mar
url: https://torchserve.s3.amazonaws.com/mar_files/BERTSeqClassification_torchscript_neuronx_batch_4.mar
workers:
- 2
batch_delay: 100
Expand All @@ -53,7 +53,7 @@ bert_neuronx_batch_4:
bert_neuronx_batch_8:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/BERTSeqClassification_torchscript_neuronx_batch_8.mar
url: https://torchserve.s3.amazonaws.com/mar_files/BERTSeqClassification_torchscript_neuronx_batch_8.mar
workers:
- 2
batch_delay: 100
Expand Down
8 changes: 4 additions & 4 deletions benchmarks/models_config/opt_6.7b_neuronx.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
opt_6.7b_neuronx_batch_1:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/opt_6.7b_neuronx_batch_1.tar.gz
url: https://torchserve.s3.amazonaws.com/mar_files/opt_6.7b_neuronx_batch_1.tar.gz
workers:
- 1
batch_delay: 100
Expand All @@ -19,7 +19,7 @@ opt_6.7b_neuronx_batch_1:
opt_6.7b_neuronx_batch_2:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/opt_6.7b_neuronx_batch_2.tar.gz
url: https://torchserve.s3.amazonaws.com/mar_files/opt_6.7b_neuronx_batch_2.tar.gz
workers:
- 1
batch_delay: 100
Expand All @@ -36,7 +36,7 @@ opt_6.7b_neuronx_batch_2:
opt_6.7b_neuronx_batch_4:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/opt_6.7b_neuronx_batch_4.tar.gz
url: https://torchserve.s3.amazonaws.com/mar_files/opt_6.7b_neuronx_batch_4.tar.gz
workers:
- 1
batch_delay: 100
Expand All @@ -53,7 +53,7 @@ opt_6.7b_neuronx_batch_4:
opt_6.7b_neuronx_batch_8:
scripted_mode:
benchmark_engine: "ab"
url: https://torchserve.pytorch.org/mar_files/opt_6.7b_neuronx_batch_8.tar.gz
url: https://torchserve.s3.amazonaws.com/mar_files/opt_6.7b_neuronx_batch_8.tar.gz
workers:
- 1
batch_delay: 100
Expand Down

0 comments on commit b11c473

Please sign in to comment.