Skip to content

Commit

Permalink
Fix artifact path for presharding (#63)
Browse files Browse the repository at this point in the history
fix
  • Loading branch information
sunggg authored Nov 14, 2023
1 parent ce1a63e commit 33c5a88
Showing 1 changed file with 4 additions and 5 deletions.
9 changes: 4 additions & 5 deletions serve/mlc_serve/model/paged_cache_model.py
Original file line number Diff line number Diff line change
Expand Up @@ -327,11 +327,10 @@ def copy_to_worker_0(sess: di.Session, host_array):


 def get_tvm_model(artifact_path, model, quantization, num_shards, dev):
-    if num_shards > 1:
-        model_artifact_path = os.path.join(
-            artifact_path, f"{model}-{quantization}-presharded-{num_shards}gpu"
-        )
-    else:
+    model_artifact_path = os.path.join(
+        artifact_path, f"{model}-{quantization}-presharded-{num_shards}gpu"
+    )
+    if not os.path.exists(model_artifact_path):
         model_artifact_path = os.path.join(artifact_path, f"{model}-{quantization}")

     lib_path = os.path.join(model_artifact_path, f"{model}-{quantization}-cuda.so")
Expand Down

0 comments on commit 33c5a88

Please sign in to comment.