From f90bde8cd53c8120c59e7c1e6debfdd71614c02e Mon Sep 17 00:00:00 2001 From: weitao <51255903105@stu.ecnu.edu.cn> Date: Mon, 29 Apr 2024 07:09:55 +0000 Subject: [PATCH 1/2] improve Install via environment variable --- docs/install/mlc_llm.rst | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/docs/install/mlc_llm.rst b/docs/install/mlc_llm.rst index 7b64dce9fb..ce15616957 100644 --- a/docs/install/mlc_llm.rst +++ b/docs/install/mlc_llm.rst @@ -214,7 +214,9 @@ There are two ways to do so: .. code-tab :: bash Install via environment variable - export PYTHONPATH=/path-to-mlc-llm/python:$PYTHONPATH + export MLC_LLM_HOME=/path-to-mlc-llm + export PYTHONPATH=$MLC_LLM_HOME/python:$PYTHONPATH + alias mlc_llm="python -m mlc_llm" .. code-tab :: bash Install via pip local project From 19763a966a44925a0286b9d66b419156e2f42218 Mon Sep 17 00:00:00 2001 From: weitao <51255903105@stu.ecnu.edu.cn> Date: Sun, 5 May 2024 21:25:36 +0800 Subject: [PATCH 2/2] [HotFix] fix kv_cache_transpose_append buffer region --- python/mlc_llm/nn/kv_cache.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/mlc_llm/nn/kv_cache.py b/python/mlc_llm/nn/kv_cache.py index e4cbf1c047..e5cae1e5cd 100644 --- a/python/mlc_llm/nn/kv_cache.py +++ b/python/mlc_llm/nn/kv_cache.py @@ -399,7 +399,7 @@ def tir_kv_cache_transpose_append( pages[T.floordiv(position, 16), 0, vh, T.floormod(position, 16), vf] = k_data[vgpos, vh, vf] with T.block("v_transpose_append"): vgpos, vh, vf = T.axis.remap("SSS", [global_pos, h, f]) - T.reads(position_map[vgpos], k_data[vgpos, vh, vf]) + T.reads(position_map[vgpos], v_data[vgpos, vh, vf]) T.writes(pages[position_map[vgpos] // 16, 1, vh, position_map[vgpos] % 16, vf]) position: T.int32 = position_map[vgpos] # type: ignore[name-defined,no-redef] pages[T.floordiv(position, 16), 1, vh, T.floormod(position, 16), vf] = v_data[vgpos, vh, vf]