@@ -172,7 +172,7 @@ __device__ void paged_attention_kernel(
172172
173173 // Load the query to registers.
174174 // Each thread in a thread group has a different part of the query.
175- // For example, if the the thread group size is 4, then the first thread in
175+ // For example, if the thread group size is 4, then the first thread in
176176 // the group has vectors 0, 4, 8, ... of the query, and the second thread
177177 // has vectors 1, 5, 9, ... of the query, and so on. NOTE(woosuk): Because
178178 // q is split from a qkv tensor, it may not be contiguous.
@@ -259,7 +259,7 @@ __device__ void paged_attention_kernel(
259259
260260 // Load a key to registers.
261261 // Each thread in a thread group has a different part of the key.
262- // For example, if the the thread group size is 4, then the first thread in
262+ // For example, if the thread group size is 4, then the first thread in
263263 // the group has vectors 0, 4, 8, ... of the key, and the second thread
264264 // has vectors 1, 5, 9, ... of the key, and so on.
265265 for (int i = 0 ; i < NUM_TOKENS_PER_THREAD_GROUP; i++) {
0 commit comments