@@ -1419,34 +1419,35 @@ void ggml_metal_graph_compute(
1419
1419
default : GGML_ASSERT (false );
1420
1420
};
1421
1421
1422
- [encoder setBuffer: id_src0 offset: offs_src0 atIndex: 0 ];
1423
- [encoder setBuffer: id_src1 offset: offs_src1 atIndex: 1 ];
1424
- [encoder setBuffer: id_dst offset: offs_dst atIndex: 2 ];
1425
- [encoder setBytes: &ne00 length: sizeof ( int64_t ) atIndex: 3 ];
1426
- [encoder setBytes: &ne01 length: sizeof ( int64_t ) atIndex: 4 ];
1427
- [encoder setBytes: &ne02 length: sizeof ( int64_t ) atIndex: 5 ];
1428
- [encoder setBytes: &ne03 length: sizeof ( int64_t ) atIndex: 6 ];
1429
- [encoder setBytes: &nb00 length: sizeof (uint64_t ) atIndex: 7 ];
1430
- [encoder setBytes: &nb01 length: sizeof (uint64_t ) atIndex: 8 ];
1431
- [encoder setBytes: &nb02 length: sizeof (uint64_t ) atIndex: 9 ];
1432
- [encoder setBytes: &nb03 length: sizeof (uint64_t ) atIndex: 10 ];
1433
- [encoder setBytes: &ne0 length: sizeof ( int64_t ) atIndex: 11 ];
1434
- [encoder setBytes: &ne1 length: sizeof ( int64_t ) atIndex: 12 ];
1435
- [encoder setBytes: &ne2 length: sizeof ( int64_t ) atIndex: 13 ];
1436
- [encoder setBytes: &ne3 length: sizeof ( int64_t ) atIndex: 14 ];
1437
- [encoder setBytes: &nb0 length: sizeof (uint64_t ) atIndex: 15 ];
1438
- [encoder setBytes: &nb1 length: sizeof (uint64_t ) atIndex: 16 ];
1439
- [encoder setBytes: &nb2 length: sizeof (uint64_t ) atIndex: 17 ];
1440
- [encoder setBytes: &nb3 length: sizeof (uint64_t ) atIndex: 18 ];
1441
- [encoder setBytes: &n_past length: sizeof ( int ) atIndex: 19 ];
1442
- [encoder setBytes: &n_dims length: sizeof ( int ) atIndex: 20 ];
1443
- [encoder setBytes: &mode length: sizeof ( int ) atIndex: 21 ];
1444
- [encoder setBytes: &freq_base length: sizeof (float ) atIndex: 22 ];
1445
- [encoder setBytes: &freq_scale length: sizeof (float ) atIndex: 23 ];
1446
- [encoder setBytes: &ext_factor length: sizeof (float ) atIndex: 24 ];
1447
- [encoder setBytes: &attn_factor length: sizeof (float ) atIndex: 25 ];
1448
- [encoder setBytes: &beta_fast length: sizeof (float ) atIndex: 26 ];
1449
- [encoder setBytes: &beta_slow length: sizeof (float ) atIndex: 27 ];
1422
+ [encoder setBuffer: id_src0 offset: offs_src0 atIndex: 0 ];
1423
+ [encoder setBuffer: id_src1 offset: offs_src1 atIndex: 1 ];
1424
+ [encoder setBuffer: id_dst offset: offs_dst atIndex: 2 ];
1425
+ [encoder setBytes: &ne00 length: sizeof ( int64_t ) atIndex: 3 ];
1426
+ [encoder setBytes: &ne01 length: sizeof ( int64_t ) atIndex: 4 ];
1427
+ [encoder setBytes: &ne02 length: sizeof ( int64_t ) atIndex: 5 ];
1428
+ [encoder setBytes: &ne03 length: sizeof ( int64_t ) atIndex: 6 ];
1429
+ [encoder setBytes: &nb00 length: sizeof (uint64_t ) atIndex: 7 ];
1430
+ [encoder setBytes: &nb01 length: sizeof (uint64_t ) atIndex: 8 ];
1431
+ [encoder setBytes: &nb02 length: sizeof (uint64_t ) atIndex: 9 ];
1432
+ [encoder setBytes: &nb03 length: sizeof (uint64_t ) atIndex: 10 ];
1433
+ [encoder setBytes: &ne0 length: sizeof ( int64_t ) atIndex: 11 ];
1434
+ [encoder setBytes: &ne1 length: sizeof ( int64_t ) atIndex: 12 ];
1435
+ [encoder setBytes: &ne2 length: sizeof ( int64_t ) atIndex: 13 ];
1436
+ [encoder setBytes: &ne3 length: sizeof ( int64_t ) atIndex: 14 ];
1437
+ [encoder setBytes: &nb0 length: sizeof (uint64_t ) atIndex: 15 ];
1438
+ [encoder setBytes: &nb1 length: sizeof (uint64_t ) atIndex: 16 ];
1439
+ [encoder setBytes: &nb2 length: sizeof (uint64_t ) atIndex: 17 ];
1440
+ [encoder setBytes: &nb3 length: sizeof (uint64_t ) atIndex: 18 ];
1441
+ [encoder setBytes: &n_past length: sizeof ( int ) atIndex: 19 ];
1442
+ [encoder setBytes: &n_dims length: sizeof ( int ) atIndex: 20 ];
1443
+ [encoder setBytes: &mode length: sizeof ( int ) atIndex: 21 ];
1444
+ [encoder setBytes: &n_orig_ctx length: sizeof ( int ) atIndex: 22 ];
1445
+ [encoder setBytes: &freq_base length: sizeof ( float ) atIndex: 23 ];
1446
+ [encoder setBytes: &freq_scale length: sizeof ( float ) atIndex: 24 ];
1447
+ [encoder setBytes: &ext_factor length: sizeof ( float ) atIndex: 25 ];
1448
+ [encoder setBytes: &attn_factor length: sizeof ( float ) atIndex: 26 ];
1449
+ [encoder setBytes: &beta_fast length: sizeof ( float ) atIndex: 27 ];
1450
+ [encoder setBytes: &beta_slow length: sizeof ( float ) atIndex: 28 ];
1450
1451
1451
1452
[encoder dispatchThreadgroups: MTLSizeMake (ne01, ne02, ne03) threadsPerThreadgroup: MTLSizeMake (nth, 1 , 1 )];
1452
1453
} break ;
0 commit comments