@@ -1419,34 +1419,35 @@ void ggml_metal_graph_compute(
14191419 default : GGML_ASSERT (false );
14201420 };
14211421
1422- [encoder setBuffer: id_src0 offset: offs_src0 atIndex: 0 ];
1423- [encoder setBuffer: id_src1 offset: offs_src1 atIndex: 1 ];
1424- [encoder setBuffer: id_dst offset: offs_dst atIndex: 2 ];
1425- [encoder setBytes: &ne00 length: sizeof ( int64_t ) atIndex: 3 ];
1426- [encoder setBytes: &ne01 length: sizeof ( int64_t ) atIndex: 4 ];
1427- [encoder setBytes: &ne02 length: sizeof ( int64_t ) atIndex: 5 ];
1428- [encoder setBytes: &ne03 length: sizeof ( int64_t ) atIndex: 6 ];
1429- [encoder setBytes: &nb00 length: sizeof (uint64_t ) atIndex: 7 ];
1430- [encoder setBytes: &nb01 length: sizeof (uint64_t ) atIndex: 8 ];
1431- [encoder setBytes: &nb02 length: sizeof (uint64_t ) atIndex: 9 ];
1432- [encoder setBytes: &nb03 length: sizeof (uint64_t ) atIndex: 10 ];
1433- [encoder setBytes: &ne0 length: sizeof ( int64_t ) atIndex: 11 ];
1434- [encoder setBytes: &ne1 length: sizeof ( int64_t ) atIndex: 12 ];
1435- [encoder setBytes: &ne2 length: sizeof ( int64_t ) atIndex: 13 ];
1436- [encoder setBytes: &ne3 length: sizeof ( int64_t ) atIndex: 14 ];
1437- [encoder setBytes: &nb0 length: sizeof (uint64_t ) atIndex: 15 ];
1438- [encoder setBytes: &nb1 length: sizeof (uint64_t ) atIndex: 16 ];
1439- [encoder setBytes: &nb2 length: sizeof (uint64_t ) atIndex: 17 ];
1440- [encoder setBytes: &nb3 length: sizeof (uint64_t ) atIndex: 18 ];
1441- [encoder setBytes: &n_past length: sizeof ( int ) atIndex: 19 ];
1442- [encoder setBytes: &n_dims length: sizeof ( int ) atIndex: 20 ];
1443- [encoder setBytes: &mode length: sizeof ( int ) atIndex: 21 ];
1444- [encoder setBytes: &freq_base length: sizeof (float ) atIndex: 22 ];
1445- [encoder setBytes: &freq_scale length: sizeof (float ) atIndex: 23 ];
1446- [encoder setBytes: &ext_factor length: sizeof (float ) atIndex: 24 ];
1447- [encoder setBytes: &attn_factor length: sizeof (float ) atIndex: 25 ];
1448- [encoder setBytes: &beta_fast length: sizeof (float ) atIndex: 26 ];
1449- [encoder setBytes: &beta_slow length: sizeof (float ) atIndex: 27 ];
1422+ [encoder setBuffer: id_src0 offset: offs_src0 atIndex: 0 ];
1423+ [encoder setBuffer: id_src1 offset: offs_src1 atIndex: 1 ];
1424+ [encoder setBuffer: id_dst offset: offs_dst atIndex: 2 ];
1425+ [encoder setBytes: &ne00 length: sizeof ( int64_t ) atIndex: 3 ];
1426+ [encoder setBytes: &ne01 length: sizeof ( int64_t ) atIndex: 4 ];
1427+ [encoder setBytes: &ne02 length: sizeof ( int64_t ) atIndex: 5 ];
1428+ [encoder setBytes: &ne03 length: sizeof ( int64_t ) atIndex: 6 ];
1429+ [encoder setBytes: &nb00 length: sizeof (uint64_t ) atIndex: 7 ];
1430+ [encoder setBytes: &nb01 length: sizeof (uint64_t ) atIndex: 8 ];
1431+ [encoder setBytes: &nb02 length: sizeof (uint64_t ) atIndex: 9 ];
1432+ [encoder setBytes: &nb03 length: sizeof (uint64_t ) atIndex: 10 ];
1433+ [encoder setBytes: &ne0 length: sizeof ( int64_t ) atIndex: 11 ];
1434+ [encoder setBytes: &ne1 length: sizeof ( int64_t ) atIndex: 12 ];
1435+ [encoder setBytes: &ne2 length: sizeof ( int64_t ) atIndex: 13 ];
1436+ [encoder setBytes: &ne3 length: sizeof ( int64_t ) atIndex: 14 ];
1437+ [encoder setBytes: &nb0 length: sizeof (uint64_t ) atIndex: 15 ];
1438+ [encoder setBytes: &nb1 length: sizeof (uint64_t ) atIndex: 16 ];
1439+ [encoder setBytes: &nb2 length: sizeof (uint64_t ) atIndex: 17 ];
1440+ [encoder setBytes: &nb3 length: sizeof (uint64_t ) atIndex: 18 ];
1441+ [encoder setBytes: &n_past length: sizeof ( int ) atIndex: 19 ];
1442+ [encoder setBytes: &n_dims length: sizeof ( int ) atIndex: 20 ];
1443+ [encoder setBytes: &mode length: sizeof ( int ) atIndex: 21 ];
1444+ [encoder setBytes: &n_orig_ctx length: sizeof ( int ) atIndex: 22 ];
1445+ [encoder setBytes: &freq_base length: sizeof ( float ) atIndex: 23 ];
1446+ [encoder setBytes: &freq_scale length: sizeof ( float ) atIndex: 24 ];
1447+ [encoder setBytes: &ext_factor length: sizeof ( float ) atIndex: 25 ];
1448+ [encoder setBytes: &attn_factor length: sizeof ( float ) atIndex: 26 ];
1449+ [encoder setBytes: &beta_fast length: sizeof ( float ) atIndex: 27 ];
1450+ [encoder setBytes: &beta_slow length: sizeof ( float ) atIndex: 28 ];
14501451
14511452 [encoder dispatchThreadgroups: MTLSizeMake (ne01, ne02, ne03) threadsPerThreadgroup: MTLSizeMake (nth, 1 , 1 )];
14521453 } break ;
0 commit comments