// File size: 392 Bytes
// 462dacf
#ifndef _rope_cuh
#define _rope_cuh
#include <cuda_runtime.h>
#include <cuda_fp16.h>
#include <cstdint>
#include "../tuning.h"
// Declaration of the host-callable entry point `rope_cuda`. Only the
// prototype lives in this header; the definition is provided elsewhere.
//
// NOTE(review): the name and the sin/cos arguments suggest this applies a
// rotary position embedding to `x` -- confirm against the definition.
//
// Parameters (semantics are not visible from this header; inferred items are
// marked as such):
//   tuningParams - pointer to an ExLlamaTuning object (presumably declared in
//                  ../tuning.h).
//   x            - the only non-const data pointer; presumably modified in
//                  place -- TODO confirm.
//   sin, cos     - read-only half-precision buffers.
//   bsz, rows, head_dim, num_heads, past_len
//                - integer arguments; presumably batch size, row count, head
//                  dimension, head count and an offset for previously
//                  processed positions -- verify against the definition.
//   alt_stream   - optional CUDA stream handle. Defaults to a null handle
//                  when omitted; how the definition treats a null handle is
//                  not visible here.
void rope_cuda
(
    ExLlamaTuning* tuningParams,
    half* x,
    const half* sin,
    const half* cos,
    const int bsz,
    const int rows,
    const int head_dim,
    const int num_heads,
    const int past_len,
    // nullptr instead of the NULL macro: same null handle, but type-safe and
    // independent of which header happens to define NULL.
    cudaStream_t alt_stream = nullptr
);
#endif // _rope_cuh