Spaces:

Steven10429
/

apply_lora_and_quantize

Paused

llama.cpp

61b850a 10 months ago

135 Bytes

	#include "common.cuh"

	// Block-size constant associated with the clamp op.
	// NOTE(review): presumably the threads-per-block used when launching the clamp
	// kernel; the launch site is not visible in this header -- confirm in the .cu file.
	#define CUDA_CLAMP_BLOCK_SIZE 256

	// Declaration only; the definition is not part of this header.
	//   ctx - CUDA backend context, taken by non-const reference.
	//   dst - tensor handed to the op, taken by non-const pointer.
	// NOTE(review): by its name this is the CUDA backend's implementation of the clamp
	// op, presumably writing its result into dst and reading its input and the
	// min/max bounds from dst's own fields -- TODO confirm against the definition.
	void ggml_cuda_op_clamp(ggml_backend_cuda_context & ctx, ggml_tensor * dst);