blob: 4cf4024ad33da34a4362b289436c4cc29649b8be (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
|
pkgbase = llama.cpp-cuda-f16
pkgdesc = Port of Facebook's LLaMA model in C/C++ (with NVIDIA CUDA optimizations and f16)
pkgver = b4304
pkgrel = 1
url = https://github.com/ggerganov/llama.cpp
arch = x86_64
arch = armv7h
arch = aarch64
license = MIT
makedepends = cmake
makedepends = git
depends = blas-openblas
depends = blas64-openblas
depends = cuda
depends = curl
depends = gcc-libs
depends = glibc
depends = openmp
depends = python
depends = python-numpy
depends = python-sentencepiece
provides = llama.cpp
conflicts = llama.cpp
conflicts = libggml
options = lto
source = git+https://github.com/ggerganov/llama.cpp#tag=b4304
source = git+https://github.com/nomic-ai/kompute.git
source = llama.cpp.conf
source = llama.cpp.service
sha256sums = e371c57d56efce67ce33554bcabb3f2208bf05c81873b34303cb1948c83fba0f
sha256sums = SKIP
sha256sums = 53fa70cfe40cb8a3ca432590e4f76561df0f129a31b121c9b4b34af0da7c4d87
sha256sums = 0377d08a07bda056785981d3352ccd2dbc0387c4836f91fb73e6b790d836620d
pkgname = llama.cpp-cuda-f16
|