pkgbase = llama.cpp-cuda-f16
	pkgdesc = Port of Facebook's LLaMA model in C/C++ (with NVIDIA CUDA optimizations and F16)
	pkgver = b6000
	pkgrel = 1
	url = https://github.com/ggerganov/llama.cpp
	arch = x86_64
	arch = armv7h
	arch = aarch64
	license = MIT
	makedepends = cmake
	makedepends = git
	depends = cuda
	depends = curl
	depends = gcc-libs
	depends = glibc
	depends = nvidia-utils
	depends = python
	depends = python-numpy
	depends = python-sentencepiece
	optdepends = python-pytorch
	provides = llama.cpp
	conflicts = llama.cpp
	conflicts = libggml
	conflicts = ggml
	options = lto
	options = !debug
	source = git+https://github.com/ggerganov/llama.cpp#tag=b6000
	source = llama.cpp.conf
	source = llama.cpp.service
	sha256sums = f04944bd1b63cffd589d0e130f778518a9283b5d2b4db3bd1266b683b05ec3c4
	sha256sums = 53fa70cfe40cb8a3ca432590e4f76561df0f129a31b121c9b4b34af0da7c4d87
	sha256sums = 0377d08a07bda056785981d3352ccd2dbc0387c4836f91fb73e6b790d836620d

pkgname = llama.cpp-cuda-f16
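
# Usage sketch (assumption, not part of the generated metadata above: this
# package is published on the AUR under the same pkgbase, so the standard
# clone-and-build workflow with makepkg would apply):
#
#   git clone https://aur.archlinux.org/llama.cpp-cuda-f16.git
#   cd llama.cpp-cuda-f16
#   makepkg -si   # resolves the cuda/nvidia-utils deps, builds, and installs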