blob: 8f9fad9eb8c9527e31568883750b6554c9c682a4 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
|
pkgbase = llama.cpp-cuda
pkgdesc = Port of Facebook's LLaMA model in C/C++ (with NVIDIA CUDA optimizations)
pkgver = b6490
pkgrel = 1
url = https://github.com/ggml-org/llama.cpp
arch = x86_64
arch = armv7h
arch = aarch64
license = MIT
makedepends = cmake
depends = cuda
depends = curl
depends = gcc-libs
depends = glibc
depends = nvidia-utils
optdepends = python-numpy: needed for convert_hf_to_gguf.py
optdepends = python-safetensors: needed for convert_hf_to_gguf.py
optdepends = python-sentencepiece: needed for convert_hf_to_gguf.py
optdepends = python-pytorch: needed for convert_hf_to_gguf.py
optdepends = python-transformers: needed for convert_hf_to_gguf.py
provides = llama.cpp
conflicts = llama.cpp
conflicts = libggml
conflicts = ggml
replaces = llama.cpp-cuda-f16
source = llama.cpp-cuda-b6490.tar.gz::https://github.com/ggml-org/llama.cpp/archive/refs/tags/b6490.tar.gz
source = llama.cpp.conf
source = llama.cpp.service
sha256sums = aef4fa45eb7ebc1f3e04744b465670dd006ad8db86de68234a6928de15050298
sha256sums = 53fa70cfe40cb8a3ca432590e4f76561df0f129a31b121c9b4b34af0da7c4d87
sha256sums = 0377d08a07bda056785981d3352ccd2dbc0387c4836f91fb73e6b790d836620d
pkgname = llama.cpp-cuda
|