pkgbase = llama.cpp-cuda
	pkgdesc = Port of Facebook's LLaMA model in C/C++ (with NVIDIA CUDA optimizations)
	pkgver = b6482
	pkgrel = 1
	url = https://github.com/ggerganov/llama.cpp
	arch = x86_64
	arch = armv7h
	arch = aarch64
	license = MIT
	makedepends = cmake
	depends = cuda
	depends = curl
	depends = gcc-libs
	depends = glibc
	depends = nvidia-utils
	optdepends = python-numpy: needed for convert_hf_to_gguf.py
	optdepends = python-safetensors: needed for convert_hf_to_gguf.py
	optdepends = python-sentencepiece: needed for convert_hf_to_gguf.py
	optdepends = python-pytorch: needed for convert_hf_to_gguf.py
	optdepends = python-transformers: needed for convert_hf_to_gguf.py
	provides = llama.cpp
	conflicts = llama.cpp
	conflicts = libggml
	conflicts = ggml
	replaces = llama.cpp-cuda-f16
	source = llama.cpp-cuda-b6482.tar.gz::https://github.com/ggml-org/llama.cpp/archive/refs/tags/b6482.tar.gz
	source = llama.cpp.conf
	source = llama.cpp.service
	sha256sums = 1546fc2054f07f87cb8725765bf85feabc2ec52243a59673fddcb785f2c8a591
	sha256sums = 53fa70cfe40cb8a3ca432590e4f76561df0f129a31b121c9b4b34af0da7c4d87
	sha256sums = 0377d08a07bda056785981d3352ccd2dbc0387c4836f91fb73e6b790d836620d

pkgname = llama.cpp-cuda
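
For context: a .SRCINFO file is machine-generated metadata, produced from the
package's PKGBUILD rather than edited by hand. Below is a minimal sketch of a
PKGBUILD fragment that would yield the fields above. The real PKGBUILD is not
part of this file, so its structure and especially the build() options are
assumptions; GGML_CUDA=ON is llama.cpp's documented CMake switch for NVIDIA
builds, but the flags the actual package uses may differ.

    # Sketch only: reconstructed from the .SRCINFO above, not the real PKGBUILD.
    pkgname=llama.cpp-cuda
    pkgver=b6482
    pkgrel=1
    pkgdesc="Port of Facebook's LLaMA model in C/C++ (with NVIDIA CUDA optimizations)"
    arch=(x86_64 armv7h aarch64)
    url="https://github.com/ggerganov/llama.cpp"
    license=(MIT)
    makedepends=(cmake)
    depends=(cuda curl gcc-libs glibc nvidia-utils)
    optdepends=('python-numpy: needed for convert_hf_to_gguf.py'
                'python-safetensors: needed for convert_hf_to_gguf.py'
                'python-sentencepiece: needed for convert_hf_to_gguf.py'
                'python-pytorch: needed for convert_hf_to_gguf.py'
                'python-transformers: needed for convert_hf_to_gguf.py')
    provides=(llama.cpp)
    conflicts=(llama.cpp libggml ggml)
    replaces=(llama.cpp-cuda-f16)
    source=("llama.cpp-cuda-$pkgver.tar.gz::https://github.com/ggml-org/llama.cpp/archive/refs/tags/$pkgver.tar.gz"
            llama.cpp.conf
            llama.cpp.service)
    sha256sums=('1546fc2054f07f87cb8725765bf85feabc2ec52243a59673fddcb785f2c8a591'
                '53fa70cfe40cb8a3ca432590e4f76561df0f129a31b121c9b4b34af0da7c4d87'
                '0377d08a07bda056785981d3352ccd2dbc0387c4836f91fb73e6b790d836620d')

    build() {
        # GitHub tag archives extract to <repo>-<tag>, i.e. llama.cpp-b6482.
        # The CUDA flag is an assumption based on upstream's CMake options.
        cmake -B build -S "llama.cpp-$pkgver" -DCMAKE_BUILD_TYPE=Release -DGGML_CUDA=ON
        cmake --build build
    }

    package() {
        DESTDIR="$pkgdir" cmake --install build
    }

After changing any of these fields, the metadata and checksums are refreshed
with the standard Arch packaging tools:

    updpkgsums                          # from pacman-contrib: refresh sha256sums
    makepkg --printsrcinfo > .SRCINFO   # regenerate the metadata shown above
    makepkg -si                         # build and install the package locally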