blob: 9c5912e3e94df235c04f250e974a828082fa1e51 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
|
# Package metadata for python-tensorrt-llm in flat "key = value" form.
# NOTE(review): this looks like an Arch Linux .SRCINFO, which is normally
# regenerated from the PKGBUILD rather than edited by hand - confirm before
# changing values here directly.
# Repeated keys (makedepends, depends, optdepends, source, sha256sums) each
# contribute one entry to a list; they are not overrides of one another.
pkgbase = python-tensorrt-llm
pkgdesc = TensorRT LLM provides users with an easy-to-use Python API to define Large Language Models (LLMs) and supports state-of-the-art optimizations to perform inference efficiently on NVIDIA GPUs
# Upstream release (pkgver) and packaging revision of that release (pkgrel).
# The same version string appears in the source archive name and URL below.
pkgver = 1.2.0rc4
pkgrel = 3
url = https://github.com/NVIDIA/TensorRT-LLM
arch = x86_64
license = Apache-2.0
# Build-time dependencies. cmake is the only entry with a version constraint.
makedepends = python-build
makedepends = python-installer
makedepends = python-setuptools
makedepends = cmake>=3.27
makedepends = conan
makedepends = ninja
makedepends = meson
makedepends = gcc
makedepends = git
makedepends = python-cutlass
# Runtime dependencies: Python packages first, then the CUDA/NVIDIA and
# networking libraries (cuda, cudnn, tensorrt, nccl, rdma-core) at the end.
depends = python
depends = python-pytorch-cuda
depends = python-numpy
depends = python-transformers
depends = python-tensorrt
depends = python-nvidia-modelopt
depends = python-accelerate
depends = python-diffusers
depends = python-onnx
depends = python-pillow
depends = python-sentencepiece
depends = python-psutil
depends = python-pydantic
depends = python-fastapi
depends = uvicorn
depends = python-click
depends = python-mpi4py
depends = python-pandas
depends = python-h5py
depends = python-openai
depends = python-pyzmq
depends = python-peft
depends = python-einops
depends = python-opencv
depends = python-soundfile
depends = python-tiktoken
depends = python-colored
depends = python-lark-parser
depends = python-pulp
depends = python-prometheus_client
depends = python-omegaconf
depends = python-wheel
depends = python-nvidia-ml-py
depends = python-torchvision
depends = python-optimum
depends = python-datasets
depends = python-mpmath
depends = python-starlette
depends = python-ordered-set
depends = python-pypatchelf
depends = python-jsonschema
depends = python-backoff
depends = python-matplotlib
depends = python-plotly
depends = python-numexpr
depends = python-triton
depends = python-nvtx
depends = cuda
depends = cudnn
depends = tensorrt
depends = nccl
depends = rdma-core
# Optional dependencies, written as "package: reason it is useful".
optdepends = python-evaluate: for evaluation metrics
optdepends = python-blobfile: for blob file operations
optdepends = triton-inference-server: for Triton deployment
# Sources. The first entry uses the "local-name::URL" form to give the
# downloaded tag archive a package-specific file name; the second entry has
# no URL, so it is presumably a patch file kept alongside the build recipe.
source = python-tensorrt-llm-1.2.0rc4.tar.gz::https://github.com/NVIDIA/TensorRT-LLM/archive/refs/tags/v1.2.0rc4.tar.gz
source = glog-0.7-compatibility.patch
# SHA-256 checksums, one per source entry; presumably matched to the source
# lines by position, so keep both lists in the same order.
sha256sums = 295dffddbd57f6a6b815969e42d171bd42140c3f2b15f68323fc4cac3e97d39a
sha256sums = 8227c455479f0013ebf65b2fd7541e19e66b323cdb6e2a65d5f4486622484e0e
# Start of the per-package section; only one package is listed, and it has
# the same name as pkgbase.
pkgname = python-tensorrt-llm
|