blob: 8e90821f0f2d753ad6770a1ac782995786fbe428 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
|
# Maintainer: Maarten van Gompel <proycon at anaproy dot nl>
# Package identity. For a new upstream release bump pkgver (the source URL
# below is derived from it) and reset pkgrel to 1; bump pkgrel alone for
# packaging-only changes.
pkgname=ucto
pkgver=0.35
pkgrel=1
pkgdesc="An advanced rule-based (regular-expression) and unicode-aware tokenizer for various languages. Tokenization is an essential first step in any NLP pipeline."
arch=('i686' 'x86_64')
license=('GPL3')
# Runtime dependencies, with the minimum versions this release is built against.
depends=('ticcutils>=0.34' 'icu' 'libxml2' 'libfolia>=2.19' 'uctodata>=0.8')
# Build-time-only tools for the bootstrap/configure steps run in build().
makedepends=('libtool' 'autoconf' 'autoconf-archive')
# '!libtool' asks makepkg to strip libtool .la files from the package.
# Quoted so the leading '!' is always taken literally by the shell.
options=('!libtool')
# GitHub owner and repository; used to assemble the source URL.
_gituser="LanguageMachines"
_gitname="ucto"
url="https://languagemachines.github.io/ucto"
# The "name::url" form stores the download under a unique, versioned file name
# instead of GitHub's generic "v<version>.tar.gz", so it cannot collide with
# other packages in a shared SRCDEST. The URL follows pkgver automatically.
source=("${pkgname}-${pkgver}.tar.gz::https://github.com/${_gituser}/${_gitname}/archive/v${pkgver}.tar.gz")
# NOTE(review): md5 is a weak integrity check; consider switching to
# sha256sums (e.g. via updpkgsums) the next time the checksum is regenerated.
md5sums=('8baa7734a4c0b927fa33a29276000ffc')
# Generate the autotools build system, configure it for a system-wide
# install under /usr, and compile the extracted source tree.
# Globals:  srcdir, pkgname, pkgver (read)
# Returns:  non-zero if the source directory cannot be entered; otherwise the
#           exit status of the final make invocation.
build() {
  # Quoted so a build directory containing whitespace is not word-split;
  # bail out rather than running the build steps in the wrong directory.
  cd "$srcdir/$pkgname-$pkgver" || return 1
  bash bootstrap.sh
  ./configure --prefix=/usr --sysconfdir=/etc --localstatedir=/var
  make
}
# Install the already-built tree into the packaging root via DESTDIR.
# Globals:  srcdir, pkgname, pkgver, pkgdir (read)
# Returns:  non-zero if the source directory cannot be entered; otherwise the
#           exit status of make install.
package() {
  # Quoted so paths containing whitespace are not word-split; an unquoted
  # DESTDIR would otherwise be cut short and files installed to the wrong root.
  cd "$srcdir/$pkgname-$pkgver" || return 1
  make DESTDIR="$pkgdir" install
}
|