# Maintainer: Maarten van Gompel
#
# Arch Linux PKGBUILD for ucto. makepkg sources this file, reads the
# metadata variables below, then calls build() and package().

pkgname=ucto
pkgver=0.26
pkgrel=1
pkgdesc="An advanced rule-based (regular-expression) and unicode-aware tokenizer for various languages. Tokenization is an essential first step in any NLP pipeline."
arch=('i686' 'x86_64')
license=('GPL3')
depends=('ticcutils>=0.24' 'icu' 'libxml2' 'libfolia>=2.4' 'uctodata>=0.8')
makedepends=('libtool' 'autoconf' 'autoconf-archive')
# Quoted so the leading '!' is never subject to history expansion.
options=('!libtool')
_gituser="LanguageMachines"
_gitname="ucto"
url="https://languagemachines.github.io/ucto"
# The URL is derived from _gituser/_gitname/pkgver so that bumping pkgver
# fetches the matching release. The "name::" prefix stores the download
# under a package-specific filename instead of the generic "v<ver>.tar.gz".
source=("$pkgname-$pkgver.tar.gz::https://github.com/$_gituser/$_gitname/archive/v$pkgver.tar.gz")
# Checksum of the v0.26 tarball; must be regenerated whenever pkgver changes.
md5sums=('a98461026b2cd0584cfd824fe9c5624a')

# Configure and compile the extracted release tree under $srcdir.
build() {
  cd "$srcdir/$pkgname-$pkgver"
  # NOTE(review): bootstrap.sh is upstream's script; presumably it generates
  # ./configure from the autotools sources -- confirm against the tarball.
  bash bootstrap.sh
  ./configure --prefix=/usr --sysconfdir=/etc --localstatedir=/var
  make
}

# Install the built tree into the staging directory $pkgdir.
package() {
  cd "$srcdir/$pkgname-$pkgver"
  # Quoted so a build path containing whitespace stays a single argument.
  make DESTDIR="$pkgdir" install
}