blob: 9710aca4aecda1c2a3f6722cc9b1e0c2aca9a8d8 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
|
pkgbase = ucto
pkgdesc = An advanced rule-based (regular-expression) and unicode-aware tokenizer for various languages. Tokenization is an essential first step in any NLP pipeline.
pkgver = 0.31
pkgrel = 1
url = https://languagemachines.github.io/ucto
arch = i686
arch = x86_64
license = GPL3
makedepends = libtool
makedepends = autoconf
makedepends = autoconf-archive
depends = ticcutils>=0.24
depends = icu
depends = libxml2
depends = libfolia>=2.4
depends = uctodata>=0.8
options = !libtool
source = https://github.com/LanguageMachines/ucto/archive/v0.31.tar.gz
md5sums = e4324aef10afbab47da943b1e2306598
pkgname = ucto
|