blob: 27be9182473cbf0e94d2cd838e819c9e1d6236aa (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
|
# Maintainer: Maarten van Gompel <proycon at anaproy dot nl>
# Package identity and version. pkgver is the single source of truth for the
# upstream release; the source URL below is derived from it.
pkgname=ucto
pkgver=0.34
pkgrel=1
pkgdesc="An advanced rule-based (regular-expression) and unicode-aware tokenizer for various languages. Tokenization is an essential first step in any NLP pipeline."
arch=('i686' 'x86_64')
license=('GPL3')

# Runtime and build-time dependencies.
depends=('ticcutils>=0.34' 'icu' 'libxml2' 'libfolia>=2.19' 'uctodata>=0.8')
makedepends=('libtool' 'autoconf' 'autoconf-archive')
options=('!libtool')

# Upstream GitHub coordinates, used to assemble the source URL.
_gituser="LanguageMachines"
_gitname="ucto"
url="https://languagemachines.github.io/ucto"

# The "name::url" form stores the download under a package-specific file name
# instead of the generic "v<version>.tar.gz". Only the local file name changes,
# so the checksum of the archive stays the same.
source=("$pkgname-$pkgver.tar.gz::https://github.com/$_gituser/$_gitname/archive/v$pkgver.tar.gz")
md5sums=('82cbc108e5783494202a5857513e85ef')
# Configure and compile the sources.
# Globals (read): srcdir, pkgname, pkgver - together they locate the
#                 unpacked source tree "$srcdir/$pkgname-$pkgver".
# Returns: non-zero if the source tree cannot be entered; otherwise the
#          status of the final make invocation.
build() {
  # Quoted so a build root containing whitespace is not word-split, and
  # guarded so nothing below runs in the wrong directory.
  cd "$srcdir/$pkgname-$pkgver" || return 1
  # Run the bootstrap script shipped in the source tree before ./configure.
  bash bootstrap.sh
  ./configure --prefix=/usr --sysconfdir=/etc --localstatedir=/var
  make
}
# Install the built tree into the staging directory.
# Globals (read): srcdir, pkgname, pkgver - locate the built source tree;
#                 pkgdir - staging root passed to make as DESTDIR.
# Returns: non-zero if the source tree cannot be entered; otherwise the
#          status of "make install".
package() {
  # Quoted so paths containing whitespace stay single words.
  cd "$srcdir/$pkgname-$pkgver" || return 1
  make DESTDIR="$pkgdir" install
}
|