Skip to content

Instantly share code, notes, and snippets.

Embed
What would you like to do?
#lang rash
;; ASSUME: - this script is placed into apertium-all/
;; - hfst-covtest is in the PATH
;; USAGE: racket apertium-turkic-bilingual-stats.rkt > /tmp/bilingual 2>&1
;; REQUIRES: racket
;; rash (install with "raco pkg install rash")
;; Both tables are exported so that other modules can require them.
(provide MONOLINGUAL BILINGUAL)
;; MONOLINGUAL: immutable hash from a three-letter language code (a symbol)
;; to the relative directory of that language's monolingual package (a string
;; ending in "/"). The loop at the bottom of this script looks a code up with
;; hash-ref and prefixes the result with "../../", because at that point the
;; current directory is a bilingual pair directory two levels down.
;; NOTE(review): the paths appear to be relative to apertium-all/ (see the
;; ASSUME note in the header) -- confirm.
(define MONOLINGUAL
(hash
'alt "apertium-incubator/apertium-alt/"
'aze "apertium-incubator/apertium-aze/"
'bak "apertium-languages/apertium-bak/"
'chv "apertium-languages/apertium-chv/"
'crh "apertium-languages/apertium-crh/"
'gag "apertium-languages/apertium-gag/"
'kaa "apertium-languages/apertium-kaa/"
'kaz "apertium-languages/apertium-kaz/"
'kir "apertium-languages/apertium-kir/"
'kjh "apertium-incubator/apertium-kjh/"
'krc "apertium-incubator/apertium-krc/"
'kum "apertium-languages/apertium-kum/"
'nog "apertium-languages/apertium-nog/"
'ota "apertium-incubator/apertium-ota/"
'sah "apertium-languages/apertium-sah/"
'tat "apertium-languages/apertium-tat/"
'tuk "apertium-languages/apertium-tuk/"
'tur "apertium-languages/apertium-tur/"
'tyv "apertium-languages/apertium-tyv/"
'uig "apertium-languages/apertium-uig/"
'uzb "apertium-languages/apertium-uzb/"))
;; BILINGUAL: list of relative directories of the bilingual pair packages to
;; process, in the order they are processed.
;; Every entry must end in "xxx-yyy/" with two three-letter codes: the loop
;; below cuts the codes out of the string at fixed offsets from its end, and
;; both codes must be keys of MONOLINGUAL (hash-ref is called without a
;; default there).
(define BILINGUAL
'(
"apertium-incubator/apertium-chv-tat/"
"apertium-incubator/apertium-chv-tur/"
"apertium-trunk/apertium-crh-tur/"
"apertium-incubator/apertium-kaz-kaa/"
"apertium-nursery/apertium-kaz-kir/"
"apertium-nursery/apertium-kaz-kum/"
"apertium-incubator/apertium-kaz-sah/"
"apertium-trunk/apertium-kaz-tat/"
"apertium-incubator/apertium-kaz-tur/"
"apertium-incubator/apertium-kaz-tyv/"
"apertium-incubator/apertium-kaz-uig/"
"apertium-incubator/apertium-kir-uzb/"
"apertium-incubator/apertium-nog-kaz/"
"apertium-nursery/apertium-tat-bak/"
"apertium-incubator/apertium-tat-kaa/"
"apertium-incubator/apertium-tat-kir/"
"apertium-nursery/apertium-tuk-tur/"
"apertium-nursery/apertium-tur-aze/"
"apertium-nursery/apertium-tur-kir/"
"apertium-nursery/apertium-tur-tat/"
"apertium-nursery/apertium-tur-uzb/"
"apertium-incubator/apertium-uig-tur/"
"apertium-incubator/apertium-uzb-kaa/"))
;; Main loop: for every pair directory p in BILINGUAL, with the current
;; directory parameterized to p for the duration of the iteration:
;;   1. print the two language codes;
;;   2. git checkout master, git pull, and print the first line of git log;
;;   3. run ./autogen.sh pointing at the two monolingual directories, then
;;      make clean and make;
;;   4. run aq-covtest and hfst-covtest for lang1 -> lang2 on bible.destxt and
;;      then wiki.destxt, both read from lang1's monolingual directory;
;;   5. the same for lang2 -> lang1, reading from lang2's monolingual directory;
;;   6. print four newlines as a separator.
;; Each command group sits in its own with-handlers form: if the group raises
;; exn:fail?, the short message is displayed and the iteration carries on with
;; the next group.
;; NOTE(review): this relies on rash raising an exception when a command in a
;; {} block fails -- confirm against the rash documentation.
(for ([p BILINGUAL])
(parameterize ([current-directory p])
;; p ends in "xxx-yyy/": xxx is the 3 characters starting 8 from the end,
;; yyy the 3 characters just before the trailing slash.
(define lang1 (substring p (- (string-length p) 8) (- (string-length p) 5)))
(define lang2 (substring p (- (string-length p) 4) (- (string-length p) 1)))
;; Monolingual directories as seen from inside the pair directory, hence the
;; "../../" prefix. hash-ref has no default here, so a code that is missing
;; from MONOLINGUAL raises.
(define path1 (string-append "../../" (hash-ref MONOLINGUAL (string->symbol lang1))))
(define path2 (string-append "../../" (hash-ref MONOLINGUAL (string->symbol lang2))))
{echo $lang1 $lang2
(with-handlers ([exn:fail? (λ (exn) (display "git failed\n"))])
{git checkout master
git pull
git log | head -n1})
(with-handlers ([exn:fail? (λ (exn) (display "compilation failed\n"))])
{./autogen.sh --with-lang1=$path1 --with-lang2=$path2
make clean
make})
echo
echo bible coverage (values lang1) -> (values lang2)
(with-handlers ([exn:fail? (λ (exn) (display "covtest failed"))])
{aq-covtest (string-append path1 "bible.destxt") (string-append lang1 "-" lang2 ".automorf.bin")
hfst-covtest (string-append lang1 "-" lang2) . (string-append path1 "bible.destxt")})
echo wikipedia coverage (values lang1) -> (values lang2)
(with-handlers ([exn:fail? (λ (exn) (display "covtest failed"))])
{aq-covtest (string-append path1 "wiki.destxt") (string-append lang1 "-" lang2 ".automorf.bin")
hfst-covtest (string-append lang1 "-" lang2) . (string-append path1 "wiki.destxt")})
echo
echo bible coverage (values lang2) -> (values lang1)
(with-handlers ([exn:fail? (λ (exn) (display "covtest failed"))])
{aq-covtest (string-append path2 "bible.destxt") (string-append lang2 "-" lang1 ".automorf.bin")
hfst-covtest (string-append lang2 "-" lang1) . (string-append path2 "bible.destxt")})
echo wikipedia coverage (values lang2) -> (values lang1)
(with-handlers ([exn:fail? (λ (exn) (display "covtest failed"))])
{aq-covtest (string-append path2 "wiki.destxt") (string-append lang2 "-" lang1 ".automorf.bin")
hfst-covtest (string-append lang2 "-" lang1) . (string-append path2 "wiki.destxt")})
printf "\n\n\n\n"}))
#!/usr/bin/env bash
## ASSUME: - this script is placed into apertium-all/
##         - hfst-covtest is in the PATH
## USAGE: bash apertium-turkic-monolingual-stats.bash > /tmp/monolingual-log 2>&1

## 3-letter language code => Wikipedia prefix, for the modules that live in
## apertium-languages/. The literal string "false" marks a language for which
## the wikipedia coverage section is skipped.
declare -A LANGS=(
  ["tat"]="tt"   ["kaz"]="kk"   ["kir"]="ky"   ["crh"]="crh"
  ["tyv"]="tyv"  ["bak"]="ba"   ["chv"]="cv"   ["uzb"]="uz"
  ["kaa"]="kaa"  ["uig"]="ug"   ["sah"]="sah"  ["kum"]=false
  ["nog"]=false  ["gag"]="gag"  ["tuk"]="tk"   ["tur"]="tr"
)

## Same mapping for the modules that live in apertium-incubator/.
declare -A LANGSINCUBATOR=(
  ["krc"]="krc"  ["alt"]=false  ["kjh"]=false  ["ota"]=false  ["aze"]="az"
)

## File that collects the statistics (truncated at start-up, appended to
## for every language).
OUT=/tmp/monolingual-turkicstats
## stats GROUP ISO3
##   GROUP  "languages" or "incubator": selects the apertium-GROUP/ directory
##          and the prefix table (LANGS for "languages", LANGSINCUBATOR for
##          anything else).
##   ISO3   three-letter language code; the module directory is
##          apertium-GROUP/apertium-ISO3.
## Updates the module's git checkout, rebuilds it, and appends to $OUT:
## the first line of git log, a stem count, bible coverage and corpus size,
## and -- when the language has a Wikipedia prefix -- wikipedia coverage and
## corpus size. Failures of individual tools are not fatal; their output (or
## lack of it) simply ends up in $OUT / on the console.
## Globals: OUT, LANGS, LANGSINCUBATOR (all read only).
## Returns: non-zero if the module directory cannot be entered (nothing is
##          run in that case), otherwise the status of returning to the
##          starting directory.
stats () {
  local group=$1 lang=$2
  local module_dir="apertium-$group/apertium-$lang"
  # The corpora directory sits next to apertium-all/, i.e. three levels above
  # the module directory.
  local bible="../../../data4apertium/corpora/bible/$lang.txt"
  local start_dir=$PWD
  local prefix

  # Stop right here when the module is missing: otherwise git/make would run
  # in the wrong directory and the final directory change would walk out of
  # the tree, breaking every language processed afterwards.
  if ! cd "$module_dir"; then
    printf '%s: cannot enter %s, skipped\n\n' "$lang" "$module_dir" >> "$OUT"
    return 1
  fi

  printf '%s: ' "$lang" >> "$OUT"
  pwd
  git checkout master
  git pull
  git log | head -n1 >> "$OUT"

  printf 'stems: ' >> "$OUT"
  # count stems: lexc lines matching ':\w+.*;' that contain neither '<' nor '>'
  grep -E ":\w+.*;" "apertium-$lang.$lang.lexc" | grep -vc "[<>]" >> "$OUT"

  ./autogen.sh
  make clean; make

  ## bibles are in https://github.com/taruen/apertiumpp/tree/master/data4apertium/corpora/bible/
  printf 'bible coverage\n' >> "$OUT"
  apertium-destxt -n "$bible" > bible.destxt
  aq-covtest bible.destxt "$lang.automorf.bin" >> "$OUT" 2>&1
  hfst-covtest "$lang" . "$bible" >> "$OUT" 2>&1
  printf 'bible corpus size (tokens): ' >> "$OUT"
  wc -w "$bible" >> "$OUT"

  if [[ "$group" == "languages" ]]; then
    prefix="${LANGS[$lang]}"
  else
    prefix="${LANGSINCUBATOR[$lang]}"
  fi

  # "false" means the language has no Wikipedia; an empty prefix means the
  # language is not in the table at all, so there is no dump name to build.
  if [[ -n "$prefix" && "$prefix" != false ]]; then
    printf 'wikipedia coverage\n' >> "$OUT"
    # The extraction is only redone when no wiki.destxt is left over from an
    # earlier run.
    if ! [[ -f "wiki.destxt" ]]; then
      python3 ~/local/bin/wikiextractor.py --infn "${prefix}wiki-20190901-pages-articles-multistream.xml.bz2"
      apertium-destxt -n wiki.txt > wiki.destxt
    fi
    aq-covtest wiki.destxt "$lang.automorf.bin" >> "$OUT" 2>&1
    hfst-covtest "$lang" . wiki.txt >> "$OUT" 2>&1
    printf 'wikipedia corpus size (tokens): ' >> "$OUT"
    wc -w wiki.txt >> "$OUT"
  fi

  printf '\n' >> "$OUT"
  cd "$start_dir" || return
}
## Start from an empty stats file, then collect the statistics first for every
## module under apertium-languages/ and then for every module under
## apertium-incubator/ (associative-array key order, i.e. unspecified).
: > "$OUT"
for iso3 in "${!LANGS[@]}"; do
  stats "languages" "$iso3"
done
for iso3 in "${!LANGSINCUBATOR[@]}"; do
  stats "incubator" "$iso3"
done
chv tat
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 232a3031b106a312fe41ad21fea95db5851f0cb4
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-chv from ../../apertium-languages/apertium-chv/
Using apertium-tat from ../../apertium-languages/apertium-tat/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "chv-tat.autobil.bin tat-chv.autobil.bin chv-tat.automorf.bin chv-tat.autopgen.bin chv-tat.autogen.bin chv-tat.t1x.bin chv-tat.t2x.bin tat-chv.automorf.bin tat-chv.autopgen.bin tat-chv.autogen.bin tat-chv.autogen.hfst tat-chv.t1x.bin tat-chv.t2x.bin chv-tat.rlx.bin tat-chv.rlx.bin chv-tat.lrx.bin tat-chv.lrx.bin" || rm -f chv-tat.autobil.bin tat-chv.autobil.bin chv-tat.automorf.bin chv-tat.autopgen.bin chv-tat.autogen.bin chv-tat.t1x.bin chv-tat.t2x.bin tat-chv.automorf.bin tat-chv.autopgen.bin tat-chv.autogen.bin tat-chv.autogen.hfst tat-chv.t1x.bin tat-chv.t2x.bin chv-tat.rlx.bin tat-chv.rlx.bin chv-tat.lrx.bin tat-chv.lrx.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-chv-tat.chv-tat.dix
lt-comp lr apertium-chv-tat.chv-tat.dix chv-tat.autobil.bin
main@standard 34104 59904
apertium-validate-dictionary apertium-chv-tat.chv-tat.dix
lt-comp rl apertium-chv-tat.chv-tat.dix tat-chv.autobil.bin
main@standard 34106 59907
if [ ! -d .deps ]; then mkdir .deps; fi
touch .deps/.d
lt-print chv-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/chv-tat.autobil.att
hfst-txt2fst -e ε < .deps/chv-tat.autobil.att > .deps/chv-tat.autobil.hfst
hfst-project -p upper .deps/chv-tat.autobil.hfst > .deps/chv-tat.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/chv-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/chv-tat.autobil.prefixes
zcat ../../apertium-languages/apertium-chv//chv.automorf.att.gz | hfst-txt2fst > .deps/chv.automorf.hfst
hfst-compose-intersect -1 .deps/chv.automorf.hfst -2 .deps/chv-tat.autobil.prefixes -o .deps/chv-tat.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<gen>") in
transducer in file .deps/chv.automorf.hfst which are not found on the
input tapes of transducers in file .deps/chv-tat.autobil.prefixes.
hfst-fst2txt -i .deps/chv-tat.automorf.trimmed -o .deps/chv-tat.automorf.trimmed.att
lt-comp lr .deps/chv-tat.automorf.trimmed.att chv-tat.automorf.bin
main@standard 31747 72044
final@inconditional 22 45
apertium-validate-dictionary ../../apertium-languages/apertium-chv//apertium-chv.post-chv.dix
lt-comp lr ../../apertium-languages/apertium-chv//apertium-chv.post-chv.dix chv-tat.autopgen.bin
main@standard 9 114
cp ../../apertium-languages/apertium-tat//tat.autogen.bin chv-tat.autogen.bin
apertium-validate-transfer apertium-chv-tat.chv-tat.t1x
apertium-preprocess-transfer apertium-chv-tat.chv-tat.t1x chv-tat.t1x.bin
apertium-validate-transfer apertium-chv-tat.chv-tat.t2x
apertium-preprocess-transfer apertium-chv-tat.chv-tat.t2x chv-tat.t2x.bin
lt-print tat-chv.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-chv.autobil.att
hfst-txt2fst -e ε < .deps/tat-chv.autobil.att > .deps/tat-chv.autobil.hfst
hfst-project -p upper .deps/tat-chv.autobil.hfst > .deps/tat-chv.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tat-chv.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-chv.autobil.prefixes
zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-chv.autobil.prefixes -o .deps/tat-chv.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<punct>") in
transducer in file .deps/tat.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tat-chv.autobil.prefixes.
hfst-fst2txt -i .deps/tat-chv.automorf.trimmed -o .deps/tat-chv.automorf.trimmed.att
lt-comp lr .deps/tat-chv.automorf.trimmed.att tat-chv.automorf.bin
main@standard 128750 237561
final@inconditional 751 1598
apertium-validate-dictionary ../../apertium-languages/apertium-tat//apertium-tat.post-tat.dix
lt-comp lr ../../apertium-languages/apertium-tat//apertium-tat.post-tat.dix tat-chv.autopgen.bin
main@standard 9 114
cp ../../apertium-languages/apertium-chv//chv.autogen.bin tat-chv.autogen.bin
cp ../../apertium-languages/apertium-chv//chv.autogen.hfst tat-chv.autogen.hfst
apertium-validate-transfer apertium-chv-tat.tat-chv.t1x
apertium-preprocess-transfer apertium-chv-tat.tat-chv.t1x tat-chv.t1x.bin
apertium-validate-transfer apertium-chv-tat.tat-chv.t2x
apertium-preprocess-transfer apertium-chv-tat.tat-chv.t2x tat-chv.t2x.bin
cg-comp ../../apertium-languages/apertium-chv//apertium-chv.chv.rlx chv-tat.rlx.bin
Sections: 2, Rules: 6, Sets: 16, Tags: 41
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-chv.rlx.bin
Sections: 11, Rules: 123, Sets: 154, Tags: 194
lrx-comp apertium-chv-tat.chv-tat.lrx chv-tat.lrx.bin
1: 22@23
lrx-comp apertium-chv-tat.tat-chv.lrx tat-chv.lrx.bin
10: 142@157
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
cp *.mode modes/
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden
make: *** [Makefile:779: modes/chv-tat.mode] Fehler 1
bible coverage chv -> tat
Number of tokenised words in the corpus: 196766
Coverage: 86.62%
Top unknown words in the corpus:
1432 Иисус
462 Христос
379 чухне
272 Эй
248 Иисуса
236 пурте
162 нумай
136 Святой
125 Иоанн
123 Ҫавӑн
101 Акӑ
93 илтсен
92 никам
86 Моисей
86 пӗтӗмпех
80 нимӗн
78 иудейсем
77 ҫирӗплетсе
75 Израиль
75 кирек
Translation time: 2.321425199508667 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./chv-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage chv -> tat
Error: Malformed input stream.Number of tokenised words in the corpus: 693
Coverage: 83.26%
Top unknown words in the corpus:
2 тĕрĕк
2 Хуть
2 тĕрлĕрен
2 идиомсем
2 Чăвашла
2 тĕпченин
2 чăвашла
2 Халь
2 каяп
2 вĕрентӳ
2 япон
1 пăлхар
1 пĕртен
1 Пăлхарăн
1 хазар
1 вирьял
1 мĕшĕнче
1 палăртаççĕ
1 нимпех
1 уйралса
Translation time: 0.0467984676361084 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./chv-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage tat -> chv
Number of tokenised words in the corpus: 196071
Coverage: 86.16%
Top unknown words in the corpus:
1351 Гайсә
1126 Аллаһы
420 чөнки
403 Мәсих
390 Чөнки
380 кебек
372 иман
290 Раббы
288 Изге
283 Аллаһының
264 Аллаһыга
196 Гайсәнең
190 Паул
161 Гайсәне
159 Петер
137 аркылы
118 изге
113 Яхъя
112 яһүдләр
109 барысы
Translation time: 4.255837917327881 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-chv.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tat -> chv
Error: Malformed input stream.Number of tokenised words in the corpus: 26
Coverage: 65.38%
Top unknown words in the corpus:
1 Tatarça
1 İnternet
1 tulısınça
1 İnternetı
1 Respublikası
1 däwlät
1 tellärendä
1 tatar
1 häm
Translation time: 0.06401181221008301 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-chv.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
chv tur
Bereits auf 'master'
M tur-chv.prob
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 32735fc46542d31cf619410c4d884701381b18e5
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-chv from ../../apertium-languages/apertium-chv/
Using apertium-tur from ../../apertium-languages/apertium-tur/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "chv-tur.automorf.bin chv-tur.prob chv-tur.rlx.bin chv-tur.autobil.bin chv-tur.autolex.bin chv-tur.autogen.bin chv-tur.autopgen.bin chv-tur.t1x.bin chv-tur.t2x.bin chv-tur.t3x.bin tur-chv.automorf.bin tur-chv.prob tur-chv.rlx.bin tur-chv.autobil.bin tur-chv.autolex.bin tur-chv.autogen.bin tur-chv.autopgen.bin tur-chv.t1x.bin tur-chv.t2x.bin tur-chv.t3x.bin tur-chv.t4x.bin" || rm -f chv-tur.automorf.bin chv-tur.prob chv-tur.rlx.bin chv-tur.autobil.bin chv-tur.autolex.bin chv-tur.autogen.bin chv-tur.autopgen.bin chv-tur.t1x.bin chv-tur.t2x.bin chv-tur.t3x.bin tur-chv.automorf.bin tur-chv.prob tur-chv.rlx.bin tur-chv.autobil.bin tur-chv.autolex.bin tur-chv.autogen.bin tur-chv.autopgen.bin tur-chv.t1x.bin tur-chv.t2x.bin tur-chv.t3x.bin tur-chv.t4x.bin
rm -rf .deps modes
/bin/mkdir -p .deps
touch .deps/.d
/bin/zcat ../../apertium-languages/apertium-chv//chv.automorf.att.gz | hfst-txt2fst > .deps/chv.automorf.hfst
apertium-validate-dictionary apertium-chv-tur.chv-tur.dix
lt-comp lr apertium-chv-tur.chv-tur.dix chv-tur.autobil.bin
main@standard 308 462
nocomprovat@standard 21662 31014
notincrp@standard 90770 112482
lt-print chv-tur.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/chv-tur.autobil.att
hfst-txt2fst -e ε < .deps/chv-tur.autobil.att > .deps/chv-tur.autobil.hfst
hfst-project -p upper .deps/chv-tur.autobil.hfst > .deps/chv-tur.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/chv-tur.autobil.upper -2 .deps/any-symbol.hfst -o .deps/chv-tur.autobil.prefixes
hfst-compose-intersect -1 .deps/chv.automorf.hfst -2 .deps/chv-tur.autobil.prefixes -o .deps/chv-tur.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<abbr>") in
transducer in file .deps/chv.automorf.hfst which are not found on the
input tapes of transducers in file .deps/chv-tur.autobil.prefixes.
hfst-fst2txt -i .deps/chv-tur.automorf.trimmed -o .deps/chv-tur.automorf.trimmed.att
lt-comp lr .deps/chv-tur.automorf.trimmed.att chv-tur.automorf.bin
main@standard 408 857
final@inconditional 8 7
cp ../../apertium-languages/apertium-chv//chv.prob chv-tur.prob
cg-comp ../../apertium-languages/apertium-chv//apertium-chv.chv.rlx chv-tur.rlx.bin
Sections: 2, Rules: 6, Sets: 16, Tags: 41
lrx-comp apertium-chv-tur.chv-tur.lrx chv-tur.autolex.bin
4: 61@67
cp ../../apertium-languages/apertium-tur//tur.autogen.bin chv-tur.autogen.bin
cp ../../apertium-languages/apertium-tur//tur.autopgen.bin chv-tur.autopgen.bin
apertium-validate-transfer apertium-chv-tur.chv-tur.t1x
apertium-preprocess-transfer apertium-chv-tur.chv-tur.t1x chv-tur.t1x.bin
apertium-validate-interchunk apertium-chv-tur.chv-tur.t2x
apertium-preprocess-transfer apertium-chv-tur.chv-tur.t2x chv-tur.t2x.bin
apertium-validate-postchunk apertium-chv-tur.chv-tur.t3x
apertium-preprocess-transfer apertium-chv-tur.chv-tur.t3x chv-tur.t3x.bin
/bin/zcat ../../apertium-languages/apertium-tur//tur.automorf.att.gz | hfst-txt2fst > .deps/tur.automorf.hfst
apertium-validate-dictionary apertium-chv-tur.chv-tur.dix
lt-comp rl apertium-chv-tur.chv-tur.dix tur-chv.autobil.bin
main@standard 308 462
nocomprovat@standard 21662 31014
notincrp@standard 90770 112482
lt-print tur-chv.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tur-chv.autobil.att
hfst-txt2fst -e ε < .deps/tur-chv.autobil.att > .deps/tur-chv.autobil.hfst
hfst-project -p upper .deps/tur-chv.autobil.hfst > .deps/tur-chv.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tur-chv.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tur-chv.autobil.prefixes
hfst-compose-intersect -1 .deps/tur.automorf.hfst -2 .deps/tur-chv.autobil.prefixes -o .deps/tur-chv.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<quot>") in
transducer in file .deps/tur.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tur-chv.autobil.prefixes.
hfst-fst2txt -i .deps/tur-chv.automorf.trimmed -o .deps/tur-chv.automorf.trimmed.att
lt-comp lr .deps/tur-chv.automorf.trimmed.att tur-chv.automorf.bin
main@standard 308 308
final@inconditional 168 167
cp ../../apertium-languages/apertium-tur//tur.prob tur-chv.prob
cg-comp ../../apertium-languages/apertium-tur//apertium-tur.tur.rlx tur-chv.rlx.bin
Sections: 4, Rules: 102, Sets: 129, Tags: 127
2 rules cannot be skipped by index.
lrx-comp apertium-chv-tur.tur-chv.lrx tur-chv.autolex.bin
22: 328@369
cp ../../apertium-languages/apertium-chv//chv.autogen.bin tur-chv.autogen.bin
cp ../../apertium-languages/apertium-chv//chv.autopgen.bin tur-chv.autopgen.bin
apertium-validate-transfer apertium-chv-tur.tur-chv.t1x
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t1x tur-chv.t1x.bin
apertium-validate-interchunk apertium-chv-tur.tur-chv.t2x
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t2x tur-chv.t2x.bin
apertium-validate-postchunk apertium-chv-tur.tur-chv.t3x
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t3x tur-chv.t3x.bin
apertium-validate-transfer apertium-chv-tur.tur-chv.t4x
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t4x tur-chv.t4x.bin
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
lt-comp lr .deps/chv.automorf.bin.att .deps/chv.automorf.bin
main@standard 55063 140662
final@inconditional 105 261
lt-comp lr .deps/tur.automorf.bin.att .deps/tur.automorf.bin
main@standard 25060 57093
final@inconditional 635 2021
bible coverage chv -> tur
Number of tokenised words in the corpus: 142124
Coverage: 0.18%
Top unknown words in the corpus:
2912 те
2665 та
1489 Турӑ
1432 Иисус
1224 вара
929 Вӑл
869 тесе
778 ҫапла
742 каланӑ
740 Эпӗ
667 тата
666 вӗсем
661 ӑна
660 пӗр
648 тесен
645 сире
623 вӑл
617 мар
610 мӗн
590 тенӗ
Translation time: 0.3829376697540283 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./chv-tur.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage chv -> tur
Error: Malformed input stream.Number of tokenised words in the corpus: 537
Coverage: 0.19%
Top unknown words in the corpus:
17 Чăваш
13 те
10 чĕлхи
8 тата
8 чăваш
6 чĕлхе
6 чĕлхипе
5 чĕлхине
5 çине
5 та
4 пĕр
4 ытти
4 пулать
4 хальхи
3 йышĕ
3 чĕлхин
3 пек
3 хушшинчи
3 усă
3 вара
Translation time: 0.00605320930480957 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./chv-tur.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage tur -> chv
Number of tokenised words in the corpus: 322696
Coverage: 0.00%
Top unknown words in the corpus:
4764 ve
4035 bir
2738 için
2240 da
2098 de
1782 Tanrı
1686 Çünkü
1604 O
1562 nın
1505 İsrail
1460 gibi
1352 oğlu
1308 in
1238 ın
1236 bütün
1234 ya
1146 a
1124 bu
1115 dedi
1104 Ama
Translation time: 0.772911787033081 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tur-chv.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tur -> chv
Error: Malformed input stream.Number of tokenised words in the corpus: 14776
Coverage: 0.01%
Top unknown words in the corpus:
404 ve
348 Han
331 Cengiz
293 bir
148 ın
145 ile
124 da
124 Temuçin
119 için
108 in
103 de
92 olan
91 olarak
85 bu
76 sonra
71 Çin
63 en
59 a
59 Bu
58 büyük
Translation time: 0.07053613662719727 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tur-chv.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
crh tur
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit a48867598137559646089ed83798c2d37fb0c3a1
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-crh from ../../apertium-languages/apertium-crh/
Using apertium-tur from ../../apertium-languages/apertium-tur/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "crh-tur.automorf.bin crh-tur.prob crh-tur.rlx.bin crh-tur.autobil.bin crh-tur.autolex.bin crh-tur.autogen.bin crh-tur.autopgen.bin crh-tur.t1x.bin crh-tur.t2x.bin crh-tur.t3x.bin crh-tur.t4x.bin tur-crh.automorf.bin tur-crh.prob tur-crh.rlx.bin tur-crh.autobil.bin tur-crh.autolex.bin tur-crh.autogen.bin tur-crh.autopgen.bin tur-crh.t1x.bin tur-crh.t2x.bin tur-crh.t4x.bin tur-crh.t3x.bin" || rm -f crh-tur.automorf.bin crh-tur.prob crh-tur.rlx.bin crh-tur.autobil.bin crh-tur.autolex.bin crh-tur.autogen.bin crh-tur.autopgen.bin crh-tur.t1x.bin crh-tur.t2x.bin crh-tur.t3x.bin crh-tur.t4x.bin tur-crh.automorf.bin tur-crh.prob tur-crh.rlx.bin tur-crh.autobil.bin tur-crh.autolex.bin tur-crh.autogen.bin tur-crh.autopgen.bin tur-crh.t1x.bin tur-crh.t2x.bin tur-crh.t4x.bin tur-crh.t3x.bin
rm -rf .deps modes
/bin/mkdir -p .deps
touch .deps/.d
/bin/zcat ../../apertium-languages/apertium-crh//crh.automorf.att.gz | hfst-txt2fst > .deps/crh.automorf.hfst
apertium-validate-dictionary apertium-crh-tur.crh-tur.dix
lt-comp lr apertium-crh-tur.crh-tur.dix crh-tur.autobil.bin
main@standard 12695 19382
lt-print crh-tur.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/crh-tur.autobil.att
hfst-txt2fst -e ε < .deps/crh-tur.autobil.att > .deps/crh-tur.autobil.hfst
hfst-project -p upper .deps/crh-tur.autobil.hfst > .deps/crh-tur.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/crh-tur.autobil.upper -2 .deps/any-symbol.hfst -o .deps/crh-tur.autobil.prefixes
hfst-compose-intersect -1 .deps/crh.automorf.hfst -2 .deps/crh-tur.autobil.prefixes -o .deps/crh-tur.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<apos>") in
transducer in file .deps/crh.automorf.hfst which are not found on the
input tapes of transducers in file .deps/crh-tur.autobil.prefixes.
hfst-fst2txt -i .deps/crh-tur.automorf.trimmed -o .deps/crh-tur.automorf.trimmed.att
lt-comp lr .deps/crh-tur.automorf.trimmed.att crh-tur.automorf.bin
main@standard 83327 232963
final@inconditional 8152 14258
cp ../../apertium-languages/apertium-crh//crh.prob crh-tur.prob
cg-comp ../../apertium-languages/apertium-crh//apertium-crh.crh.rlx crh-tur.rlx.bin
Sections: 3, Rules: 72, Sets: 92, Tags: 96
2 rules cannot be skipped by index.
lrx-comp apertium-crh-tur.crh-tur.lrx crh-tur.autolex.bin
14: 298@335
cp ../../apertium-languages/apertium-tur//tur.autogen.bin crh-tur.autogen.bin
cp ../../apertium-languages/apertium-tur//tur.autopgen.bin crh-tur.autopgen.bin
apertium-validate-transfer apertium-crh-tur.crh-tur.t1x
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t1x crh-tur.t1x.bin
apertium-validate-interchunk apertium-crh-tur.crh-tur.t2x
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t2x crh-tur.t2x.bin
apertium-validate-postchunk apertium-crh-tur.crh-tur.t3x
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t3x crh-tur.t3x.bin
apertium-validate-transfer apertium-crh-tur.crh-tur.t4x
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t4x crh-tur.t4x.bin
/bin/zcat ../../apertium-languages/apertium-tur//tur.automorf.att.gz | hfst-txt2fst > .deps/tur.automorf.hfst
apertium-validate-dictionary apertium-crh-tur.crh-tur.dix
lt-comp rl apertium-crh-tur.crh-tur.dix tur-crh.autobil.bin
main@standard 12664 19312
lt-print tur-crh.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tur-crh.autobil.att
hfst-txt2fst -e ε < .deps/tur-crh.autobil.att > .deps/tur-crh.autobil.hfst
hfst-project -p upper .deps/tur-crh.autobil.hfst > .deps/tur-crh.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tur-crh.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tur-crh.autobil.prefixes
hfst-compose-intersect -1 .deps/tur.automorf.hfst -2 .deps/tur-crh.autobil.prefixes -o .deps/tur-crh.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<apos>") in
transducer in file .deps/tur.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tur-crh.autobil.prefixes.
hfst-fst2txt -i .deps/tur-crh.automorf.trimmed -o .deps/tur-crh.automorf.trimmed.att
lt-comp lr .deps/tur-crh.automorf.trimmed.att tur-crh.automorf.bin
main@standard 14064 28608
final@inconditional 2361 3820
cp ../../apertium-languages/apertium-tur//tur.prob tur-crh.prob
cg-comp ../../apertium-languages/apertium-tur//apertium-tur.tur.rlx tur-crh.rlx.bin
Sections: 4, Rules: 102, Sets: 129, Tags: 127
2 rules cannot be skipped by index.
lrx-comp apertium-crh-tur.tur-crh.lrx tur-crh.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-crh//crh.autogen.bin tur-crh.autogen.bin
cp ../../apertium-languages/apertium-crh//crh.autopgen.bin tur-crh.autopgen.bin
apertium-validate-transfer apertium-crh-tur.tur-crh.t1x
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t1x tur-crh.t1x.bin
apertium-validate-interchunk apertium-crh-tur.tur-crh.t2x
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t2x tur-crh.t2x.bin
apertium-validate-transfer apertium-crh-tur.tur-crh.t4x
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t4x tur-crh.t4x.bin
apertium-validate-postchunk apertium-crh-tur.tur-crh.t3x
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t3x tur-crh.t3x.bin
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
lt-comp lr .deps/crh.automorf.bin.att .deps/crh.automorf.bin
main@standard 112233 320968
final@inconditional 424 1452
lt-comp lr .deps/tur.automorf.bin.att .deps/tur.automorf.bin
main@standard 25060 57093
final@inconditional 635 2021
bible coverage crh -> tur
Number of tokenised words in the corpus: 108974
Coverage: 31.35%
Top unknown words in the corpus:
1566 ве
1022 Иса
910 бир
880 деди
729 ичюн
677 исе
624 эди
578 да
556 деп
505 Мен
501 бу
464 де
420 адам
352 оларгъа
339 не
336 Онынъ
319 Алланынъ
315 сонъ
296 Бу
285 оны
Translation time: 0.35404133796691895 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./crh-tur.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage crh -> tur
Number of tokenised words in the corpus: 4299
Coverage: 88.95%
Top unknown words in the corpus:
12 Amdi
10 Abibulla
8 Odabaş
5 Giraybay
5 nemse
4 cenkâver
4 Ablây
4 افغانستان
4 Afġānistān
4 askeriy
3 ci
3 Abeşistan
3 Aluston
3 Prinsligi
2 ac
2 ae
2 af
2 ag
2 ai
2 am
Translation time: 0.17180109024047852 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./crh-tur.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage tur -> crh
Number of tokenised words in the corpus: 396976
Coverage: 76.61%
Top unknown words in the corpus:
1782 Tanrı
1484 nın
1050 ın
921 a
832 Davut
671 dek
654 e
585 Yahuda
553 Ey
528 şöyle
505 Yeruşalim
487 Egemen
409 na
377 Tanrısı
375 la
359 i
355 Saul
347 ı
326 dan
318 ey
Translation time: 6.870069742202759 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tur-crh.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tur -> crh
Error: Malformed input stream.Number of tokenised words in the corpus: 16235
Coverage: 77.76%
Top unknown words in the corpus:
136 ın
124 Temuçin
51 a
40 ı
40 nin
39 i
34 Camuka
34 nın
33 Jin
33 Tuğrul
29 e
29 Cuci
27 Harezmşah
22 Cebe
17 Mukhulai
17 Subutay
16 Yesügey
15 Çağatay
14 Börte
14 Alaeddin
Translation time: 0.3534669876098633 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tur-crh.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kaz kaa
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 0ef5cdf2fe24b25d9c459751cfa1290f6214913f
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-kaa from ../../apertium-languages/apertium-kaa/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-kaa.autobil.bin kaa-kaz.autobil.bin kaz-kaa.automorf.bin kaz-kaa.autopgen.bin kaz-kaa.autogen.bin kaz-kaa.t1x.bin kaz-kaa.t2x.bin kaa-kaz.automorf.bin kaa-kaz.autopgen.bin kaa-kaz.autogen.bin kaa-kaz.t1x.bin kaa-kaz.t2x.bin kaz-kaa.rlx.bin kaa-kaz.rlx.bin kaz-kaa.lrx.bin kaa-kaz.lrx.bin" || rm -f kaz-kaa.autobil.bin kaa-kaz.autobil.bin kaz-kaa.automorf.bin kaz-kaa.autopgen.bin kaz-kaa.autogen.bin kaz-kaa.t1x.bin kaz-kaa.t2x.bin kaa-kaz.automorf.bin kaa-kaz.autopgen.bin kaa-kaz.autogen.bin kaa-kaz.t1x.bin kaa-kaz.t2x.bin kaz-kaa.rlx.bin kaa-kaz.rlx.bin kaz-kaa.lrx.bin kaa-kaz.lrx.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kaz-kaa.kaz-kaa.dix
lt-comp lr apertium-kaz-kaa.kaz-kaa.dix kaz-kaa.autobil.bin
main@standard 10901 15943
apertium-validate-dictionary apertium-kaz-kaa.kaz-kaa.dix
lt-comp rl apertium-kaz-kaa.kaz-kaa.dix kaa-kaz.autobil.bin
main@standard 10887 15926
if [ ! -d .deps ]; then mkdir .deps; fi
touch .deps/.d
lt-print kaz-kaa.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-kaa.autobil.att
hfst-txt2fst -e ε < .deps/kaz-kaa.autobil.att > .deps/kaz-kaa.autobil.hfst
hfst-project -p upper .deps/kaz-kaa.autobil.hfst > .deps/kaz-kaa.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-kaa.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-kaa.autobil.prefixes
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-kaa.autobil.prefixes -o .deps/kaz-kaa.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<ltr>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-kaa.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-kaa.automorf.trimmed -o .deps/kaz-kaa.automorf.trimmed.att
lt-comp lr .deps/kaz-kaa.automorf.trimmed.att kaz-kaa.automorf.bin
main@standard 181934 412306
final@inconditional 2634 7472
apertium-validate-dictionary apertium-kaz-kaa.post-kaz.dix
lt-comp lr apertium-kaz-kaa.post-kaz.dix kaz-kaa.autopgen.bin
main@standard 10 149
cp ../../apertium-languages/apertium-kaa//kaa.autogen.bin kaz-kaa.autogen.bin
apertium-validate-transfer apertium-kaz-kaa.kaz-kaa.t1x
apertium-preprocess-transfer apertium-kaz-kaa.kaz-kaa.t1x kaz-kaa.t1x.bin
apertium-validate-transfer apertium-kaz-kaa.kaz-kaa.t2x
apertium-preprocess-transfer apertium-kaz-kaa.kaz-kaa.t2x kaz-kaa.t2x.bin
lt-print kaa-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaa-kaz.autobil.att
hfst-txt2fst -e ε < .deps/kaa-kaz.autobil.att > .deps/kaa-kaz.autobil.hfst
hfst-project -p upper .deps/kaa-kaz.autobil.hfst > .deps/kaa-kaz.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaa-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaa-kaz.autobil.prefixes
zcat ../../apertium-languages/apertium-kaa//kaa.automorf.att.gz | hfst-txt2fst > .deps/kaa.automorf.hfst
hfst-compose-intersect -1 .deps/kaa.automorf.hfst -2 .deps/kaa-kaz.autobil.prefixes -o .deps/kaa-kaz.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<subst>") in
transducer in file .deps/kaa.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaa-kaz.autobil.prefixes.
hfst-fst2txt -i .deps/kaa-kaz.automorf.trimmed -o .deps/kaa-kaz.automorf.trimmed.att
lt-comp lr .deps/kaa-kaz.automorf.trimmed.att kaa-kaz.automorf.bin
main@standard 11323 20644
final@inconditional 444 1655
apertium-validate-dictionary apertium-kaz-kaa.post-kaa.dix
lt-comp lr apertium-kaz-kaa.post-kaa.dix kaa-kaz.autopgen.bin
main@standard 9 114
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin kaa-kaz.autogen.bin
apertium-validate-transfer apertium-kaz-kaa.kaa-kaz.t1x
apertium-preprocess-transfer apertium-kaz-kaa.kaa-kaz.t1x kaa-kaz.t1x.bin
apertium-validate-transfer apertium-kaz-kaa.kaa-kaz.t2x
apertium-preprocess-transfer apertium-kaz-kaa.kaa-kaz.t2x kaa-kaz.t2x.bin
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-kaa.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
cg-comp ../../apertium-languages/apertium-kaa//apertium-kaa.kaa.rlx kaa-kaz.rlx.bin
Sections: 1, Rules: 1, Sets: 5, Tags: 23
lrx-comp apertium-kaz-kaa.kaz-kaa.lrx kaz-kaa.lrx.bin
6: 99@109
lrx-comp apertium-kaz-kaa.kaa-kaz.lrx kaa-kaz.lrx.bin
1: 19@19
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
cp *.mode modes/
bible coverage kaz -> kaa
Number of tokenised words in the corpus: 214563
Coverage: 92.41%
Top unknown words in the corpus:
1268 Иса
323 Мәсіх
284 Исаның
246 Мәсіхтің
211 Ізгі
175 Исаға
151 Исаны
150 Петір
136 Пауыл
129 Таурат
103 Мәсіхке
83 Жақия
79 Мұса
68 Ыбырайым
66 яһудилер
65 парызшылдар
64 Шимон
63 немесе
62 Иерусалимге
59 Мәсіхпен
Translation time: 6.704168081283569 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-kaa.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> kaa
Error: Malformed input stream.Number of tokenised words in the corpus: 2952
Coverage: 88.52%
Top unknown words in the corpus:
8 оңт
5 ның
5 Украина
5 солт
4 Каспий
3 Алтай
3 Сібір
3 Тянь
3 Шань
3 Еділ
3 одақтық
3 м
2 Қызылқұм
2 Сібірдің
2 мыңжылдық
2 тайпалық
2 ғұндар
2 аумағындағы
2 Оғыз
2 жоспарлық
Translation time: 0.2152414321899414 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-kaa.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage kaa -> kaz
Number of tokenised words in the corpus: 188496
Coverage: 88.24%
Top unknown words in the corpus:
1223 İysa
520 Muxaddes
408 ytkeni
353 Masix
346 A
294 İysanıń
214 z
212 hámme
183 Masixtıń
172 hámmesi
172 ǵo
168 İysaǵa
161 Petr
153 İysanı
148 Pavel
142 atırǵan
139 zi
112 qalay
108 Háy
106 muxaddes
Translation time: 2.959629535675049 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaa-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaa -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 4
Coverage: 100.00%
Top unknown words in the corpus:
Translation time: 0.010514259338378906 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaa-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kaz kir
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 34dd3475c6103f173f6f4b443155486a7231b0b7
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-kir from ../../apertium-languages/apertium-kir/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-kir.autobil.bin kir-kaz.autobil.bin kaz-kir.automorf.bin kaz-kir.autopgen.bin kaz-kir.autogen.bin kaz-kir.t1x.bin kaz-kir.t2x.bin kir-kaz.automorf.bin kir-kaz.autopgen.bin kir-kaz.autogen.bin kir-kaz.t1x.bin kir-kaz.t2x.bin kaz-kir.rlx.bin kir-kaz.rlx.bin kaz-kir.autolex.bin kir-kaz.autolex.bin kaz-kir.autoseq.bin kir-kaz.autoseq.bin kaz-kir.revautoseq.bin kir-kaz.revautoseq.bin" || rm -f kaz-kir.autobil.bin kir-kaz.autobil.bin kaz-kir.automorf.bin kaz-kir.autopgen.bin kaz-kir.autogen.bin kaz-kir.t1x.bin kaz-kir.t2x.bin kir-kaz.automorf.bin kir-kaz.autopgen.bin kir-kaz.autogen.bin kir-kaz.t1x.bin kir-kaz.t2x.bin kaz-kir.rlx.bin kir-kaz.rlx.bin kaz-kir.autolex.bin kir-kaz.autolex.bin kaz-kir.autoseq.bin kir-kaz.autoseq.bin kaz-kir.revautoseq.bin kir-kaz.revautoseq.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kaz-kir.kaz-kir.dix
lt-comp lr apertium-kaz-kir.kaz-kir.dix kaz-kir.autobil.bin
main@standard 13606 31838
apertium-validate-dictionary apertium-kaz-kir.kaz-kir.dix
lt-comp rl apertium-kaz-kir.kaz-kir.dix kir-kaz.autobil.bin
main@standard 13574 31782
/bin/mkdir -p .deps
touch .deps/.d
lt-print kaz-kir.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-kir.autobil.att
hfst-txt2fst -e ε < .deps/kaz-kir.autobil.att > .deps/kaz-kir.autobil.hfst
hfst-project -p upper .deps/kaz-kir.autobil.hfst > .deps/kaz-kir.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-kir.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-kir.autobil.prefixes
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-kir.autobil.prefixes -o .deps/kaz-kir.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<ltr>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-kir.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-kir.automorf.trimmed -o .deps/kaz-kir.automorf.trimmed.att
lt-comp lr .deps/kaz-kir.automorf.trimmed.att kaz-kir.automorf.bin
main@standard 167998 377602
final@inconditional 41 67
apertium-validate-dictionary apertium-kaz-kir.post-kaz.dix
lt-comp lr apertium-kaz-kir.post-kaz.dix kaz-kir.autopgen.bin
main@standard 10 149
cp ../../apertium-languages/apertium-kir//kir.autogen.bin kaz-kir.autogen.bin
apertium-validate-transfer apertium-kaz-kir.kaz-kir.t1x
apertium-preprocess-transfer apertium-kaz-kir.kaz-kir.t1x kaz-kir.t1x.bin
apertium-validate-transfer apertium-kaz-kir.kaz-kir.t2x
apertium-preprocess-transfer apertium-kaz-kir.kaz-kir.t2x kaz-kir.t2x.bin
lt-print kir-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kir-kaz.autobil.att
hfst-txt2fst -e ε < .deps/kir-kaz.autobil.att > .deps/kir-kaz.autobil.hfst
hfst-project -p upper .deps/kir-kaz.autobil.hfst > .deps/kir-kaz.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kir-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kir-kaz.autobil.prefixes
zcat ../../apertium-languages/apertium-kir//kir.automorf.att.gz | hfst-txt2fst > .deps/kir.automorf.hfst
hfst-compose-intersect -1 .deps/kir.automorf.hfst -2 .deps/kir-kaz.autobil.prefixes -o .deps/kir-kaz.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<percent>") in
transducer in file .deps/kir.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kir-kaz.autobil.prefixes.
hfst-fst2fst -O .deps/kir-kaz.automorf.trimmed -o kir-kaz.automorf.bin
hfst-fst2txt -i .deps/kir-kaz.automorf.trimmed -o .deps/kir-kaz.automorf.trimmed.att
lt-comp lr .deps/kir-kaz.automorf.trimmed.att kir-kaz.automorf.bin
main@standard 22176 46844
final@inconditional 16 34
apertium-validate-dictionary apertium-kaz-kir.post-kir.dix
lt-comp lr apertium-kaz-kir.post-kir.dix kir-kaz.autopgen.bin
main@standard 16 356
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin kir-kaz.autogen.bin
apertium-validate-transfer apertium-kaz-kir.kir-kaz.t1x
apertium-preprocess-transfer apertium-kaz-kir.kir-kaz.t1x kir-kaz.t1x.bin
apertium-validate-transfer apertium-kaz-kir.kir-kaz.t2x
apertium-preprocess-transfer apertium-kaz-kir.kir-kaz.t2x kir-kaz.t2x.bin
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-kir.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
cg-comp ../../apertium-languages/apertium-kir//apertium-kir.kir.rlx kir-kaz.rlx.bin
Sections: 3, Rules: 71, Sets: 102, Tags: 126
lrx-comp apertium-kaz-kir.kaz-kir.lrx kaz-kir.autolex.bin
58: 963@1073
lrx-comp apertium-kaz-kir.kir-kaz.lrx kir-kaz.autolex.bin
2: 25@26
lsx-comp lr apertium-kaz-kir.kaz-kir.lsx kaz-kir.autoseq.bin
main@standard 47 50
lsx-comp lr apertium-kaz-kir.kir-kaz.lsx kir-kaz.autoseq.bin
main@standard 97 108
lsx-comp rl apertium-kaz-kir.kaz-kir.lsx kaz-kir.revautoseq.bin
main@standard 47 50
lsx-comp rl apertium-kaz-kir.kir-kaz.lsx kir-kaz.revautoseq.bin
main@standard 97 108
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
apertium-createmodes.awk: modes/kaz-kir-autoseq.mode seen twice
apertium-createmodes.awk: modes/@kaz-kir-autoseq.mode seen twice
apertium-createmodes.awk: modes/kir-kaz-autoseq.mode seen twice
apertium-createmodes.awk: modes/@kir-kaz-autoseq.mode seen twice
bible coverage kaz -> kir
Number of tokenised words in the corpus: 214330
Coverage: 92.64%
Top unknown words in the corpus:
66 яһудилер
65 парызшылдар
63 немесе
53 сиынып
50 сеніп
50 Пилат
49 өтінді
49 Жохан
48 бетер
44 Аумин
43 Ирод
43 ертіп
41 Яһудея
39 әзәзіл
36 яһудилердің
35 адалдығын
35 дүниелік
34 Матай
34 гөр
32 Ғалилея
Translation time: 6.111989498138428 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-kir.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> kir
Error: Malformed input stream.Number of tokenised words in the corpus: 2937
Coverage: 90.19%
Top unknown words in the corpus:
5 ның
3 ге
3 одақтық
3 қалыптасқан
3 оңт
2 Қызылқұм
2 мыңжылдық
2 тайпалық
2 ғұндар
2 ғ
2 Оғыз
2 жоспарлық
2 өнеркәсіптік
2 өндірушісі
2 Беловеж
2 ны
2 сессиясында
2 құрлығының
2 с
2 қоңыржай
Translation time: 0.20651888847351074 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-kir.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage kir -> kaz
Number of tokenised words in the corpus: 203725
Coverage: 89.17%
Top unknown words in the corpus:
1279 Ыйса
946 Кудай
597 Кудайдын
380 Машаяк
362 Ыйсанын
305 Кудайга
208 Ыйсаны
184 Ыйсага
174 Машаяктын
163 Пабыл
94 Кудайды
92 улам
90 Кудайдан
83 Жакыя
68 таалим
66 иудей
65 динкызматчылар
64 Машаякка
63 Пабылдын
62 фарисейлер
Translation time: 5.053615570068359 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kir-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kir -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 9337
Coverage: 85.91%
Top unknown words in the corpus:
15 С
10 К
10 көл
10 Көлдүн
8 б
8 Б
7 комплекстик
7 Н
7 Көл
6 дээрлик
6 закон
6 СССРдин
6 ИАнын
6 Борбордук
6 Кыргызжер
6 Сулайман
5 П
5 В
5 ландшафт
5 ээлеген
Translation time: 0.25955748558044434 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kir-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kaz kum
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 061a225d1c6d235e04fd492f6064fa7616409281
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-kum from ../../apertium-languages/apertium-kum/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-kum.autobil.bin kum-kaz.autobil.bin kaz-kum.automorf.bin kaz-kum.autopgen.bin kaz-kum.autogen.bin kaz-kum.t1x.bin kaz-kum.t2x.bin kaz-kum.rlx.bin kum-kaz.rlx.bin kaz-kum.lrx.bin " || rm -f kaz-kum.autobil.bin kum-kaz.autobil.bin kaz-kum.automorf.bin kaz-kum.autopgen.bin kaz-kum.autogen.bin kaz-kum.t1x.bin kaz-kum.t2x.bin kaz-kum.rlx.bin kum-kaz.rlx.bin kaz-kum.lrx.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kaz-kum.kaz-kum.dix
lt-comp lr apertium-kaz-kum.kaz-kum.dix kaz-kum.autobil.bin
main@standard 1671 2288
apertium-validate-dictionary apertium-kaz-kum.kaz-kum.dix
lt-comp rl apertium-kaz-kum.kaz-kum.dix kum-kaz.autobil.bin
main@standard 1653 2265
if [ ! -d .deps ]; then mkdir .deps; fi
touch .deps/.d
lt-print kaz-kum.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-kum.autobil.att
hfst-txt2fst -e ε < .deps/kaz-kum.autobil.att > .deps/kaz-kum.autobil.hfst
hfst-project -p upper .deps/kaz-kum.autobil.hfst > .deps/kaz-kum.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-kum.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-kum.autobil.prefixes
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-kum.autobil.prefixes -o .deps/kaz-kum.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<ltr>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-kum.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-kum.automorf.trimmed -o .deps/kaz-kum.automorf.trimmed.att
lt-comp lr .deps/kaz-kum.automorf.trimmed.att kaz-kum.automorf.bin
main@standard 38123 86166
final@inconditional 2616 7439
apertium-validate-dictionary ../../apertium-languages/apertium-kaz//apertium-kaz.post-kaz.dix
lt-comp lr ../../apertium-languages/apertium-kaz//apertium-kaz.post-kaz.dix kaz-kum.autopgen.bin
main@standard 10 149
cp ../../apertium-languages/apertium-kum//kum.autogen.bin kaz-kum.autogen.bin
apertium-validate-transfer apertium-kaz-kum.kaz-kum.t1x
apertium-preprocess-transfer apertium-kaz-kum.kaz-kum.t1x kaz-kum.t1x.bin
apertium-validate-transfer apertium-kaz-kum.kaz-kum.t2x
apertium-preprocess-transfer apertium-kaz-kum.kaz-kum.t2x kaz-kum.t2x.bin
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-kum.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
cg-comp ../../apertium-languages/apertium-kum//apertium-kum.kum.rlx kum-kaz.rlx.bin
Sections: 1, Rules: 6, Sets: 20, Tags: 32
lrx-comp apertium-kaz-kum.kaz-kum.lrx kaz-kum.lrx.bin
2: 36@40
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
cp *.mode modes/
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden
make: *** [Makefile:781: modes/kaz-kum.mode] Fehler 1
bible coverage kaz -> kum
Number of tokenised words in the corpus: 175579
Coverage: 56.36%
Top unknown words in the corpus:
1268 Иса
411 туралы
383 сендер
371 рухани
349 Себебі
339 арқылы
323 Мәсіх
309 Киелі
308 сендерге
284 Исаның
270 Иеміз
246 Мәсіхтің
238 Сондықтан
219 әрі
211 Ізгі
211 күні
196 сияқты
195 діни
194 біз
188 Алайда
Translation time: 3.2530195713043213 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-kum.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> kum
Error: Malformed input stream.Number of tokenised words in the corpus: 2675
Coverage: 48.64%
Top unknown words in the corpus:
11 км
10 бойынша
8 КСРО
8 оңт
7 негізгі
7 тайпалар
6 Қазақ
6 экономикалық
6 туралы
6 жылғы
6 желтоқсанда
6 басшылары
5 бөлігін
5 ның
5 феодалдық
5 Украина
5 солт
4 арқылы
4 оңтүстік
4 Елдің
Translation time: 0.08241939544677734 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-kum.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage kum -> kaz
[Errno 2] No such file or directory: 'kum-kaz.automorf.bin'
wikipedia coverage kum -> kaz
[Errno 2] No such file or directory: '../../apertium-languages/apertium-kum/wiki.destxt'
kaz sah
Bereits auf 'master'
M ap_include.am
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 176f11224e72a9789db879fe7e88ebaf93d124db
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-sah from ../../apertium-languages/apertium-sah/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-sah.automorf.bin kaz-sah.prob kaz-sah.rlx.bin kaz-sah.autobil.bin kaz-sah.autolex.bin kaz-sah.autogen.bin kaz-sah.autopgen.bin kaz-sah.t1x.bin kaz-sah.t2x.bin kaz-sah.t3x.bin kaz-sah.t4x.bin sah-kaz.automorf.bin sah-kaz.prob sah-kaz.rlx.bin sah-kaz.autobil.bin sah-kaz.autolex.bin sah-kaz.autogen.bin sah-kaz.autopgen.bin sah-kaz.t1x.bin sah-kaz.t2x.bin sah-kaz.t3x.bin" || rm -f kaz-sah.automorf.bin kaz-sah.prob kaz-sah.rlx.bin kaz-sah.autobil.bin kaz-sah.autolex.bin kaz-sah.autogen.bin kaz-sah.autopgen.bin kaz-sah.t1x.bin kaz-sah.t2x.bin kaz-sah.t3x.bin kaz-sah.t4x.bin sah-kaz.automorf.bin sah-kaz.prob sah-kaz.rlx.bin sah-kaz.autobil.bin sah-kaz.autolex.bin sah-kaz.autogen.bin sah-kaz.autopgen.bin sah-kaz.t1x.bin sah-kaz.t2x.bin sah-kaz.t3x.bin
rm -rf .deps modes
/bin/mkdir -p .deps
touch .deps/.d
/bin/zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
apertium-validate-dictionary apertium-kaz-sah.kaz-sah.dix
lt-comp lr apertium-kaz-sah.kaz-sah.dix kaz-sah.autobil.bin
main@standard 8508 11300
lt-print kaz-sah.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-sah.autobil.att
hfst-txt2fst -e ε < .deps/kaz-sah.autobil.att > .deps/kaz-sah.autobil.hfst
hfst-project -p upper .deps/kaz-sah.autobil.hfst > .deps/kaz-sah.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-sah.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-sah.autobil.prefixes
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-sah.autobil.prefixes -o .deps/kaz-sah.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<ltr>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-sah.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-sah.automorf.trimmed -o .deps/kaz-sah.automorf.trimmed.att
lt-comp lr .deps/kaz-sah.automorf.trimmed.att kaz-sah.automorf.bin
main@standard 86196 189326
final@inconditional 28 38
cp ../../apertium-languages/apertium-kaz//kaz.prob kaz-sah.prob
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-sah.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
lrx-comp apertium-kaz-sah.kaz-sah.lrx kaz-sah.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-sah//sah.autogen.bin kaz-sah.autogen.bin
cp ../../apertium-languages/apertium-sah//sah.autopgen.bin kaz-sah.autopgen.bin
apertium-validate-transfer apertium-kaz-sah.kaz-sah.t1x
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t1x kaz-sah.t1x.bin
apertium-validate-interchunk apertium-kaz-sah.kaz-sah.t2x
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t2x kaz-sah.t2x.bin
apertium-validate-postchunk apertium-kaz-sah.kaz-sah.t3x
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t3x kaz-sah.t3x.bin
apertium-validate-transfer apertium-kaz-sah.kaz-sah.t4x
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t4x kaz-sah.t4x.bin
/bin/zcat ../../apertium-languages/apertium-sah//sah.automorf.att.gz | hfst-txt2fst > .deps/sah.automorf.hfst
apertium-validate-dictionary apertium-kaz-sah.kaz-sah.dix
lt-comp rl apertium-kaz-sah.kaz-sah.dix sah-kaz.autobil.bin
main@standard 8502 11291
lt-print sah-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/sah-kaz.autobil.att
hfst-txt2fst -e ε < .deps/sah-kaz.autobil.att > .deps/sah-kaz.autobil.hfst
hfst-project -p upper .deps/sah-kaz.autobil.hfst > .deps/sah-kaz.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/sah-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/sah-kaz.autobil.prefixes
hfst-compose-intersect -1 .deps/sah.automorf.hfst -2 .deps/sah-kaz.autobil.prefixes -o .deps/sah-kaz.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<apos>") in
transducer in file .deps/sah.automorf.hfst which are not found on the
input tapes of transducers in file .deps/sah-kaz.autobil.prefixes.
hfst-fst2txt -i .deps/sah-kaz.automorf.trimmed -o .deps/sah-kaz.automorf.trimmed.att
lt-comp lr .deps/sah-kaz.automorf.trimmed.att sah-kaz.automorf.bin
main@standard 17257 40258
final@inconditional 549 1631
cp ../../apertium-languages/apertium-sah//sah.prob sah-kaz.prob
cg-comp ../../apertium-languages/apertium-sah//apertium-sah.sah.rlx sah-kaz.rlx.bin
Sections: 1, Rules: 2, Sets: 7, Tags: 17
1 rules cannot be skipped by index.
lrx-comp apertium-kaz-sah.sah-kaz.lrx sah-kaz.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin sah-kaz.autogen.bin
cp ../../apertium-languages/apertium-kaz//kaz.autopgen.bin sah-kaz.autopgen.bin
apertium-validate-transfer apertium-kaz-sah.sah-kaz.t1x
apertium-preprocess-transfer apertium-kaz-sah.sah-kaz.t1x sah-kaz.t1x.bin
apertium-validate-interchunk apertium-kaz-sah.sah-kaz.t2x
apertium-preprocess-transfer apertium-kaz-sah.sah-kaz.t2x sah-kaz.t2x.bin
apertium-validate-postchunk apertium-kaz-sah.sah-kaz.t3x
apertium-preprocess-transfer apertium-kaz-sah.sah-kaz.t3x sah-kaz.t3x.bin
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
lt-comp lr .deps/kaz.automorf.bin.att .deps/kaz.automorf.bin
main@standard 380438 893117
final@inconditional 2645 7326
lt-comp lr .deps/sah.automorf.bin.att .deps/sah.automorf.bin
main@standard 17256 40256
final@inconditional 543 1625
bible coverage kaz -> sah
Number of tokenised words in the corpus: 174579
Coverage: 67.93%
Top unknown words in the corpus:
1268 Иса
825 Құдайдың
762 Құдай
324 1
323 Мәсіх
306 2
298 Құдайға
284 3
284 Исаның
279 4
276 5
272 6
269 7
269 10
267 8
267 9
267 11
265 12
264 13
252 14
Translation time: 4.182401418685913 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-sah.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> sah
Error: Malformed input stream.Number of tokenised words in the corpus: 2675
Coverage: 71.93%
Top unknown words in the corpus:
11 1991
8 1
8 оңт
7 тайпалар
5 2
5 3
5 феодалдық
5 30
5 10
5 солт
4 шығысында
4 70
4 60
4 салдарынан
4 мыңдаған
3 ге
3 созылып
3 өкілдері
3 16
3 яғни
Translation time: 0.13700127601623535 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-sah.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage sah -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 1107
Coverage: 91.06%
Top unknown words in the corpus:
5 Апостоллар
3 Евангелие
2 Спасскай
2 миссионердар
2 Аланд
1 Annotation
1 НОВЫЙ
1 ЗАВЕТ
1 якутском
1 языке
1 in
1 c
1 эҕэрдэлиибин
1 Тэнгри
1 чочуобунаны
1 сүрэхтэнэр
1 бэргэһэлэнэр
1 Дежнев
1 Абакайааданы
1 бэргэһэлээбит
Translation time: 0.04111599922180176 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./sah-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage sah -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 3672
Coverage: 90.36%
Top unknown words in the corpus:
5 Орест
4 якутского
4 языка
3 Вейсенбург
2 Ромулус
2 киириитиэр
2 саарар
2 фон
2 монастырыгар
2 рукопись
2 этилэр
2 биллибитэ
2 К
2 Пеллерин
2 Кустуктуурап
2 буоланнар
2 Максимовы
2 Маҥаачыйа
2 Поликарпов
2 сорохторун
Translation time: 0.08243060111999512 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./sah-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kaz tat
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit ea9afd606afe03df1f9c7c6adc2affd0ef72500a
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-tat from ../../apertium-languages/apertium-tat/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-tat.autobil.bin tat-kaz.autobil.bin kaz-tat.automorf.bin kaz-tat.autopgen.bin kaz-tat.autogen.bin kaz-tat.t1x.bin kaz-tat.t2x.bin tat-kaz.automorf.bin tat-kaz.autopgen.bin tat-kaz.autogen.bin tat-kaz.t1x.bin tat-kaz.t2x.bin kaz-tat.rlx.bin tat-kaz.rlx.bin kaz-tat.lrx.bin tat-kaz.lrx.bin" || rm -f kaz-tat.autobil.bin tat-kaz.autobil.bin kaz-tat.automorf.bin kaz-tat.autopgen.bin kaz-tat.autogen.bin kaz-tat.t1x.bin kaz-tat.t2x.bin tat-kaz.automorf.bin tat-kaz.autopgen.bin tat-kaz.autogen.bin tat-kaz.t1x.bin tat-kaz.t2x.bin kaz-tat.rlx.bin tat-kaz.rlx.bin kaz-tat.lrx.bin tat-kaz.lrx.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kaz-tat.kaz-tat.dix
lt-comp lr apertium-kaz-tat.kaz-tat.dix kaz-tat.autobil.bin
main@standard 18888 36358
apertium-validate-dictionary apertium-kaz-tat.kaz-tat.dix
lt-comp rl apertium-kaz-tat.kaz-tat.dix tat-kaz.autobil.bin
main@standard 18854 36285
/bin/mkdir -p .deps
touch .deps/.d
lt-print kaz-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-tat.autobil.att
hfst-txt2fst -e ε < .deps/kaz-tat.autobil.att > .deps/kaz-tat.autobil.hfst
hfst-project -p upper .deps/kaz-tat.autobil.hfst > .deps/kaz-tat.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-tat.autobil.prefixes
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-tat.autobil.prefixes -o .deps/kaz-tat.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<percent>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-tat.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-tat.automorf.trimmed -o .deps/kaz-tat.automorf.trimmed.att
lt-comp lr .deps/kaz-tat.automorf.trimmed.att kaz-tat.automorf.bin
main@standard 210972 478879
final@inconditional 2596 7002
apertium-validate-dictionary apertium-kaz-tat.post-kaz.dix
lt-comp lr apertium-kaz-tat.post-kaz.dix kaz-tat.autopgen.bin
main@standard 10 149
cp ../../apertium-languages/apertium-tat//tat.autogen.bin kaz-tat.autogen.bin
apertium-validate-transfer apertium-kaz-tat.kaz-tat.t1x
apertium-preprocess-transfer apertium-kaz-tat.kaz-tat.t1x kaz-tat.t1x.bin
apertium-validate-transfer apertium-kaz-tat.kaz-tat.t2x
apertium-preprocess-transfer apertium-kaz-tat.kaz-tat.t2x kaz-tat.t2x.bin
lt-print tat-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-kaz.autobil.att
hfst-txt2fst -e ε < .deps/tat-kaz.autobil.att > .deps/tat-kaz.autobil.hfst
hfst-project -p upper .deps/tat-kaz.autobil.hfst > .deps/tat-kaz.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tat-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-kaz.autobil.prefixes
zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-kaz.autobil.prefixes -o .deps/tat-kaz.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<punct>") in
transducer in file .deps/tat.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tat-kaz.autobil.prefixes.
hfst-fst2txt -i .deps/tat-kaz.automorf.trimmed -o .deps/tat-kaz.automorf.trimmed.att
lt-comp lr .deps/tat-kaz.automorf.trimmed.att tat-kaz.automorf.bin
main@standard 97321 178518
final@inconditional 755 1606
apertium-validate-dictionary apertium-kaz-tat.post-tat.dix
lt-comp lr apertium-kaz-tat.post-tat.dix tat-kaz.autopgen.bin
main@standard 16 356
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin tat-kaz.autogen.bin
apertium-validate-transfer apertium-kaz-tat.tat-kaz.t1x
apertium-preprocess-transfer apertium-kaz-tat.tat-kaz.t1x tat-kaz.t1x.bin
apertium-validate-transfer apertium-kaz-tat.tat-kaz.t2x
apertium-preprocess-transfer apertium-kaz-tat.tat-kaz.t2x tat-kaz.t2x.bin
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-tat.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-kaz.rlx.bin
Sections: 11, Rules: 123, Sets: 154, Tags: 194
lrx-comp apertium-kaz-tat.kaz-tat.lrx kaz-tat.lrx.bin
43: 1009@1120
lrx-comp apertium-kaz-tat.tat-kaz.lrx tat-kaz.lrx.bin
3: 49@52
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
bible coverage kaz -> tat
Number of tokenised words in the corpus: 214397
Coverage: 95.03%
Top unknown words in the corpus:
66 яһудилер
65 парызшылдар
63 немесе
50 Пилат
49 Жохан
44 Аумин
43 Ирод
41 Яһудея
39 әзәзіл
36 яһудилердің
35 дүниелік
34 гөр
32 Ғалилея
31 уағыздап
29 екеуі
29 кейбіреулері
29 Саул
29 Қорынттықтарга
27 Лұқа
26 ұлылығын
Translation time: 7.922478675842285 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> tat
Error: Malformed input stream.Number of tokenised words in the corpus: 2937
Coverage: 92.17%
Top unknown words in the corpus:
5 ның
3 ге
3 одақтық
3 оңт
2 Қызылқұм
2 мыңжылдық
2 тайпалық
2 ғұндар
2 Оғыз
2 жоспарлық
2 өнеркәсіптік
2 Беловеж
2 ны
2 сессиясында
2 құрлығының
2 қоңыржай
2 респ
2 жоғ
2 өкілеттігі
2 мореналық
Translation time: 0.23727869987487793 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage tat -> kaz
Number of tokenised words in the corpus: 194164
Coverage: 93.57%
Top unknown words in the corpus:
190 Паул
159 Петер
112 яһүдләр
108 берсе
91 яһүд
90 канун
80 әллә
74 карата
73 бөек
66 Шимун
60 Пилат
57 каршында
55 Яһүд
52 явыз
52 фарисейләр
49 Һируд
49 һәммәсе
49 хачка
47 Аннары
47 канунчылар
Translation time: 5.087080955505371 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tat -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 26
Coverage: 65.38%
Top unknown words in the corpus:
1 Tatarça
1 İnternet
1 tulısınça
1 İnternetı
1 Respublikası
1 däwlät
1 tellärendä
1 tatar
1 häm
Translation time: 0.05028939247131348 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kaz tur
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 5939a3b8ca9a9331bc8eb1c9ec9e3824e0fa2aaa
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-tur from ../../apertium-languages/apertium-tur/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-tur.automorf.bin kaz-tur.prob kaz-tur.rlx.bin kaz-tur.autobil.bin kaz-tur.autolex.bin kaz-tur.autogen.bin kaz-tur.autopgen.bin kaz-tur.t1x.bin kaz-tur.t2x.bin kaz-tur.t3x.bin kaz-tur.t4x.bin tur-kaz.automorf.bin tur-kaz.prob tur-kaz.rlx.bin tur-kaz.autobil.bin tur-kaz.autolex.bin tur-kaz.autogen.bin tur-kaz.t1x.bin tur-kaz.t2x.bin tur-kaz.t3x.bin" || rm -f kaz-tur.automorf.bin kaz-tur.prob kaz-tur.rlx.bin kaz-tur.autobil.bin kaz-tur.autolex.bin kaz-tur.autogen.bin kaz-tur.autopgen.bin kaz-tur.t1x.bin kaz-tur.t2x.bin kaz-tur.t3x.bin kaz-tur.t4x.bin tur-kaz.automorf.bin tur-kaz.prob tur-kaz.rlx.bin tur-kaz.autobil.bin tur-kaz.autolex.bin tur-kaz.autogen.bin tur-kaz.t1x.bin tur-kaz.t2x.bin tur-kaz.t3x.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kaz-tur.kaz-tur.dix
lt-comp lr apertium-kaz-tur.kaz-tur.dix kaz-tur.autobil.bin
main@standard 20029 27244
/bin/mkdir -p .deps
touch .deps/.d
lt-print kaz-tur.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-tur.autobil.att
hfst-txt2fst -e ε < .deps/kaz-tur.autobil.att > .deps/kaz-tur.autobil.hfst
hfst-project -p upper .deps/kaz-tur.autobil.hfst > .deps/kaz-tur.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-tur.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-tur.autobil.prefixes
/bin/zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-tur.autobil.prefixes -o .deps/kaz-tur.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<ltr>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-tur.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-tur.automorf.trimmed -o .deps/kaz-tur.automorf.trimmed.att
lt-comp lr .deps/kaz-tur.automorf.trimmed.att kaz-tur.automorf.bin
main@standard 162122 359659
final@inconditional 41 68
cp ../../apertium-languages/apertium-kaz//kaz.prob kaz-tur.prob
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-tur.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
lrx-comp apertium-kaz-tur.kaz-tur.lrx kaz-tur.autolex.bin
95: 2190@2458
cp ../../apertium-languages/apertium-tur//tur.autogen.bin kaz-tur.autogen.bin
cp ../../apertium-languages/apertium-tur//tur.autopgen.bin kaz-tur.autopgen.bin
apertium-validate-transfer apertium-kaz-tur.kaz-tur.t1x
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t1x kaz-tur.t1x.bin
Warning (717): Paths to rule 5 blocked by rule 4.
Warning (958): Paths to rule 13 blocked by rule 12.
Warning (1602): Paths to rule 34 blocked by rule 33.
Warning (1710): Paths to rule 36 blocked by rule 35.
Warning (2020): Paths to rule 46 blocked by rule 45.
Warning (2080): Paths to rule 48 blocked by rule 47.
Warning (2839): Paths to rule 71 blocked by rule 70.
Warning (2839): Paths to rule 71 blocked by rule 70.
apertium-validate-interchunk apertium-kaz-tur.kaz-tur.t2x
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t2x kaz-tur.t2x.bin
apertium-validate-postchunk apertium-kaz-tur.kaz-tur.t3x
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t3x kaz-tur.t3x.bin
apertium-validate-transfer apertium-kaz-tur.kaz-tur.t4x
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t4x kaz-tur.t4x.bin
apertium-validate-dictionary apertium-kaz-tur.kaz-tur.dix
lt-comp rl apertium-kaz-tur.kaz-tur.dix tur-kaz.autobil.bin
main@standard 19995 27192
lt-print tur-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tur-kaz.autobil.att
hfst-txt2fst -e ε < .deps/tur-kaz.autobil.att > .deps/tur-kaz.autobil.hfst
hfst-project -p upper .deps/tur-kaz.autobil.hfst > .deps/tur-kaz.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tur-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tur-kaz.autobil.prefixes
/bin/zcat ../../apertium-languages/apertium-tur//tur.automorf.att.gz | hfst-txt2fst > .deps/tur.automorf.hfst
hfst-compose-intersect -1 .deps/tur.automorf.hfst -2 .deps/tur-kaz.autobil.prefixes -o .deps/tur-kaz.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<quot>") in
transducer in file .deps/tur.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tur-kaz.autobil.prefixes.
hfst-fst2txt -i .deps/tur-kaz.automorf.trimmed -o .deps/tur-kaz.automorf.trimmed.att
lt-comp lr .deps/tur-kaz.automorf.trimmed.att tur-kaz.automorf.bin
main@standard 12675 24541
final@inconditional 4052 7570
cp ../../apertium-languages/apertium-tur//tur.prob tur-kaz.prob
cg-comp ../../apertium-languages/apertium-tur//apertium-tur.tur.rlx tur-kaz.rlx.bin
Sections: 4, Rules: 102, Sets: 129, Tags: 127
2 rules cannot be skipped by index.
lrx-comp apertium-kaz-tur.tur-kaz.lrx tur-kaz.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin tur-kaz.autogen.bin
apertium-validate-transfer apertium-kaz-tur.tur-kaz.t1x
apertium-preprocess-transfer apertium-kaz-tur.tur-kaz.t1x tur-kaz.t1x.bin
apertium-validate-interchunk apertium-kaz-tur.tur-kaz.t2x
apertium-preprocess-transfer apertium-kaz-tur.tur-kaz.t2x tur-kaz.t2x.bin
apertium-validate-postchunk apertium-kaz-tur.tur-kaz.t3x
apertium-preprocess-transfer apertium-kaz-tur.tur-kaz.t3x tur-kaz.t3x.bin
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
bible coverage kaz -> tur
Number of tokenised words in the corpus: 214376
Coverage: 89.05%
Top unknown words in the corpus:
1268 Иса
323 Мәсіх
309 Киелі
284 Исаның
246 Мәсіхтің
211 Ізгі
175 Исаға
151 Исаны
150 Петір
136 Пауыл
129 Таурат
127 шынайы
106 күнәкар
103 Мәсіхке
89 киелі
88 яғни
83 Жақия
83 әркім
79 әділ
79 Мұса
Translation time: 7.062980890274048 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-tur.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> tur
Error: Malformed input stream.Number of tokenised words in the corpus: 2936
Coverage: 88.28%
Top unknown words in the corpus:
8 оңт
5 феодалдық
5 солт
4 мыңдаған
3 ге
3 Тянь
3 Шань
3 Еділ
3 яғни
3 VI
3 Социалистік
3 жж
3 одақтық
3 ядролық
3 м
3 континенттік
2 Қызылқұм
2 тайпалық
2 ғұндар
2 әкімшілік
Translation time: 0.20586729049682617 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-tur.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage tur -> kaz
Number of tokenised words in the corpus: 493813
Coverage: 82.25%
Top unknown words in the corpus:
1782 Tanrı
1686 Çünkü
1562 nın
1150 ın
1044 a
912 ki
832 Davut
620 üzerine
585 Yahuda
553 Ey
505 Yeruşalim
487 Egemen
448 Musa
409 na
390 la
377 Tanrısı
376 ı
362 i
355 Saul
340 dan
Translation time: 7.328187942504883 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tur-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tur -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 16959
Coverage: 77.57%
Top unknown words in the corpus:
141 ın
124 Temuçin
53 a
41 ı
40 i
40 nin
34 Camuka
34 nın
33 Jin
33 Tuğrul
29 Cuci
28 Kırım
27 soyundan
27 Harezmşah
24 üzerine
22 Cebe
22 Hanlığı
17 Mukhulai
17 Subutay
16 Yesügey
Translation time: 0.4011809825897217 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tur-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kaz tyv
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit ba80cf81d1ca88b2b35fb961f2d746f8f28e42a2
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-tyv from ../../apertium-languages/apertium-tyv/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-tyv.automorf.bin kaz-tyv.prob kaz-tyv.rlx.bin kaz-tyv.autobil.bin kaz-tyv.autolex.bin kaz-tyv.autogen.bin kaz-tyv.autopgen.bin kaz-tyv.t1x.bin kaz-tyv.t2x.bin kaz-tyv.t3x.bin kaz-tyv.t4x.bin tyv-kaz.automorf.bin tyv-kaz.prob tyv-kaz.rlx.bin tyv-kaz.autobil.bin tyv-kaz.autolex.bin tyv-kaz.autogen.bin tyv-kaz.autopgen.bin tyv-kaz.t1x.bin tyv-kaz.t2x.bin tyv-kaz.t3x.bin" || rm -f kaz-tyv.automorf.bin kaz-tyv.prob kaz-tyv.rlx.bin kaz-tyv.autobil.bin kaz-tyv.autolex.bin kaz-tyv.autogen.bin kaz-tyv.autopgen.bin kaz-tyv.t1x.bin kaz-tyv.t2x.bin kaz-tyv.t3x.bin kaz-tyv.t4x.bin tyv-kaz.automorf.bin tyv-kaz.prob tyv-kaz.rlx.bin tyv-kaz.autobil.bin tyv-kaz.autolex.bin tyv-kaz.autogen.bin tyv-kaz.autopgen.bin tyv-kaz.t1x.bin tyv-kaz.t2x.bin tyv-kaz.t3x.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kaz-tyv.kaz-tyv.dix
lt-comp lr apertium-kaz-tyv.kaz-tyv.dix kaz-tyv.autobil.bin
main@standard 465 671
/bin/mkdir -p .deps
touch .deps/.d
lt-print kaz-tyv.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-tyv.autobil.att
hfst-txt2fst -e ε < .deps/kaz-tyv.autobil.att > .deps/kaz-tyv.autobil.hfst
hfst-project -p upper .deps/kaz-tyv.autobil.hfst > .deps/kaz-tyv.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-tyv.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-tyv.autobil.prefixes
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-tyv.autobil.prefixes -o .deps/kaz-tyv.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<ltr>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-tyv.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-tyv.automorf.trimmed -o .deps/kaz-tyv.automorf.trimmed.att
lt-comp lr .deps/kaz-tyv.automorf.trimmed.att kaz-tyv.automorf.bin
main@standard 21219 48771
final@inconditional 2584 6986
cp ../../apertium-languages/apertium-kaz//kaz.prob kaz-tyv.prob
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-tyv.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
lrx-comp apertium-kaz-tyv.kaz-tyv.lrx kaz-tyv.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-tyv//tyv.autogen.bin kaz-tyv.autogen.bin
cp ../../apertium-languages/apertium-tyv//tyv.autopgen.bin kaz-tyv.autopgen.bin
apertium-validate-transfer apertium-kaz-tyv.kaz-tyv.t1x
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t1x kaz-tyv.t1x.bin
apertium-validate-interchunk apertium-kaz-tyv.kaz-tyv.t2x
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t2x kaz-tyv.t2x.bin
apertium-validate-postchunk apertium-kaz-tyv.kaz-tyv.t3x
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t3x kaz-tyv.t3x.bin
apertium-validate-transfer apertium-kaz-tyv.kaz-tyv.t4x
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t4x kaz-tyv.t4x.bin
apertium-validate-dictionary apertium-kaz-tyv.kaz-tyv.dix
lt-comp rl apertium-kaz-tyv.kaz-tyv.dix tyv-kaz.autobil.bin
main@standard 465 671
lt-print tyv-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tyv-kaz.autobil.att
hfst-txt2fst -e ε < .deps/tyv-kaz.autobil.att > .deps/tyv-kaz.autobil.hfst
hfst-project -p upper .deps/tyv-kaz.autobil.hfst > .deps/tyv-kaz.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tyv-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tyv-kaz.autobil.prefixes
zcat ../../apertium-languages/apertium-tyv//tyv.automorf.att.gz | hfst-txt2fst > .deps/tyv.automorf.hfst
hfst-compose-intersect -1 .deps/tyv.automorf.hfst -2 .deps/tyv-kaz.autobil.prefixes -o .deps/tyv-kaz.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<subst>") in
transducer in file .deps/tyv.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tyv-kaz.autobil.prefixes.
hfst-fst2txt -i .deps/tyv-kaz.automorf.trimmed -o .deps/tyv-kaz.automorf.trimmed.att
lt-comp lr .deps/tyv-kaz.automorf.trimmed.att tyv-kaz.automorf.bin
main@standard 1721 4129
final@inconditional 307 799
cp ../../apertium-languages/apertium-tyv//tyv.prob tyv-kaz.prob
cg-comp ../../apertium-languages/apertium-tyv//apertium-tyv.tyv.rlx tyv-kaz.rlx.bin
Sections: 2, Rules: 34, Sets: 60, Tags: 102
1 rules cannot be skipped by index.
lrx-comp apertium-kaz-tyv.tyv-kaz.lrx tyv-kaz.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin tyv-kaz.autogen.bin
cp ../../apertium-languages/apertium-kaz//kaz.autopgen.bin tyv-kaz.autopgen.bin
apertium-validate-transfer apertium-kaz-tyv.tyv-kaz.t1x
apertium-preprocess-transfer apertium-kaz-tyv.tyv-kaz.t1x tyv-kaz.t1x.bin
apertium-validate-interchunk apertium-kaz-tyv.tyv-kaz.t2x
apertium-preprocess-transfer apertium-kaz-tyv.tyv-kaz.t2x tyv-kaz.t2x.bin
apertium-validate-postchunk apertium-kaz-tyv.tyv-kaz.t3x
apertium-preprocess-transfer apertium-kaz-tyv.tyv-kaz.t3x tyv-kaz.t3x.bin
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
bible coverage kaz -> tyv
Number of tokenised words in the corpus: 217646
Coverage: 57.56%
Top unknown words in the corpus:
1268 Иса
825 Құдайдың
808 үшін
762 Құдай
434 Сонда
414 осы
411 туралы
383 сендер
371 рухани
351 өз
349 Себебі
339 арқылы
323 Мәсіх
309 Киелі
308 сендерге
298 Құдайға
284 Исаның
270 Иеміз
246 Мәсіхтің
240 қатты
Translation time: 2.413213014602661 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-tyv.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> tyv
Error: Malformed input stream.Number of tokenised words in the corpus: 2980
Coverage: 40.77%
Top unknown words in the corpus:
51 Қазақстан
11 км
10 бойынша
8 мемлекет
8 Қазақстанның
8 КСРО
8 Орта
8 оңт
7 ең
7 негізгі
7 өз
7 тайпалар
6 Республикасы
6 орналасқан
6 Қазақ
6 шығыс
6 экономикалық
6 туралы
6 ірі
6 республика
Translation time: 0.06718015670776367 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-tyv.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage tyv -> kaz
Number of tokenised words in the corpus: 227032
Coverage: 59.05%
Top unknown words in the corpus:
1547 даа
1179 Бурганның
1101 Иисус
703 мынча
678 бүгү
558 Бурган
545 силерге
543 Дээрги
532 Мен
501 силер
475 мен
447 дег
442 ла
430 чедип
423 Мээң
393 өске
373 дугайында
360 катап
321 ле
318 бис
Translation time: 1.5751702785491943 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tyv-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tyv -> kaz
Number of tokenised words in the corpus: 433
Coverage: 49.19%
Top unknown words in the corpus:
4 В
4 quot
4 Кезер
4 Даңгына
3 Азия
3 Хемниң
3 Ачыты
3 Мерген
3 бурят
2 Азияның
2 төвү
2 Азий
2 Төвү
2 Тываның
2 тураскаал
2 төвүнде
2 он
2 ла
2 илереткен
2 Куулар
Translation time: 0.008584737777709961 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tyv-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kaz uig
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 27242d1bc93089f2430d555817239e064530f2d1
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kaz from ../../apertium-languages/apertium-kaz/
Using apertium-uig from ../../apertium-languages/apertium-uig/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kaz-uig.autobil.bin uig-kaz.autobil.bin kaz-uig.automorf.bin kaz-uig.autopgen.bin kaz-uig.autogen.bin kaz-uig.t1x.bin kaz-uig.t2x.bin uig-kaz.automorf.bin uig-kaz.autopgen.bin uig-kaz.autogen.bin uig-kaz.t1x.bin uig-kaz.t2x.bin kaz-uig.rlx.bin uig-kaz.rlx.bin kaz-uig.lrx.bin uig-kaz.lrx.bin" || rm -f kaz-uig.autobil.bin uig-kaz.autobil.bin kaz-uig.automorf.bin kaz-uig.autopgen.bin kaz-uig.autogen.bin kaz-uig.t1x.bin kaz-uig.t2x.bin uig-kaz.automorf.bin uig-kaz.autopgen.bin uig-kaz.autogen.bin uig-kaz.t1x.bin uig-kaz.t2x.bin kaz-uig.rlx.bin uig-kaz.rlx.bin kaz-uig.lrx.bin uig-kaz.lrx.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kaz-uig.kaz-uig.dix
lt-comp lr apertium-kaz-uig.kaz-uig.dix kaz-uig.autobil.bin
main@standard 6798 9416
apertium-validate-dictionary apertium-kaz-uig.kaz-uig.dix
lt-comp rl apertium-kaz-uig.kaz-uig.dix uig-kaz.autobil.bin
main@standard 6786 9401
if [ ! -d .deps ]; then mkdir .deps; fi
touch .deps/.d
lt-print kaz-uig.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-uig.autobil.att
hfst-txt2fst -e ε < .deps/kaz-uig.autobil.att > .deps/kaz-uig.autobil.hfst
hfst-project -p upper .deps/kaz-uig.autobil.hfst > .deps/kaz-uig.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaz-uig.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-uig.autobil.prefixes
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-uig.autobil.prefixes -o .deps/kaz-uig.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<ltr>") in
transducer in file .deps/kaz.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaz-uig.autobil.prefixes.
hfst-fst2txt -i .deps/kaz-uig.automorf.trimmed -o .deps/kaz-uig.automorf.trimmed.att
lt-comp lr .deps/kaz-uig.automorf.trimmed.att kaz-uig.automorf.bin
main@standard 104981 233480
final@inconditional 2589 6991
apertium-validate-dictionary apertium-kaz-uig.post-kaz.dix
lt-comp lr apertium-kaz-uig.post-kaz.dix kaz-uig.autopgen.bin
main@standard 10 149
cp ../../apertium-languages/apertium-uig//uig.autogen.bin kaz-uig.autogen.bin
apertium-validate-transfer apertium-kaz-uig.kaz-uig.t1x
apertium-preprocess-transfer apertium-kaz-uig.kaz-uig.t1x kaz-uig.t1x.bin
apertium-validate-transfer apertium-kaz-uig.kaz-uig.t2x
apertium-preprocess-transfer apertium-kaz-uig.kaz-uig.t2x kaz-uig.t2x.bin
lt-print uig-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/uig-kaz.autobil.att
hfst-txt2fst -e ε < .deps/uig-kaz.autobil.att > .deps/uig-kaz.autobil.hfst
hfst-project -p upper .deps/uig-kaz.autobil.hfst > .deps/uig-kaz.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/uig-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/uig-kaz.autobil.prefixes
zcat ../../apertium-languages/apertium-uig//uig.automorf.att.gz | hfst-txt2fst > .deps/uig.automorf.hfst
hfst-compose-intersect -1 .deps/uig.automorf.hfst -2 .deps/uig-kaz.autobil.prefixes -o .deps/uig-kaz.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<barb>") in
transducer in file .deps/uig.automorf.hfst which are not found on the
input tapes of transducers in file .deps/uig-kaz.autobil.prefixes.
hfst-fst2txt -i .deps/uig-kaz.automorf.trimmed -o .deps/uig-kaz.automorf.trimmed.att
lt-comp lr .deps/uig-kaz.automorf.trimmed.att uig-kaz.automorf.bin
main@standard 7086 37292
final@inconditional 17 38
apertium-validate-dictionary apertium-kaz-uig.post-uig.dix
lt-comp lr apertium-kaz-uig.post-uig.dix uig-kaz.autopgen.bin
main@standard 9 114
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin uig-kaz.autogen.bin
apertium-validate-transfer apertium-kaz-uig.uig-kaz.t1x
apertium-preprocess-transfer apertium-kaz-uig.uig-kaz.t1x uig-kaz.t1x.bin
apertium-validate-transfer apertium-kaz-uig.uig-kaz.t2x
apertium-preprocess-transfer apertium-kaz-uig.uig-kaz.t2x uig-kaz.t2x.bin
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-uig.rlx.bin
Sections: 3, Rules: 150, Sets: 204, Tags: 234
1 rules cannot be skipped by index.
cg-comp ../../apertium-languages/apertium-uig//apertium-uig.uig.rlx uig-kaz.rlx.bin
Sections: 1, Rules: 55, Sets: 81, Tags: 147
lrx-comp apertium-kaz-uig.kaz-uig.lrx kaz-uig.lrx.bin
6: 99@109
lrx-comp apertium-kaz-uig.uig-kaz.lrx uig-kaz.lrx.bin
1: 19@19
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
cp *.mode modes/
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden
make: *** [Makefile:779: modes/kaz-uig.mode] Fehler 1
bible coverage kaz -> uig
Number of tokenised words in the corpus: 215836
Coverage: 79.13%
Top unknown words in the corpus:
1268 Иса
462 былай
434 Сонда
323 Мәсіх
284 Исаның
270 Иеміз
246 Мәсіхтің
238 Сондықтан
211 Ізгі
208 Содан
208 айтып
205 кезде
188 Алайда
181 етіп
175 Исаға
174 барып
166 жерде
151 Исаны
150 Петір
141 Сонымен
Translation time: 4.965975522994995 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-uig.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaz -> uig
Error: Malformed input stream.Number of tokenised words in the corpus: 2966
Coverage: 70.23%
Top unknown words in the corpus:
8 КСРО
8 оңт
7 тайпалар
7 жерінде
6 Республикасы
6 Қазақ
6 шығыс
6 жер
6 республика
6 желтоқсанда
6 басшылары
6 республиканың
5 ның
5 батыс
5 Украина
5 Республикасының
5 солт
4 шығысында
4 тау
4 Каспий
Translation time: 0.15818142890930176 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaz-uig.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage uig -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 692001
Coverage: 57.33%
Top unknown words in the corpus:
5391 ۋە
4124 بۇ
4115 ئۇ
3007 بىر
2610 مەن
2541 ئۇالر
2289 دەپ
2189 ئۈچۈن
2173 دېدى
2159 ئەيسا
2014 ھەزرىتى
1875 پەرۋەردىگار
1704 قىلىپ
1656 بولۇپ
1454 ئۆز
1379 چۈنكى
1377 سىلەر
1345 ئۇالرنىڭ
1297 بولغان
1296 قىلغان
Translation time: 4.557683944702148 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./uig-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage uig -> kaz
Error: Malformed input stream.Number of tokenised words in the corpus: 194
Coverage: 41.24%
Top unknown words in the corpus:
3 ئۇيغۇر
3 كومپۇتەر
2 ۋە
2 بولۇپ
2 بیزنیڭ
2 ئاز
2 كیشیلیریمیز
2 جۇڭخۇا
2 جۇمھۇرىيىتى
2 شەھىرى
1 ئۇيغۇرچە
1 ۋىكىپىدىيە
1 خەلقئارالىق
1 ئۇچۇر
1 بېتى
1 ۋىكىپېدىيەنىڭ
1 نۇسخاسىغا
1 خوش
1 كېلىپسىز
1 تاللانغان
Translation time: 0.015642166137695312 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./uig-kaz.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
kir uzb
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 0bd73de9fd7a7b50bfb4d95ec7c3837a7c25a164
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-kir from ../../apertium-languages/apertium-kir/
Using apertium-uzb from ../../apertium-languages/apertium-uzb/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "kir-uzb.autobil.bin uzb-kir.autobil.bin kir-uzb.automorf.bin kir-uzb.autopgen.bin kir-uzb.autogen.bin kir-uzb.t1x.bin kir-uzb.t2x.bin uzb-kir.automorf.bin uzb-kir.autopgen.bin uzb-kir.autogen.bin uzb-kir.t1x.bin uzb-kir.t2x.bin kir-uzb.rlx.bin uzb-kir.rlx.bin kir-uzb.autolex.bin uzb-kir.autolex.bin" || rm -f kir-uzb.autobil.bin uzb-kir.autobil.bin kir-uzb.automorf.bin kir-uzb.autopgen.bin kir-uzb.autogen.bin kir-uzb.t1x.bin kir-uzb.t2x.bin uzb-kir.automorf.bin uzb-kir.autopgen.bin uzb-kir.autogen.bin uzb-kir.t1x.bin uzb-kir.t2x.bin kir-uzb.rlx.bin uzb-kir.rlx.bin kir-uzb.autolex.bin uzb-kir.autolex.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-kir-uzb.kir-uzb.dix
lt-comp lr apertium-kir-uzb.kir-uzb.dix kir-uzb.autobil.bin
main@standard 838 1151
apertium-validate-dictionary apertium-kir-uzb.kir-uzb.dix
lt-comp rl apertium-kir-uzb.kir-uzb.dix uzb-kir.autobil.bin
main@standard 838 1151
if [ ! -d .deps ]; then mkdir .deps; fi
touch .deps/.d
lt-print kir-uzb.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kir-uzb.autobil.att
hfst-txt2fst -e ε < .deps/kir-uzb.autobil.att > .deps/kir-uzb.autobil.hfst
hfst-project -p upper .deps/kir-uzb.autobil.hfst > .deps/kir-uzb.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kir-uzb.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kir-uzb.autobil.prefixes
zcat ../../apertium-languages/apertium-kir//kir.automorf.att.gz | hfst-txt2fst > .deps/kir.automorf.hfst
hfst-compose-intersect -1 .deps/kir.automorf.hfst -2 .deps/kir-uzb.autobil.prefixes -o .deps/kir-uzb.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<quot>") in
transducer in file .deps/kir.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kir-uzb.autobil.prefixes.
hfst-fst2fst -O -i .deps/kir-uzb.automorf.trimmed -o kir-uzb.automorf.bin
hfst-fst2txt -i .deps/kir-uzb.automorf.trimmed -o .deps/kir-uzb.automorf.trimmed.att
lt-comp lr .deps/kir-uzb.automorf.trimmed.att kir-uzb.automorf.bin
main@standard 6684 15957
final@inconditional 827 2299
cp ../../apertium-languages/apertium-kir//kir.autopgen.bin kir-uzb.autopgen.bin
cp ../../apertium-languages/apertium-uzb//uzb.autogen.bin kir-uzb.autogen.bin
apertium-validate-transfer apertium-kir-uzb.kir-uzb.t1x
apertium-preprocess-transfer apertium-kir-uzb.kir-uzb.t1x kir-uzb.t1x.bin
apertium-validate-transfer apertium-kir-uzb.kir-uzb.t2x
apertium-preprocess-transfer apertium-kir-uzb.kir-uzb.t2x kir-uzb.t2x.bin
lt-print uzb-kir.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/uzb-kir.autobil.att
hfst-txt2fst -e ε < .deps/uzb-kir.autobil.att > .deps/uzb-kir.autobil.hfst
hfst-project -p upper .deps/uzb-kir.autobil.hfst > .deps/uzb-kir.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/uzb-kir.autobil.upper -2 .deps/any-symbol.hfst -o .deps/uzb-kir.autobil.prefixes
zcat ../../apertium-languages/apertium-uzb//uzb.automorf.att.gz | hfst-txt2fst > .deps/uzb.automorf.hfst
hfst-compose-intersect -1 .deps/uzb.automorf.hfst -2 .deps/uzb-kir.autobil.prefixes -o .deps/uzb-kir.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("{🂡}") in
transducer in file .deps/uzb.automorf.hfst which are not found on the
input tapes of transducers in file .deps/uzb-kir.autobil.prefixes.
hfst-fst2txt -i .deps/uzb-kir.automorf.trimmed -o .deps/uzb-kir.automorf.trimmed.att
lt-comp lr .deps/uzb-kir.automorf.trimmed.att uzb-kir.automorf.bin
main@standard 1109 1924
final@inconditional 21 94
apertium-validate-dictionary ../../apertium-languages/apertium-uzb//apertium-uzb.post-uzb.dix
lt-comp lr ../../apertium-languages/apertium-uzb//apertium-uzb.post-uzb.dix uzb-kir.autopgen.bin
main@standard 16 356
cp ../../apertium-languages/apertium-kir//kir.autogen.bin uzb-kir.autogen.bin
apertium-validate-transfer apertium-kir-uzb.uzb-kir.t1x
apertium-preprocess-transfer apertium-kir-uzb.uzb-kir.t1x uzb-kir.t1x.bin
apertium-validate-transfer apertium-kir-uzb.uzb-kir.t2x
apertium-preprocess-transfer apertium-kir-uzb.uzb-kir.t2x uzb-kir.t2x.bin
cg-comp ../../apertium-languages/apertium-kir//apertium-kir.kir.rlx kir-uzb.rlx.bin
Sections: 3, Rules: 71, Sets: 102, Tags: 126
cg-comp ../../apertium-languages/apertium-uzb//apertium-uzb.uzb.rlx uzb-kir.rlx.bin
Sections: 0, Rules: 62, Sets: 54, Tags: 104
lrx-comp apertium-kir-uzb.kir-uzb.lrx kir-uzb.autolex.bin
1: 19@19
lrx-comp apertium-kir-uzb.uzb-kir.lrx uzb-kir.autolex.bin
1: 19@19
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
cp *.mode modes/
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden
make: *** [Makefile:774: modes/kir-uzb.mode] Fehler 1
bible coverage kir -> uzb
Number of tokenised words in the corpus: 205768
Coverage: 64.63%
Top unknown words in the corpus:
1279 Ыйса
946 Кудай
597 Кудайдын
582 алып
380 Машаяк
362 Ыйсанын
325 өз
305 Кудайга
284 Ыйык
264 Анан
259 Эгебиз
246 баары
237 берди
229 ар
225 киши
208 Ыйсаны
204 Өз
189 керек
188 көп
187 эл
Translation time: 2.4062106609344482 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kir-uzb.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kir -> uzb
Error: Malformed input stream.Number of tokenised words in the corpus: 9480
Coverage: 44.46%
Top unknown words in the corpus:
51 Кыргыз
29 Кыргызстандын
29 Республикасынын
28 табигый
28 географиялык
27 География
25 кылымдын
24 ж
23 илимий
20 ар
20 жылы
19 жайгашкан
18 география
18 кыргыз
18 тоо
17 Географиялык
17 А
16 Кыргызстан
15 экономикалык
15 С
Translation time: 0.09597134590148926 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kir-uzb.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage uzb -> kir
Number of tokenised words in the corpus: 215561
Coverage: 51.41%
Top unknown words in the corpus:
3577 bo
3488 o
2129 ko
1423 Iso
1162 O
985 g
925 qo
854 so
755 yo
741 Xudo
735 to
715 z
553 Xudoning
450 lib
395 lgan
391 Masih
365 zi
352 har
345 lsa
333 shunday
Translation time: 0.743370771408081 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./uzb-kir.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage uzb -> kir
Error: Malformed input stream.Number of tokenised words in the corpus: 4189
Coverage: 41.27%
Top unknown words in the corpus:
32 X
27 Oʻzbekiston
22 av
21 Xorazm
15 qad
14 boʻlgan
14 mil
12 qalʼa
12 Mil
11 asr
11 yasalgan
10 boʻlib
10 xom
10 oʻlka
10 ning
10 shim
10 da
9 jan
9 madaniyati
8 qismi
Translation time: 0.02355480194091797 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./uzb-kir.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
nog kaz
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 64776015694b4e339eab1cf9b23ae9f4c6c9cb28
bible coverage nog -> kaz
[Errno 2] No such file or directory: 'nog-kaz.automorf.bin'
wikipedia coverage nog -> kaz
[Errno 2] No such file or directory: '../../apertium-languages/apertium-nog/wiki.destxt'
bible coverage kaz -> nog
[Errno 2] No such file or directory: 'kaz-nog.automorf.bin'
wikipedia coverage kaz -> nog
[Errno 2] No such file or directory: 'kaz-nog.automorf.bin'
tat bak
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 94b66d3c663e88ad5263734620780b2eeea80c16
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see:
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-tat from ../../apertium-languages/apertium-tat/
Using apertium-bak from ../../apertium-languages/apertium-bak/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "tat-bak.autobil.bin bak-tat.autobil.bin tat-bak.automorf.bin tat-bak.autopgen.bin tat-bak.autogen.bin tat-bak.t1x.bin tat-bak.t2x.bin bak-tat.automorf.bin bak-tat.autopgen.bin bak-tat.autogen.bin bak-tat.t1x.bin bak-tat.t2x.bin tat-bak.rlx.bin bak-tat.rlx.bin tat-bak.lrx.bin bak-tat.lrx.bin" || rm -f tat-bak.autobil.bin bak-tat.autobil.bin tat-bak.automorf.bin tat-bak.autopgen.bin tat-bak.autogen.bin tat-bak.t1x.bin tat-bak.t2x.bin bak-tat.automorf.bin bak-tat.autopgen.bin bak-tat.autogen.bin bak-tat.t1x.bin bak-tat.t2x.bin tat-bak.rlx.bin bak-tat.rlx.bin tat-bak.lrx.bin bak-tat.lrx.bin
rm -rf .deps modes
apertium-validate-dictionary apertium-tat-bak.tat-bak.dix
lt-comp lr apertium-tat-bak.tat-bak.dix tat-bak.autobil.bin
main@standard 71611 117353
apertium-validate-dictionary apertium-tat-bak.tat-bak.dix
lt-comp rl apertium-tat-bak.tat-bak.dix bak-tat.autobil.bin
main@standard 71609 117346
/bin/mkdir -p .deps
touch .deps/.d
lt-print tat-bak.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-bak.autobil.att
hfst-txt2fst -e ε < .deps/tat-bak.autobil.att > .deps/tat-bak.autobil.hfst
hfst-project -p upper .deps/tat-bak.autobil.hfst > .deps/tat-bak.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tat-bak.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-bak.autobil.prefixes
zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-bak.autobil.prefixes -o .deps/tat-bak.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<punct>") in
transducer in file .deps/tat.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tat-bak.autobil.prefixes.
hfst-fst2txt -i .deps/tat-bak.automorf.trimmed -o .deps/tat-bak.automorf.trimmed.att
lt-comp lr .deps/tat-bak.automorf.trimmed.att tat-bak.automorf.bin
main@standard 225878 445718
final@inconditional 38 64
apertium-validate-dictionary apertium-tat-bak.post-tat.dix
lt-comp lr apertium-tat-bak.post-tat.dix tat-bak.autopgen.bin
main@standard 16 356
cp ../../apertium-languages/apertium-bak//bak.autogen.bin tat-bak.autogen.bin
apertium-validate-transfer apertium-tat-bak.tat-bak.t1x
apertium-preprocess-transfer apertium-tat-bak.tat-bak.t1x tat-bak.t1x.bin
apertium-validate-transfer apertium-tat-bak.tat-bak.t2x
apertium-preprocess-transfer apertium-tat-bak.tat-bak.t2x tat-bak.t2x.bin
lt-print bak-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/bak-tat.autobil.att
hfst-txt2fst -e ε < .deps/bak-tat.autobil.att > .deps/bak-tat.autobil.hfst
hfst-project -p upper .deps/bak-tat.autobil.hfst > .deps/bak-tat.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/bak-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/bak-tat.autobil.prefixes
zcat ../../apertium-languages/apertium-bak//bak.automorf.att.gz | hfst-txt2fst > .deps/bak.automorf.hfst
hfst-compose-intersect -1 .deps/bak.automorf.hfst -2 .deps/bak-tat.autobil.prefixes -o .deps/bak-tat.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<punct>") in
transducer in file .deps/bak.automorf.hfst which are not found on the
input tapes of transducers in file .deps/bak-tat.autobil.prefixes.
hfst-fst2txt -i .deps/bak-tat.automorf.trimmed -o .deps/bak-tat.automorf.trimmed.att
lt-comp lr .deps/bak-tat.automorf.trimmed.att bak-tat.automorf.bin
main@standard 78313 141455
final@inconditional 15 35
apertium-validate-dictionary apertium-tat-bak.post-bak.dix
lt-comp lr apertium-tat-bak.post-bak.dix bak-tat.autopgen.bin
main@standard 10 149
cp ../../apertium-languages/apertium-tat//tat.autogen.bin bak-tat.autogen.bin
apertium-validate-transfer apertium-tat-bak.bak-tat.t1x
apertium-preprocess-transfer apertium-tat-bak.bak-tat.t1x bak-tat.t1x.bin
apertium-validate-transfer apertium-tat-bak.bak-tat.t2x
apertium-preprocess-transfer apertium-tat-bak.bak-tat.t2x bak-tat.t2x.bin
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-bak.rlx.bin
Sections: 11, Rules: 123, Sets: 154, Tags: 194
cg-comp ../../apertium-languages/apertium-bak//apertium-bak.bak.rlx bak-tat.rlx.bin
Sections: 1, Rules: 5, Sets: 25, Tags: 44
lrx-comp apertium-tat-bak.tat-bak.lrx tat-bak.lrx.bin
2: 34@36
lrx-comp apertium-tat-bak.bak-tat.lrx bak-tat.lrx.bin
2: 31@33
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
bible coverage tat -> bak
Number of tokenised words in the corpus: 196787
Coverage: 97.34%
Top unknown words in the corpus:
57 каршында
52 явыз
52 фарисейләр
49 Һируд
49 хачка
47 канунчылар
36 Имандашлар
33 савыктыра
33 Барнаб
30 кайберләре
29 Шаул
29 Corinthians
28 Matthew
28 дучар
28 беркайчан
28 John
28 Acts
27 имандаш
26 Гәлиләя
26 чумдырылу
Translation time: 6.27307653427124 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-bak.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tat -> bak
Error: Malformed input stream.Number of tokenised words in the corpus: 26
Coverage: 46.15%
Top unknown words in the corpus:
3 Tatnet
1 Tatarça
1 İnternet
1 tulısınça
1 Tatar
1 İnternetı
1 Tatarstan
1 Respublikası
1 däwlät
1 tellärendä
1 tatar
1 häm
Translation time: 0.12012624740600586 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-bak.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage bak -> tat
Number of tokenised words in the corpus: 197387
Coverage: 94.05%
Top unknown words in the corpus:
176 алдында
144 Һөйөнөслө
114 китте
94 имандаштар
75 үҙҙәре
71 шундай
63 алдына
58 ҡыуып
54 арҡысаҡҡа
53 киткән
52 фарисейҙар
51 бөтөнөһө
50 ҡисса
49 дусар
49 өҫтөнән
48 Ирод
48 береһенә
48 Имандаштар
46 Йәһүҙә
46 халҡы
Translation time: 4.23078179359436 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./bak-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage bak -> tat
Error: Malformed input stream.Number of tokenised words in the corpus: 474
Coverage: 96.20%
Top unknown words in the corpus:
4 власы
2 ө
2 н
1 ноябрендә
1 октябрендә
1 суверенитеты
1 февраленән
1 ТӨРКСОЙ
1 Халҡы
1 ын
1 тауҙарының
1 Ямантау
1 мәмерйәләре
Translation time: 0.06259441375732422 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./bak-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
tat kaa
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit e685b6d852eb648f87d89649c331bc75898cc1ce
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-tat from ../../apertium-languages/apertium-tat/
Using apertium-kaa from ../../apertium-languages/apertium-kaa/
checking that generated files are newer than configure... done
configure: creating ./config.status
config.status: creating Makefile
test -z "tat-kaa.automorf.bin tat-kaa.prob tat-kaa.rlx.bin tat-kaa.autobil.bin tat-kaa.autolex.bin tat-kaa.autogen.bin tat-kaa.autopgen.bin tat-kaa.t1x.bin tat-kaa.t2x.bin tat-kaa.t3x.bin kaa-tat.automorf.bin kaa-tat.rlx.bin kaa-tat.autobil.bin kaa-tat.autolex.bin kaa-tat.autogen.bin kaa-tat.autopgen.bin kaa-tat.t1x.bin kaa-tat.t2x.bin kaa-tat.t3x.bin" || rm -f tat-kaa.automorf.bin tat-kaa.prob tat-kaa.rlx.bin tat-kaa.autobil.bin tat-kaa.autolex.bin tat-kaa.autogen.bin tat-kaa.autopgen.bin tat-kaa.t1x.bin tat-kaa.t2x.bin tat-kaa.t3x.bin kaa-tat.automorf.bin kaa-tat.rlx.bin kaa-tat.autobil.bin kaa-tat.autolex.bin kaa-tat.autogen.bin kaa-tat.autopgen.bin kaa-tat.t1x.bin kaa-tat.t2x.bin kaa-tat.t3x.bin
rm -rf .deps modes
/bin/mkdir -p .deps
touch .deps/.d
/bin/zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst
apertium-validate-dictionary apertium-tat-kaa.tat-kaa.dix
lt-comp lr apertium-tat-kaa.tat-kaa.dix tat-kaa.autobil.bin
main@standard 9 17
lt-print tat-kaa.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-kaa.autobil.att
hfst-txt2fst -e ε < .deps/tat-kaa.autobil.att > .deps/tat-kaa.autobil.hfst
hfst-project -p upper .deps/tat-kaa.autobil.hfst > .deps/tat-kaa.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/tat-kaa.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-kaa.autobil.prefixes
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-kaa.autobil.prefixes -o .deps/tat-kaa.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<punct>") in
transducer in file .deps/tat.automorf.hfst which are not found on the
input tapes of transducers in file .deps/tat-kaa.autobil.prefixes.
hfst-fst2txt -i .deps/tat-kaa.automorf.trimmed -o .deps/tat-kaa.automorf.trimmed.att
lt-comp lr .deps/tat-kaa.automorf.trimmed.att tat-kaa.automorf.bin
main@standard 351 668
final@inconditional 8 12
cp ../../apertium-languages/apertium-tat//tat.prob tat-kaa.prob
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-kaa.rlx.bin
Sections: 11, Rules: 123, Sets: 154, Tags: 194
lrx-comp apertium-tat-kaa.tat-kaa.lrx tat-kaa.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-kaa//kaa.autogen.bin tat-kaa.autogen.bin
cp ../../apertium-languages/apertium-kaa//kaa.autopgen.bin tat-kaa.autopgen.bin
apertium-validate-transfer apertium-tat-kaa.tat-kaa.t1x
apertium-preprocess-transfer apertium-tat-kaa.tat-kaa.t1x tat-kaa.t1x.bin
apertium-validate-interchunk apertium-tat-kaa.tat-kaa.t2x
apertium-preprocess-transfer apertium-tat-kaa.tat-kaa.t2x tat-kaa.t2x.bin
apertium-validate-postchunk apertium-tat-kaa.tat-kaa.t3x
apertium-preprocess-transfer apertium-tat-kaa.tat-kaa.t3x tat-kaa.t3x.bin
/bin/zcat ../../apertium-languages/apertium-kaa//kaa.automorf.att.gz | hfst-txt2fst > .deps/kaa.automorf.hfst
apertium-validate-dictionary apertium-tat-kaa.tat-kaa.dix
lt-comp rl apertium-tat-kaa.tat-kaa.dix kaa-tat.autobil.bin
main@standard 9 17
lt-print kaa-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaa-tat.autobil.att
hfst-txt2fst -e ε < .deps/kaa-tat.autobil.att > .deps/kaa-tat.autobil.hfst
hfst-project -p upper .deps/kaa-tat.autobil.hfst > .deps/kaa-tat.autobil.upper
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst
hfst-concatenate -1 .deps/kaa-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaa-tat.autobil.prefixes
hfst-compose-intersect -1 .deps/kaa.automorf.hfst -2 .deps/kaa-tat.autobil.prefixes -o .deps/kaa-tat.automorf.trimmed
hfst-compose-intersect: warning:
Found output multi-char symbols ("<apos>") in
transducer in file .deps/kaa.automorf.hfst which are not found on the
input tapes of transducers in file .deps/kaa-tat.autobil.prefixes.
hfst-fst2txt -i .deps/kaa-tat.automorf.trimmed -o .deps/kaa-tat.automorf.trimmed.att
lt-comp lr .deps/kaa-tat.automorf.trimmed.att kaa-tat.automorf.bin
main@standard 183 359
final@inconditional 7 12
cg-comp ../../apertium-languages/apertium-kaa//apertium-kaa.kaa.rlx kaa-tat.rlx.bin
Sections: 1, Rules: 1, Sets: 5, Tags: 23
lrx-comp apertium-tat-kaa.kaa-tat.lrx kaa-tat.autolex.bin
1: 28@29
cp ../../apertium-languages/apertium-tat//tat.autogen.bin kaa-tat.autogen.bin
cp ../../apertium-languages/apertium-tat//tat.autopgen.bin kaa-tat.autopgen.bin
apertium-validate-transfer apertium-tat-kaa.kaa-tat.t1x
apertium-preprocess-transfer apertium-tat-kaa.kaa-tat.t1x kaa-tat.t1x.bin
apertium-validate-interchunk apertium-tat-kaa.kaa-tat.t2x
apertium-preprocess-transfer apertium-tat-kaa.kaa-tat.t2x kaa-tat.t2x.bin
apertium-validate-postchunk apertium-tat-kaa.kaa-tat.t3x
apertium-preprocess-transfer apertium-tat-kaa.kaa-tat.t3x kaa-tat.t3x.bin
apertium-validate-modes modes.xml
apertium-gen-modes modes.xml
lt-comp lr .deps/tat.automorf.bin.att .deps/tat.automorf.bin
main@standard 242055 497437
final@inconditional 805 1769
lt-comp lr .deps/kaa.automorf.bin.att .deps/kaa.automorf.bin
main@standard 22375 47983
final@inconditional 443 1599
bible coverage tat -> kaa
Number of tokenised words in the corpus: 178385
Coverage: 19.96%
Top unknown words in the corpus:
3525 һәм
1964 белән
1351 Гайсә
1335 дип
1279 өчен
1202 дә
1126 Аллаһы
1109 да
1044 Ул
711 Мин
710 ул
630 бер
622 Аның
607 алар
587 иде
551 сез
533 бу
516 диде
515 итеп
511 ә
Translation time: 0.3744645118713379 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-kaa.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage tat -> kaa
Error: Malformed input stream.Number of tokenised words in the corpus: 17
Coverage: 17.65%
Top unknown words in the corpus:
2 Tatnet
1 ^Tatnet
1 Tatarça
1 İnternet
1 tulısınça
1 Tatar
1 İnternetı
1 Tatarstan
1 Respublikası
1 däwlät
1 tellärendä
1 tatar
1 häm
Translation time: 0.0061550140380859375 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./tat-kaa.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
bible coverage kaa -> tat
Number of tokenised words in the corpus: 172711
Coverage: 16.31%
Top unknown words in the corpus:
2075 hám
1625 menen
1303 ushın
1223 İysa
1223 de
1134 O
1111 bir
1060 da
1038 dep
1032 dedi
876 edi
817 Qudaydıń
807 Ol
710 Biraq
645 Quday
629 adam
620 Men
563 bul
520 Muxaddes
515 etip
Translation time: 0.3134338855743408 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaa-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
wikipedia coverage kaa -> tat
Error: Malformed input stream.Number of tokenised words in the corpus: 3
Coverage: 33.33%
Top unknown words in the corpus:
1 ^Bas
1 bet
Translation time: 0.004499197006225586 seconds
Generating hitparade (might take a bit)!
Could not open transducer file ./kaa-tat.automorf.hfst
TOP UNKNOWN WORDS:
coverage: 0 / 0 (Error 10002)
remaining unknown forms: 0
tat kir
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 56e673ad16a30e2a0eb0015015455265b66a3560
bible coverage tat -> kir
[Errno 2] No such file or directory: 'tat-kir.automorf.bin'
wikipedia coverage tat -> kir
[Errno 2] No such file or directory: 'tat-kir.automorf.bin'
bible coverage kir -> tat
[Errno 2] No such file or directory: 'kir-tat.automorf.bin'
wikipedia coverage kir -> tat
[Errno 2] No such file or directory: 'kir-tat.automorf.bin'
tuk tur
Bereits auf 'master'
Ihr Branch ist auf demselben Stand wie 'origin/master'.
Bereits aktuell.
commit 9447fb2278ed49b2dd982d6a3871e0cc5c250bd1
checking for a BSD-compatible install... /usr/bin/install -c
checking whether build environment is sane... yes
checking for a thread-safe mkdir -p... /bin/mkdir -p
checking for gawk... gawk
checking whether make sets $(MAKE)... yes
checking whether make supports nested variables... yes
checking whether ln -s works... yes
checking for gawk... (cached) gawk
checking for pkg-config... /usr/bin/pkg-config
checking pkg-config is at least version 0.9.0... yes
checking for APERTIUM... yes
checking for hfst-lexc... /usr/bin/hfst-lexc
checking for hfst-twolc... /usr/bin/hfst-twolc
checking for cg-comp... /usr/bin/cg-comp
checking for cg-proc... /usr/bin/cg-proc
checking for lrx-comp... /usr/bin/lrx-comp
checking for lrx-proc... /usr/bin/lrx-proc
checking for gzcat... no
checking for zcat... /bin/zcat
Using apertium-tuk from ../../apertium-languages/apertium-tuk/
Using apertium-tur from ../../apertium-languages/apertium-tur/
checking that generated files are newer than configure... done
configure: creating ./config.status