This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#lang rash | |
;; ASSUME: - this script is placed into apertium-all/ | |
;; - hfst-covtest is in the PATH | |
;; USAGE: racket apertium-turkic-bilingual-stats.rkt > /tmp/bilingual 2>&1 | |
;; REQUIRES: racket | |
;; rash (install with "raco pkg install rash") | |
(provide MONOLINGUAL BILINGUAL) | |
;; MONOLINGUAL : immutable hash, ISO 639-3 symbol -> directory of the
;; monolingual package, relative to apertium-all/ and ending in "/".
(define MONOLINGUAL
  (make-immutable-hash
   '((alt . "apertium-incubator/apertium-alt/")
     (aze . "apertium-incubator/apertium-aze/")
     (bak . "apertium-languages/apertium-bak/")
     (chv . "apertium-languages/apertium-chv/")
     (crh . "apertium-languages/apertium-crh/")
     (gag . "apertium-languages/apertium-gag/")
     (kaa . "apertium-languages/apertium-kaa/")
     (kaz . "apertium-languages/apertium-kaz/")
     (kir . "apertium-languages/apertium-kir/")
     (kjh . "apertium-incubator/apertium-kjh/")
     (krc . "apertium-incubator/apertium-krc/")
     (kum . "apertium-languages/apertium-kum/")
     (nog . "apertium-languages/apertium-nog/")
     (ota . "apertium-incubator/apertium-ota/")
     (sah . "apertium-languages/apertium-sah/")
     (tat . "apertium-languages/apertium-tat/")
     (tuk . "apertium-languages/apertium-tuk/")
     (tur . "apertium-languages/apertium-tur/")
     (tyv . "apertium-languages/apertium-tyv/")
     (uig . "apertium-languages/apertium-uig/")
     (uzb . "apertium-languages/apertium-uzb/"))))
;; BILINGUAL : list of language-pair directories, relative to apertium-all/.
;; Every entry ends in "<lang1>-<lang2>/" with 3-letter codes; the main loop
;; slices the two codes out of that fixed-width tail. The pairs are processed
;; in the order given here.
(define BILINGUAL
  (list "apertium-incubator/apertium-chv-tat/"
        "apertium-incubator/apertium-chv-tur/"
        "apertium-trunk/apertium-crh-tur/"
        "apertium-incubator/apertium-kaz-kaa/"
        "apertium-nursery/apertium-kaz-kir/"
        "apertium-nursery/apertium-kaz-kum/"
        "apertium-incubator/apertium-kaz-sah/"
        "apertium-trunk/apertium-kaz-tat/"
        "apertium-incubator/apertium-kaz-tur/"
        "apertium-incubator/apertium-kaz-tyv/"
        "apertium-incubator/apertium-kaz-uig/"
        "apertium-incubator/apertium-kir-uzb/"
        "apertium-incubator/apertium-nog-kaz/"
        "apertium-nursery/apertium-tat-bak/"
        "apertium-incubator/apertium-tat-kaa/"
        "apertium-incubator/apertium-tat-kir/"
        "apertium-nursery/apertium-tuk-tur/"
        "apertium-nursery/apertium-tur-aze/"
        "apertium-nursery/apertium-tur-kir/"
        "apertium-nursery/apertium-tur-tat/"
        "apertium-nursery/apertium-tur-uzb/"
        "apertium-incubator/apertium-uig-tur/"
        "apertium-incubator/apertium-uzb-kaa/"))
;; report-failure : string -> (exn -> void)
;; Builds a handler for `with-handlers` that prints MESSAGE on a line of its
;; own and flushes stdout immediately. The flush matters because the script is
;; meant to be run with stdout redirected to a file (see USAGE): Racket then
;; block-buffers its own output, so without flushing the message would not
;; appear next to the output of the external command that failed.
(define (report-failure message)
  (λ (exn)
    (displayln message)
    (flush-output)))

;; For every language pair: enter the pair's directory, update it from git,
;; rebuild it against the two monolingual packages, and print coverage of the
;; pair's analysers over the bible and wikipedia corpora in both directions.
;; A failing step only prints a message; the remaining steps and the remaining
;; pairs still run.
(for ([p BILINGUAL])
  (parameterize ([current-directory p])
    ;; p ends in "<lang1>-<lang2>/"; cut the two 3-letter codes out of the tail.
    (define lang1 (substring p (- (string-length p) 8) (- (string-length p) 5)))
    (define lang2 (substring p (- (string-length p) 4) (- (string-length p) 1)))
    ;; MONOLINGUAL paths are relative to apertium-all/, which is two levels
    ;; above the pair directory we are now in.
    (define path1 (string-append "../../" (hash-ref MONOLINGUAL (string->symbol lang1))))
    (define path2 (string-append "../../" (hash-ref MONOLINGUAL (string->symbol lang2))))
    {echo $lang1 $lang2
     (with-handlers ([exn:fail? (report-failure "git failed")])
       {git checkout master
        git pull
        git log | head -n1})
     (with-handlers ([exn:fail? (report-failure "compilation failed")])
       {./autogen.sh --with-lang1=$path1 --with-lang2=$path2
        make clean
        make})
     echo
     echo bible coverage (values lang1) -> (values lang2)
     (with-handlers ([exn:fail? (report-failure "covtest failed")])
       {aq-covtest (string-append path1 "bible.destxt") (string-append lang1 "-" lang2 ".automorf.bin")
        hfst-covtest (string-append lang1 "-" lang2) . (string-append path1 "bible.destxt")})
     echo wikipedia coverage (values lang1) -> (values lang2)
     (with-handlers ([exn:fail? (report-failure "covtest failed")])
       {aq-covtest (string-append path1 "wiki.destxt") (string-append lang1 "-" lang2 ".automorf.bin")
        hfst-covtest (string-append lang1 "-" lang2) . (string-append path1 "wiki.destxt")})
     echo
     echo bible coverage (values lang2) -> (values lang1)
     (with-handlers ([exn:fail? (report-failure "covtest failed")])
       {aq-covtest (string-append path2 "bible.destxt") (string-append lang2 "-" lang1 ".automorf.bin")
        hfst-covtest (string-append lang2 "-" lang1) . (string-append path2 "bible.destxt")})
     echo wikipedia coverage (values lang2) -> (values lang1)
     (with-handlers ([exn:fail? (report-failure "covtest failed")])
       {aq-covtest (string-append path2 "wiki.destxt") (string-append lang2 "-" lang1 ".automorf.bin")
        hfst-covtest (string-append lang2 "-" lang1) . (string-append path2 "wiki.destxt")})
     printf "\n\n\n\n"}))
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env bash
## ASSUME: - this script is placed into apertium-all/
##         - hfst-covtest is in the PATH
## USAGE: bash apertium-turkic-monolingual-stats.bash > /tmp/monolingual-log 2>&1

## 3-letter language code => Wikipedia prefix, for packages that live in
## apertium-languages/. The value "false" marks a language for which no
## Wikipedia coverage is computed.
declare -A LANGS=(
  ["tat"]="tt"
  ["kaz"]="kk"
  ["kir"]="ky"
  ["crh"]="crh"
  ["tyv"]="tyv"
  ["bak"]="ba"
  ["chv"]="cv"
  ["uzb"]="uz"
  ["kaa"]="kaa"
  ["uig"]="ug"
  ["sah"]="sah"
  ["kum"]=false
  ["nog"]=false
  ["gag"]="gag"
  ["tuk"]="tk"
  ["tur"]="tr"
)

## Same mapping for packages that live in apertium-incubator/.
declare -A LANGSINCUBATOR=(
  ["krc"]="krc"
  ["alt"]=false
  ["kjh"]=false
  ["ota"]=false
  ["aze"]="az"
)

## Report file that all statistics are appended to.
OUT=/tmp/monolingual-turkicstats
## ["incubator" / "languages"] iso3 => stats
#######################################
# Update, rebuild and measure one monolingual package, appending the
# results to the report file.
# Globals:
#   OUT (read)            - report file every statistic is appended to
#   LANGS (read)          - iso3 => Wikipedia prefix, used for "languages"
#   LANGSINCUBATOR (read) - iso3 => Wikipedia prefix, used otherwise
# Arguments:
#   $1 - repository group, "languages" or "incubator"
#   $2 - 3-letter language code, e.g. "tat"
# Outputs:
#   Build output goes to stdout/stderr; statistics are appended to $OUT.
# Returns:
#   1 if the package directory cannot be entered (nothing is built and the
#   working directory is left untouched); otherwise the status of changing
#   back to the directory the function was called from.
#######################################
stats () {
  local group=$1
  local lang=$2
  local start_dir=$PWD
  local bible="../../../data4apertium/corpora/bible/${lang}.txt"
  local prefix

  printf '%s: ' "$lang" >> "$OUT"
  # Without this check a missing checkout would run git/autogen/make in the
  # caller's directory and the final cd would climb out of apertium-all/.
  if ! cd "apertium-${group}/apertium-${lang}"; then
    printf 'cannot enter apertium-%s/apertium-%s\n\n' "$group" "$lang" >> "$OUT"
    return 1
  fi
  pwd
  git checkout master
  git pull
  git log | head -n1 >> "$OUT"

  printf 'stems: ' >> "$OUT"
  # count stems: lexc lines matching ":<word chars> ... ;" that contain
  # neither "<" nor ">"
  grep -E ":\w+.*;" "apertium-${lang}.${lang}.lexc" | grep -vc "[<>]" >> "$OUT"

  ./autogen.sh
  make clean
  make

  ## bibles are in https://github.com/taruen/apertiumpp/tree/master/data4apertium/corpora/bible/
  printf 'bible coverage\n' >> "$OUT"
  apertium-destxt -n "$bible" > bible.destxt
  aq-covtest bible.destxt "${lang}.automorf.bin" >> "$OUT" 2>&1
  hfst-covtest "$lang" . "$bible" >> "$OUT" 2>&1
  printf 'bible corpus size (tokens): ' >> "$OUT"
  wc -w "$bible" >> "$OUT"

  # A language missing from the table is treated like one mapped to "false":
  # there is no known Wikipedia dump to measure against.
  if [[ "$group" == "languages" ]]; then
    prefix=${LANGS[$lang]:-false}
  else
    prefix=${LANGSINCUBATOR[$lang]:-false}
  fi

  if [[ "$prefix" != false ]]; then
    printf 'wikipedia coverage\n' >> "$OUT"
    # Extract the dump only once; an existing wiki.destxt is reused.
    if [[ ! -f "wiki.destxt" ]]; then
      python3 ~/local/bin/wikiextractor.py --infn "${prefix}wiki-20190901-pages-articles-multistream.xml.bz2"
      apertium-destxt -n wiki.txt > wiki.destxt
    fi
    aq-covtest wiki.destxt "${lang}.automorf.bin" >> "$OUT" 2>&1
    hfst-covtest "$lang" . wiki.txt >> "$OUT" 2>&1
    printf 'wikipedia corpus size (tokens): ' >> "$OUT"
    wc -w wiki.txt >> "$OUT"
  fi

  printf '\n' >> "$OUT"
  cd "$start_dir"
}
# Start from an empty report, then collect statistics for every package in
# apertium-languages/ followed by every package in apertium-incubator/.
: > "$OUT"

for code in "${!LANGS[@]}"; do
  stats "languages" "$code"
done

for code in "${!LANGSINCUBATOR[@]}"; do
  stats "incubator" "$code"
done
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
chv tat | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 232a3031b106a312fe41ad21fea95db5851f0cb4 | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-chv from ../../apertium-languages/apertium-chv/ | |
Using apertium-tat from ../../apertium-languages/apertium-tat/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "chv-tat.autobil.bin tat-chv.autobil.bin chv-tat.automorf.bin chv-tat.autopgen.bin chv-tat.autogen.bin chv-tat.t1x.bin chv-tat.t2x.bin tat-chv.automorf.bin tat-chv.autopgen.bin tat-chv.autogen.bin tat-chv.autogen.hfst tat-chv.t1x.bin tat-chv.t2x.bin chv-tat.rlx.bin tat-chv.rlx.bin chv-tat.lrx.bin tat-chv.lrx.bin" || rm -f chv-tat.autobil.bin tat-chv.autobil.bin chv-tat.automorf.bin chv-tat.autopgen.bin chv-tat.autogen.bin chv-tat.t1x.bin chv-tat.t2x.bin tat-chv.automorf.bin tat-chv.autopgen.bin tat-chv.autogen.bin tat-chv.autogen.hfst tat-chv.t1x.bin tat-chv.t2x.bin chv-tat.rlx.bin tat-chv.rlx.bin chv-tat.lrx.bin tat-chv.lrx.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-chv-tat.chv-tat.dix | |
lt-comp lr apertium-chv-tat.chv-tat.dix chv-tat.autobil.bin | |
main@standard 34104 59904 | |
apertium-validate-dictionary apertium-chv-tat.chv-tat.dix | |
lt-comp rl apertium-chv-tat.chv-tat.dix tat-chv.autobil.bin | |
main@standard 34106 59907 | |
if [ ! -d .deps ]; then mkdir .deps; fi | |
touch .deps/.d | |
lt-print chv-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/chv-tat.autobil.att | |
hfst-txt2fst -e ε < .deps/chv-tat.autobil.att > .deps/chv-tat.autobil.hfst | |
hfst-project -p upper .deps/chv-tat.autobil.hfst > .deps/chv-tat.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/chv-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/chv-tat.autobil.prefixes | |
zcat ../../apertium-languages/apertium-chv//chv.automorf.att.gz | hfst-txt2fst > .deps/chv.automorf.hfst | |
hfst-compose-intersect -1 .deps/chv.automorf.hfst -2 .deps/chv-tat.autobil.prefixes -o .deps/chv-tat.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<gen>") in | |
transducer in file .deps/chv.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/chv-tat.autobil.prefixes. | |
hfst-fst2txt -i .deps/chv-tat.automorf.trimmed -o .deps/chv-tat.automorf.trimmed.att | |
lt-comp lr .deps/chv-tat.automorf.trimmed.att chv-tat.automorf.bin | |
main@standard 31747 72044 | |
final@inconditional 22 45 | |
apertium-validate-dictionary ../../apertium-languages/apertium-chv//apertium-chv.post-chv.dix | |
lt-comp lr ../../apertium-languages/apertium-chv//apertium-chv.post-chv.dix chv-tat.autopgen.bin | |
main@standard 9 114 | |
cp ../../apertium-languages/apertium-tat//tat.autogen.bin chv-tat.autogen.bin | |
apertium-validate-transfer apertium-chv-tat.chv-tat.t1x | |
apertium-preprocess-transfer apertium-chv-tat.chv-tat.t1x chv-tat.t1x.bin | |
apertium-validate-transfer apertium-chv-tat.chv-tat.t2x | |
apertium-preprocess-transfer apertium-chv-tat.chv-tat.t2x chv-tat.t2x.bin | |
lt-print tat-chv.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-chv.autobil.att | |
hfst-txt2fst -e ε < .deps/tat-chv.autobil.att > .deps/tat-chv.autobil.hfst | |
hfst-project -p upper .deps/tat-chv.autobil.hfst > .deps/tat-chv.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tat-chv.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-chv.autobil.prefixes | |
zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst | |
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-chv.autobil.prefixes -o .deps/tat-chv.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<punct>") in | |
transducer in file .deps/tat.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tat-chv.autobil.prefixes. | |
hfst-fst2txt -i .deps/tat-chv.automorf.trimmed -o .deps/tat-chv.automorf.trimmed.att | |
lt-comp lr .deps/tat-chv.automorf.trimmed.att tat-chv.automorf.bin | |
main@standard 128750 237561 | |
final@inconditional 751 1598 | |
apertium-validate-dictionary ../../apertium-languages/apertium-tat//apertium-tat.post-tat.dix | |
lt-comp lr ../../apertium-languages/apertium-tat//apertium-tat.post-tat.dix tat-chv.autopgen.bin | |
main@standard 9 114 | |
cp ../../apertium-languages/apertium-chv//chv.autogen.bin tat-chv.autogen.bin | |
cp ../../apertium-languages/apertium-chv//chv.autogen.hfst tat-chv.autogen.hfst | |
apertium-validate-transfer apertium-chv-tat.tat-chv.t1x | |
apertium-preprocess-transfer apertium-chv-tat.tat-chv.t1x tat-chv.t1x.bin | |
apertium-validate-transfer apertium-chv-tat.tat-chv.t2x | |
apertium-preprocess-transfer apertium-chv-tat.tat-chv.t2x tat-chv.t2x.bin | |
cg-comp ../../apertium-languages/apertium-chv//apertium-chv.chv.rlx chv-tat.rlx.bin | |
Sections: 2, Rules: 6, Sets: 16, Tags: 41 | |
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-chv.rlx.bin | |
Sections: 11, Rules: 123, Sets: 154, Tags: 194 | |
lrx-comp apertium-chv-tat.chv-tat.lrx chv-tat.lrx.bin | |
1: 22@23 | |
lrx-comp apertium-chv-tat.tat-chv.lrx tat-chv.lrx.bin | |
10: 142@157 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
cp *.mode modes/ | |
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden | |
make: *** [Makefile:779: modes/chv-tat.mode] Fehler 1 | |
bible coverage chv -> tat | |
Number of tokenised words in the corpus: 196766 | |
Coverage: 86.62% | |
Top unknown words in the corpus: | |
1432 Иисус | |
462 Христос | |
379 чухне | |
272 Эй | |
248 Иисуса | |
236 пурте | |
162 нумай | |
136 Святой | |
125 Иоанн | |
123 Ҫавӑн | |
101 Акӑ | |
93 илтсен | |
92 никам | |
86 Моисей | |
86 пӗтӗмпех | |
80 нимӗн | |
78 иудейсем | |
77 ҫирӗплетсе | |
75 Израиль | |
75 кирек | |
Translation time: 2.321425199508667 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./chv-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage chv -> tat | |
Error: Malformed input stream.Number of tokenised words in the corpus: 693 | |
Coverage: 83.26% | |
Top unknown words in the corpus: | |
2 тĕрĕк | |
2 Хуть | |
2 тĕрлĕрен | |
2 идиомсем | |
2 Чăвашла | |
2 тĕпченин | |
2 чăвашла | |
2 Халь | |
2 каяп | |
2 вĕрентӳ | |
2 япон | |
1 пăлхар | |
1 пĕртен | |
1 Пăлхарăн | |
1 хазар | |
1 вирьял | |
1 мĕшĕнче | |
1 палăртаççĕ | |
1 нимпех | |
1 уйралса | |
Translation time: 0.0467984676361084 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./chv-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage tat -> chv | |
Number of tokenised words in the corpus: 196071 | |
Coverage: 86.16% | |
Top unknown words in the corpus: | |
1351 Гайсә | |
1126 Аллаһы | |
420 чөнки | |
403 Мәсих | |
390 Чөнки | |
380 кебек | |
372 иман | |
290 Раббы | |
288 Изге | |
283 Аллаһының | |
264 Аллаһыга | |
196 Гайсәнең | |
190 Паул | |
161 Гайсәне | |
159 Петер | |
137 аркылы | |
118 изге | |
113 Яхъя | |
112 яһүдләр | |
109 барысы | |
Translation time: 4.255837917327881 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-chv.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tat -> chv | |
Error: Malformed input stream.Number of tokenised words in the corpus: 26 | |
Coverage: 65.38% | |
Top unknown words in the corpus: | |
1 Tatarça | |
1 İnternet | |
1 tulısınça | |
1 İnternetı | |
1 Respublikası | |
1 däwlät | |
1 tellärendä | |
1 tatar | |
1 häm | |
Translation time: 0.06401181221008301 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-chv.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
chv tur | |
Bereits auf 'master' | |
M tur-chv.prob | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 32735fc46542d31cf619410c4d884701381b18e5 | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-chv from ../../apertium-languages/apertium-chv/ | |
Using apertium-tur from ../../apertium-languages/apertium-tur/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "chv-tur.automorf.bin chv-tur.prob chv-tur.rlx.bin chv-tur.autobil.bin chv-tur.autolex.bin chv-tur.autogen.bin chv-tur.autopgen.bin chv-tur.t1x.bin chv-tur.t2x.bin chv-tur.t3x.bin tur-chv.automorf.bin tur-chv.prob tur-chv.rlx.bin tur-chv.autobil.bin tur-chv.autolex.bin tur-chv.autogen.bin tur-chv.autopgen.bin tur-chv.t1x.bin tur-chv.t2x.bin tur-chv.t3x.bin tur-chv.t4x.bin" || rm -f chv-tur.automorf.bin chv-tur.prob chv-tur.rlx.bin chv-tur.autobil.bin chv-tur.autolex.bin chv-tur.autogen.bin chv-tur.autopgen.bin chv-tur.t1x.bin chv-tur.t2x.bin chv-tur.t3x.bin tur-chv.automorf.bin tur-chv.prob tur-chv.rlx.bin tur-chv.autobil.bin tur-chv.autolex.bin tur-chv.autogen.bin tur-chv.autopgen.bin tur-chv.t1x.bin tur-chv.t2x.bin tur-chv.t3x.bin tur-chv.t4x.bin | |
rm -rf .deps modes | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
/bin/zcat ../../apertium-languages/apertium-chv//chv.automorf.att.gz | hfst-txt2fst > .deps/chv.automorf.hfst | |
apertium-validate-dictionary apertium-chv-tur.chv-tur.dix | |
lt-comp lr apertium-chv-tur.chv-tur.dix chv-tur.autobil.bin | |
main@standard 308 462 | |
nocomprovat@standard 21662 31014 | |
notincrp@standard 90770 112482 | |
lt-print chv-tur.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/chv-tur.autobil.att | |
hfst-txt2fst -e ε < .deps/chv-tur.autobil.att > .deps/chv-tur.autobil.hfst | |
hfst-project -p upper .deps/chv-tur.autobil.hfst > .deps/chv-tur.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/chv-tur.autobil.upper -2 .deps/any-symbol.hfst -o .deps/chv-tur.autobil.prefixes | |
hfst-compose-intersect -1 .deps/chv.automorf.hfst -2 .deps/chv-tur.autobil.prefixes -o .deps/chv-tur.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<abbr>") in | |
transducer in file .deps/chv.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/chv-tur.autobil.prefixes. | |
hfst-fst2txt -i .deps/chv-tur.automorf.trimmed -o .deps/chv-tur.automorf.trimmed.att | |
lt-comp lr .deps/chv-tur.automorf.trimmed.att chv-tur.automorf.bin | |
main@standard 408 857 | |
final@inconditional 8 7 | |
cp ../../apertium-languages/apertium-chv//chv.prob chv-tur.prob | |
cg-comp ../../apertium-languages/apertium-chv//apertium-chv.chv.rlx chv-tur.rlx.bin | |
Sections: 2, Rules: 6, Sets: 16, Tags: 41 | |
lrx-comp apertium-chv-tur.chv-tur.lrx chv-tur.autolex.bin | |
4: 61@67 | |
cp ../../apertium-languages/apertium-tur//tur.autogen.bin chv-tur.autogen.bin | |
cp ../../apertium-languages/apertium-tur//tur.autopgen.bin chv-tur.autopgen.bin | |
apertium-validate-transfer apertium-chv-tur.chv-tur.t1x | |
apertium-preprocess-transfer apertium-chv-tur.chv-tur.t1x chv-tur.t1x.bin | |
apertium-validate-interchunk apertium-chv-tur.chv-tur.t2x | |
apertium-preprocess-transfer apertium-chv-tur.chv-tur.t2x chv-tur.t2x.bin | |
apertium-validate-postchunk apertium-chv-tur.chv-tur.t3x | |
apertium-preprocess-transfer apertium-chv-tur.chv-tur.t3x chv-tur.t3x.bin | |
/bin/zcat ../../apertium-languages/apertium-tur//tur.automorf.att.gz | hfst-txt2fst > .deps/tur.automorf.hfst | |
apertium-validate-dictionary apertium-chv-tur.chv-tur.dix | |
lt-comp rl apertium-chv-tur.chv-tur.dix tur-chv.autobil.bin | |
main@standard 308 462 | |
nocomprovat@standard 21662 31014 | |
notincrp@standard 90770 112482 | |
lt-print tur-chv.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tur-chv.autobil.att | |
hfst-txt2fst -e ε < .deps/tur-chv.autobil.att > .deps/tur-chv.autobil.hfst | |
hfst-project -p upper .deps/tur-chv.autobil.hfst > .deps/tur-chv.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tur-chv.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tur-chv.autobil.prefixes | |
hfst-compose-intersect -1 .deps/tur.automorf.hfst -2 .deps/tur-chv.autobil.prefixes -o .deps/tur-chv.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<quot>") in | |
transducer in file .deps/tur.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tur-chv.autobil.prefixes. | |
hfst-fst2txt -i .deps/tur-chv.automorf.trimmed -o .deps/tur-chv.automorf.trimmed.att | |
lt-comp lr .deps/tur-chv.automorf.trimmed.att tur-chv.automorf.bin | |
main@standard 308 308 | |
final@inconditional 168 167 | |
cp ../../apertium-languages/apertium-tur//tur.prob tur-chv.prob | |
cg-comp ../../apertium-languages/apertium-tur//apertium-tur.tur.rlx tur-chv.rlx.bin | |
Sections: 4, Rules: 102, Sets: 129, Tags: 127 | |
2 rules cannot be skipped by index. | |
lrx-comp apertium-chv-tur.tur-chv.lrx tur-chv.autolex.bin | |
22: 328@369 | |
cp ../../apertium-languages/apertium-chv//chv.autogen.bin tur-chv.autogen.bin | |
cp ../../apertium-languages/apertium-chv//chv.autopgen.bin tur-chv.autopgen.bin | |
apertium-validate-transfer apertium-chv-tur.tur-chv.t1x | |
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t1x tur-chv.t1x.bin | |
apertium-validate-interchunk apertium-chv-tur.tur-chv.t2x | |
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t2x tur-chv.t2x.bin | |
apertium-validate-postchunk apertium-chv-tur.tur-chv.t3x | |
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t3x tur-chv.t3x.bin | |
apertium-validate-transfer apertium-chv-tur.tur-chv.t4x | |
apertium-preprocess-transfer apertium-chv-tur.tur-chv.t4x tur-chv.t4x.bin | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
lt-comp lr .deps/chv.automorf.bin.att .deps/chv.automorf.bin | |
main@standard 55063 140662 | |
final@inconditional 105 261 | |
lt-comp lr .deps/tur.automorf.bin.att .deps/tur.automorf.bin | |
main@standard 25060 57093 | |
final@inconditional 635 2021 | |
bible coverage chv -> tur | |
Number of tokenised words in the corpus: 142124 | |
Coverage: 0.18% | |
Top unknown words in the corpus: | |
2912 те | |
2665 та | |
1489 Турӑ | |
1432 Иисус | |
1224 вара | |
929 Вӑл | |
869 тесе | |
778 ҫапла | |
742 каланӑ | |
740 Эпӗ | |
667 тата | |
666 вӗсем | |
661 ӑна | |
660 пӗр | |
648 тесен | |
645 сире | |
623 вӑл | |
617 мар | |
610 мӗн | |
590 тенӗ | |
Translation time: 0.3829376697540283 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./chv-tur.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage chv -> tur | |
Error: Malformed input stream.Number of tokenised words in the corpus: 537 | |
Coverage: 0.19% | |
Top unknown words in the corpus: | |
17 Чăваш | |
13 те | |
10 чĕлхи | |
8 тата | |
8 чăваш | |
6 чĕлхе | |
6 чĕлхипе | |
5 чĕлхине | |
5 çине | |
5 та | |
4 пĕр | |
4 ытти | |
4 пулать | |
4 хальхи | |
3 йышĕ | |
3 чĕлхин | |
3 пек | |
3 хушшинчи | |
3 усă | |
3 вара | |
Translation time: 0.00605320930480957 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./chv-tur.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage tur -> chv | |
Number of tokenised words in the corpus: 322696 | |
Coverage: 0.00% | |
Top unknown words in the corpus: | |
4764 ve | |
4035 bir | |
2738 için | |
2240 da | |
2098 de | |
1782 Tanrı | |
1686 Çünkü | |
1604 O | |
1562 nın | |
1505 İsrail | |
1460 gibi | |
1352 oğlu | |
1308 in | |
1238 ın | |
1236 bütün | |
1234 ya | |
1146 a | |
1124 bu | |
1115 dedi | |
1104 Ama | |
Translation time: 0.772911787033081 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tur-chv.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tur -> chv | |
Error: Malformed input stream.Number of tokenised words in the corpus: 14776 | |
Coverage: 0.01% | |
Top unknown words in the corpus: | |
404 ve | |
348 Han | |
331 Cengiz | |
293 bir | |
148 ın | |
145 ile | |
124 da | |
124 Temuçin | |
119 için | |
108 in | |
103 de | |
92 olan | |
91 olarak | |
85 bu | |
76 sonra | |
71 Çin | |
63 en | |
59 a | |
59 Bu | |
58 büyük | |
Translation time: 0.07053613662719727 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tur-chv.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
crh tur | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit a48867598137559646089ed83798c2d37fb0c3a1 | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-crh from ../../apertium-languages/apertium-crh/ | |
Using apertium-tur from ../../apertium-languages/apertium-tur/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "crh-tur.automorf.bin crh-tur.prob crh-tur.rlx.bin crh-tur.autobil.bin crh-tur.autolex.bin crh-tur.autogen.bin crh-tur.autopgen.bin crh-tur.t1x.bin crh-tur.t2x.bin crh-tur.t3x.bin crh-tur.t4x.bin tur-crh.automorf.bin tur-crh.prob tur-crh.rlx.bin tur-crh.autobil.bin tur-crh.autolex.bin tur-crh.autogen.bin tur-crh.autopgen.bin tur-crh.t1x.bin tur-crh.t2x.bin tur-crh.t4x.bin tur-crh.t3x.bin" || rm -f crh-tur.automorf.bin crh-tur.prob crh-tur.rlx.bin crh-tur.autobil.bin crh-tur.autolex.bin crh-tur.autogen.bin crh-tur.autopgen.bin crh-tur.t1x.bin crh-tur.t2x.bin crh-tur.t3x.bin crh-tur.t4x.bin tur-crh.automorf.bin tur-crh.prob tur-crh.rlx.bin tur-crh.autobil.bin tur-crh.autolex.bin tur-crh.autogen.bin tur-crh.autopgen.bin tur-crh.t1x.bin tur-crh.t2x.bin tur-crh.t4x.bin tur-crh.t3x.bin | |
rm -rf .deps modes | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
/bin/zcat ../../apertium-languages/apertium-crh//crh.automorf.att.gz | hfst-txt2fst > .deps/crh.automorf.hfst | |
apertium-validate-dictionary apertium-crh-tur.crh-tur.dix | |
lt-comp lr apertium-crh-tur.crh-tur.dix crh-tur.autobil.bin | |
main@standard 12695 19382 | |
lt-print crh-tur.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/crh-tur.autobil.att | |
hfst-txt2fst -e ε < .deps/crh-tur.autobil.att > .deps/crh-tur.autobil.hfst | |
hfst-project -p upper .deps/crh-tur.autobil.hfst > .deps/crh-tur.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/crh-tur.autobil.upper -2 .deps/any-symbol.hfst -o .deps/crh-tur.autobil.prefixes | |
hfst-compose-intersect -1 .deps/crh.automorf.hfst -2 .deps/crh-tur.autobil.prefixes -o .deps/crh-tur.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<apos>") in | |
transducer in file .deps/crh.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/crh-tur.autobil.prefixes. | |
hfst-fst2txt -i .deps/crh-tur.automorf.trimmed -o .deps/crh-tur.automorf.trimmed.att | |
lt-comp lr .deps/crh-tur.automorf.trimmed.att crh-tur.automorf.bin | |
main@standard 83327 232963 | |
final@inconditional 8152 14258 | |
cp ../../apertium-languages/apertium-crh//crh.prob crh-tur.prob | |
cg-comp ../../apertium-languages/apertium-crh//apertium-crh.crh.rlx crh-tur.rlx.bin | |
Sections: 3, Rules: 72, Sets: 92, Tags: 96 | |
2 rules cannot be skipped by index. | |
lrx-comp apertium-crh-tur.crh-tur.lrx crh-tur.autolex.bin | |
14: 298@335 | |
cp ../../apertium-languages/apertium-tur//tur.autogen.bin crh-tur.autogen.bin | |
cp ../../apertium-languages/apertium-tur//tur.autopgen.bin crh-tur.autopgen.bin | |
apertium-validate-transfer apertium-crh-tur.crh-tur.t1x | |
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t1x crh-tur.t1x.bin | |
apertium-validate-interchunk apertium-crh-tur.crh-tur.t2x | |
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t2x crh-tur.t2x.bin | |
apertium-validate-postchunk apertium-crh-tur.crh-tur.t3x | |
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t3x crh-tur.t3x.bin | |
apertium-validate-transfer apertium-crh-tur.crh-tur.t4x | |
apertium-preprocess-transfer apertium-crh-tur.crh-tur.t4x crh-tur.t4x.bin | |
/bin/zcat ../../apertium-languages/apertium-tur//tur.automorf.att.gz | hfst-txt2fst > .deps/tur.automorf.hfst | |
apertium-validate-dictionary apertium-crh-tur.crh-tur.dix | |
lt-comp rl apertium-crh-tur.crh-tur.dix tur-crh.autobil.bin | |
main@standard 12664 19312 | |
lt-print tur-crh.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tur-crh.autobil.att | |
hfst-txt2fst -e ε < .deps/tur-crh.autobil.att > .deps/tur-crh.autobil.hfst | |
hfst-project -p upper .deps/tur-crh.autobil.hfst > .deps/tur-crh.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tur-crh.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tur-crh.autobil.prefixes | |
hfst-compose-intersect -1 .deps/tur.automorf.hfst -2 .deps/tur-crh.autobil.prefixes -o .deps/tur-crh.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<apos>") in | |
transducer in file .deps/tur.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tur-crh.autobil.prefixes. | |
hfst-fst2txt -i .deps/tur-crh.automorf.trimmed -o .deps/tur-crh.automorf.trimmed.att | |
lt-comp lr .deps/tur-crh.automorf.trimmed.att tur-crh.automorf.bin | |
main@standard 14064 28608 | |
final@inconditional 2361 3820 | |
cp ../../apertium-languages/apertium-tur//tur.prob tur-crh.prob | |
cg-comp ../../apertium-languages/apertium-tur//apertium-tur.tur.rlx tur-crh.rlx.bin | |
Sections: 4, Rules: 102, Sets: 129, Tags: 127 | |
2 rules cannot be skipped by index. | |
lrx-comp apertium-crh-tur.tur-crh.lrx tur-crh.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-crh//crh.autogen.bin tur-crh.autogen.bin | |
cp ../../apertium-languages/apertium-crh//crh.autopgen.bin tur-crh.autopgen.bin | |
apertium-validate-transfer apertium-crh-tur.tur-crh.t1x | |
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t1x tur-crh.t1x.bin | |
apertium-validate-interchunk apertium-crh-tur.tur-crh.t2x | |
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t2x tur-crh.t2x.bin | |
apertium-validate-transfer apertium-crh-tur.tur-crh.t4x | |
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t4x tur-crh.t4x.bin | |
apertium-validate-postchunk apertium-crh-tur.tur-crh.t3x | |
apertium-preprocess-transfer apertium-crh-tur.tur-crh.t3x tur-crh.t3x.bin | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
lt-comp lr .deps/crh.automorf.bin.att .deps/crh.automorf.bin | |
main@standard 112233 320968 | |
final@inconditional 424 1452 | |
lt-comp lr .deps/tur.automorf.bin.att .deps/tur.automorf.bin | |
main@standard 25060 57093 | |
final@inconditional 635 2021 | |
bible coverage crh -> tur | |
Number of tokenised words in the corpus: 108974 | |
Coverage: 31.35% | |
Top unknown words in the corpus: | |
1566 ве | |
1022 Иса | |
910 бир | |
880 деди | |
729 ичюн | |
677 исе | |
624 эди | |
578 да | |
556 деп | |
505 Мен | |
501 бу | |
464 де | |
420 адам | |
352 оларгъа | |
339 не | |
336 Онынъ | |
319 Алланынъ | |
315 сонъ | |
296 Бу | |
285 оны | |
Translation time: 0.35404133796691895 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./crh-tur.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage crh -> tur | |
Number of tokenised words in the corpus: 4299 | |
Coverage: 88.95% | |
Top unknown words in the corpus: | |
12 Amdi | |
10 Abibulla | |
8 Odabaş | |
5 Giraybay | |
5 nemse | |
4 cenkâver | |
4 Ablây | |
4 افغانستان | |
4 Afġānistān | |
4 askeriy | |
3 ci | |
3 Abeşistan | |
3 Aluston | |
3 Prinsligi | |
2 ac | |
2 ae | |
2 af | |
2 ag | |
2 ai | |
2 am | |
Translation time: 0.17180109024047852 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./crh-tur.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage tur -> crh | |
Number of tokenised words in the corpus: 396976 | |
Coverage: 76.61% | |
Top unknown words in the corpus: | |
1782 Tanrı | |
1484 nın | |
1050 ın | |
921 a | |
832 Davut | |
671 dek | |
654 e | |
585 Yahuda | |
553 Ey | |
528 şöyle | |
505 Yeruşalim | |
487 Egemen | |
409 na | |
377 Tanrısı | |
375 la | |
359 i | |
355 Saul | |
347 ı | |
326 dan | |
318 ey | |
Translation time: 6.870069742202759 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tur-crh.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tur -> crh | |
Error: Malformed input stream.Number of tokenised words in the corpus: 16235 | |
Coverage: 77.76% | |
Top unknown words in the corpus: | |
136 ın | |
124 Temuçin | |
51 a | |
40 ı | |
40 nin | |
39 i | |
34 Camuka | |
34 nın | |
33 Jin | |
33 Tuğrul | |
29 e | |
29 Cuci | |
27 Harezmşah | |
22 Cebe | |
17 Mukhulai | |
17 Subutay | |
16 Yesügey | |
15 Çağatay | |
14 Börte | |
14 Alaeddin | |
Translation time: 0.3534669876098633 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tur-crh.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kaz kaa | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 0ef5cdf2fe24b25d9c459751cfa1290f6214913f | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-kaa from ../../apertium-languages/apertium-kaa/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-kaa.autobil.bin kaa-kaz.autobil.bin kaz-kaa.automorf.bin kaz-kaa.autopgen.bin kaz-kaa.autogen.bin kaz-kaa.t1x.bin kaz-kaa.t2x.bin kaa-kaz.automorf.bin kaa-kaz.autopgen.bin kaa-kaz.autogen.bin kaa-kaz.t1x.bin kaa-kaz.t2x.bin kaz-kaa.rlx.bin kaa-kaz.rlx.bin kaz-kaa.lrx.bin kaa-kaz.lrx.bin" || rm -f kaz-kaa.autobil.bin kaa-kaz.autobil.bin kaz-kaa.automorf.bin kaz-kaa.autopgen.bin kaz-kaa.autogen.bin kaz-kaa.t1x.bin kaz-kaa.t2x.bin kaa-kaz.automorf.bin kaa-kaz.autopgen.bin kaa-kaz.autogen.bin kaa-kaz.t1x.bin kaa-kaz.t2x.bin kaz-kaa.rlx.bin kaa-kaz.rlx.bin kaz-kaa.lrx.bin kaa-kaz.lrx.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kaz-kaa.kaz-kaa.dix | |
lt-comp lr apertium-kaz-kaa.kaz-kaa.dix kaz-kaa.autobil.bin | |
main@standard 10901 15943 | |
apertium-validate-dictionary apertium-kaz-kaa.kaz-kaa.dix | |
lt-comp rl apertium-kaz-kaa.kaz-kaa.dix kaa-kaz.autobil.bin | |
main@standard 10887 15926 | |
if [ ! -d .deps ]; then mkdir .deps; fi | |
touch .deps/.d | |
lt-print kaz-kaa.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-kaa.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-kaa.autobil.att > .deps/kaz-kaa.autobil.hfst | |
hfst-project -p upper .deps/kaz-kaa.autobil.hfst > .deps/kaz-kaa.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-kaa.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-kaa.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-kaa.autobil.prefixes -o .deps/kaz-kaa.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<ltr>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-kaa.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-kaa.automorf.trimmed -o .deps/kaz-kaa.automorf.trimmed.att | |
lt-comp lr .deps/kaz-kaa.automorf.trimmed.att kaz-kaa.automorf.bin | |
main@standard 181934 412306 | |
final@inconditional 2634 7472 | |
apertium-validate-dictionary apertium-kaz-kaa.post-kaz.dix | |
lt-comp lr apertium-kaz-kaa.post-kaz.dix kaz-kaa.autopgen.bin | |
main@standard 10 149 | |
cp ../../apertium-languages/apertium-kaa//kaa.autogen.bin kaz-kaa.autogen.bin | |
apertium-validate-transfer apertium-kaz-kaa.kaz-kaa.t1x | |
apertium-preprocess-transfer apertium-kaz-kaa.kaz-kaa.t1x kaz-kaa.t1x.bin | |
apertium-validate-transfer apertium-kaz-kaa.kaz-kaa.t2x | |
apertium-preprocess-transfer apertium-kaz-kaa.kaz-kaa.t2x kaz-kaa.t2x.bin | |
lt-print kaa-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaa-kaz.autobil.att | |
hfst-txt2fst -e ε < .deps/kaa-kaz.autobil.att > .deps/kaa-kaz.autobil.hfst | |
hfst-project -p upper .deps/kaa-kaz.autobil.hfst > .deps/kaa-kaz.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaa-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaa-kaz.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kaa//kaa.automorf.att.gz | hfst-txt2fst > .deps/kaa.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaa.automorf.hfst -2 .deps/kaa-kaz.autobil.prefixes -o .deps/kaa-kaz.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<subst>") in | |
transducer in file .deps/kaa.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaa-kaz.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaa-kaz.automorf.trimmed -o .deps/kaa-kaz.automorf.trimmed.att | |
lt-comp lr .deps/kaa-kaz.automorf.trimmed.att kaa-kaz.automorf.bin | |
main@standard 11323 20644 | |
final@inconditional 444 1655 | |
apertium-validate-dictionary apertium-kaz-kaa.post-kaa.dix | |
lt-comp lr apertium-kaz-kaa.post-kaa.dix kaa-kaz.autopgen.bin | |
main@standard 9 114 | |
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin kaa-kaz.autogen.bin | |
apertium-validate-transfer apertium-kaz-kaa.kaa-kaz.t1x | |
apertium-preprocess-transfer apertium-kaz-kaa.kaa-kaz.t1x kaa-kaz.t1x.bin | |
apertium-validate-transfer apertium-kaz-kaa.kaa-kaz.t2x | |
apertium-preprocess-transfer apertium-kaz-kaa.kaa-kaz.t2x kaa-kaz.t2x.bin | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-kaa.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
cg-comp ../../apertium-languages/apertium-kaa//apertium-kaa.kaa.rlx kaa-kaz.rlx.bin | |
Sections: 1, Rules: 1, Sets: 5, Tags: 23 | |
lrx-comp apertium-kaz-kaa.kaz-kaa.lrx kaz-kaa.lrx.bin | |
6: 99@109 | |
lrx-comp apertium-kaz-kaa.kaa-kaz.lrx kaa-kaz.lrx.bin | |
1: 19@19 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
cp *.mode modes/ | |
bible coverage kaz -> kaa | |
Number of tokenised words in the corpus: 214563 | |
Coverage: 92.41% | |
Top unknown words in the corpus: | |
1268 Иса | |
323 Мәсіх | |
284 Исаның | |
246 Мәсіхтің | |
211 Ізгі | |
175 Исаға | |
151 Исаны | |
150 Петір | |
136 Пауыл | |
129 Таурат | |
103 Мәсіхке | |
83 Жақия | |
79 Мұса | |
68 Ыбырайым | |
66 яһудилер | |
65 парызшылдар | |
64 Шимон | |
63 немесе | |
62 Иерусалимге | |
59 Мәсіхпен | |
Translation time: 6.704168081283569 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-kaa.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> kaa | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2952 | |
Coverage: 88.52% | |
Top unknown words in the corpus: | |
8 оңт | |
5 ның | |
5 Украина | |
5 солт | |
4 Каспий | |
3 Алтай | |
3 Сібір | |
3 Тянь | |
3 Шань | |
3 Еділ | |
3 одақтық | |
3 м | |
2 Қызылқұм | |
2 Сібірдің | |
2 мыңжылдық | |
2 тайпалық | |
2 ғұндар | |
2 аумағындағы | |
2 Оғыз | |
2 жоспарлық | |
Translation time: 0.2152414321899414 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-kaa.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage kaa -> kaz | |
Number of tokenised words in the corpus: 188496 | |
Coverage: 88.24% | |
Top unknown words in the corpus: | |
1223 İysa | |
520 Muxaddes | |
408 ytkeni | |
353 Masix | |
346 A | |
294 İysanıń | |
214 z | |
212 hámme | |
183 Masixtıń | |
172 hámmesi | |
172 ǵo | |
168 İysaǵa | |
161 Petr | |
153 İysanı | |
148 Pavel | |
142 atırǵan | |
139 zi | |
112 qalay | |
108 Háy | |
106 muxaddes | |
Translation time: 2.959629535675049 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaa-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaa -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 4 | |
Coverage: 100.00% | |
Top unknown words in the corpus: | |
Translation time: 0.010514259338378906 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaa-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kaz kir | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 34dd3475c6103f173f6f4b443155486a7231b0b7 | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-kir from ../../apertium-languages/apertium-kir/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-kir.autobil.bin kir-kaz.autobil.bin kaz-kir.automorf.bin kaz-kir.autopgen.bin kaz-kir.autogen.bin kaz-kir.t1x.bin kaz-kir.t2x.bin kir-kaz.automorf.bin kir-kaz.autopgen.bin kir-kaz.autogen.bin kir-kaz.t1x.bin kir-kaz.t2x.bin kaz-kir.rlx.bin kir-kaz.rlx.bin kaz-kir.autolex.bin kir-kaz.autolex.bin kaz-kir.autoseq.bin kir-kaz.autoseq.bin kaz-kir.revautoseq.bin kir-kaz.revautoseq.bin" || rm -f kaz-kir.autobil.bin kir-kaz.autobil.bin kaz-kir.automorf.bin kaz-kir.autopgen.bin kaz-kir.autogen.bin kaz-kir.t1x.bin kaz-kir.t2x.bin kir-kaz.automorf.bin kir-kaz.autopgen.bin kir-kaz.autogen.bin kir-kaz.t1x.bin kir-kaz.t2x.bin kaz-kir.rlx.bin kir-kaz.rlx.bin kaz-kir.autolex.bin kir-kaz.autolex.bin kaz-kir.autoseq.bin kir-kaz.autoseq.bin kaz-kir.revautoseq.bin kir-kaz.revautoseq.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kaz-kir.kaz-kir.dix | |
lt-comp lr apertium-kaz-kir.kaz-kir.dix kaz-kir.autobil.bin | |
main@standard 13606 31838 | |
apertium-validate-dictionary apertium-kaz-kir.kaz-kir.dix | |
lt-comp rl apertium-kaz-kir.kaz-kir.dix kir-kaz.autobil.bin | |
main@standard 13574 31782 | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
lt-print kaz-kir.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-kir.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-kir.autobil.att > .deps/kaz-kir.autobil.hfst | |
hfst-project -p upper .deps/kaz-kir.autobil.hfst > .deps/kaz-kir.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-kir.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-kir.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-kir.autobil.prefixes -o .deps/kaz-kir.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<ltr>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-kir.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-kir.automorf.trimmed -o .deps/kaz-kir.automorf.trimmed.att | |
lt-comp lr .deps/kaz-kir.automorf.trimmed.att kaz-kir.automorf.bin | |
main@standard 167998 377602 | |
final@inconditional 41 67 | |
apertium-validate-dictionary apertium-kaz-kir.post-kaz.dix | |
lt-comp lr apertium-kaz-kir.post-kaz.dix kaz-kir.autopgen.bin | |
main@standard 10 149 | |
cp ../../apertium-languages/apertium-kir//kir.autogen.bin kaz-kir.autogen.bin | |
apertium-validate-transfer apertium-kaz-kir.kaz-kir.t1x | |
apertium-preprocess-transfer apertium-kaz-kir.kaz-kir.t1x kaz-kir.t1x.bin | |
apertium-validate-transfer apertium-kaz-kir.kaz-kir.t2x | |
apertium-preprocess-transfer apertium-kaz-kir.kaz-kir.t2x kaz-kir.t2x.bin | |
lt-print kir-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kir-kaz.autobil.att | |
hfst-txt2fst -e ε < .deps/kir-kaz.autobil.att > .deps/kir-kaz.autobil.hfst | |
hfst-project -p upper .deps/kir-kaz.autobil.hfst > .deps/kir-kaz.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kir-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kir-kaz.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kir//kir.automorf.att.gz | hfst-txt2fst > .deps/kir.automorf.hfst | |
hfst-compose-intersect -1 .deps/kir.automorf.hfst -2 .deps/kir-kaz.autobil.prefixes -o .deps/kir-kaz.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<percent>") in | |
transducer in file .deps/kir.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kir-kaz.autobil.prefixes. | |
hfst-fst2fst -O .deps/kir-kaz.automorf.trimmed -o kir-kaz.automorf.bin | |
hfst-fst2txt -i .deps/kir-kaz.automorf.trimmed -o .deps/kir-kaz.automorf.trimmed.att | |
lt-comp lr .deps/kir-kaz.automorf.trimmed.att kir-kaz.automorf.bin | |
main@standard 22176 46844 | |
final@inconditional 16 34 | |
apertium-validate-dictionary apertium-kaz-kir.post-kir.dix | |
lt-comp lr apertium-kaz-kir.post-kir.dix kir-kaz.autopgen.bin | |
main@standard 16 356 | |
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin kir-kaz.autogen.bin | |
apertium-validate-transfer apertium-kaz-kir.kir-kaz.t1x | |
apertium-preprocess-transfer apertium-kaz-kir.kir-kaz.t1x kir-kaz.t1x.bin | |
apertium-validate-transfer apertium-kaz-kir.kir-kaz.t2x | |
apertium-preprocess-transfer apertium-kaz-kir.kir-kaz.t2x kir-kaz.t2x.bin | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-kir.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
cg-comp ../../apertium-languages/apertium-kir//apertium-kir.kir.rlx kir-kaz.rlx.bin | |
Sections: 3, Rules: 71, Sets: 102, Tags: 126 | |
lrx-comp apertium-kaz-kir.kaz-kir.lrx kaz-kir.autolex.bin | |
58: 963@1073 | |
lrx-comp apertium-kaz-kir.kir-kaz.lrx kir-kaz.autolex.bin | |
2: 25@26 | |
lsx-comp lr apertium-kaz-kir.kaz-kir.lsx kaz-kir.autoseq.bin | |
main@standard 47 50 | |
lsx-comp lr apertium-kaz-kir.kir-kaz.lsx kir-kaz.autoseq.bin | |
main@standard 97 108 | |
lsx-comp rl apertium-kaz-kir.kaz-kir.lsx kaz-kir.revautoseq.bin | |
main@standard 47 50 | |
lsx-comp rl apertium-kaz-kir.kir-kaz.lsx kir-kaz.revautoseq.bin | |
main@standard 97 108 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
apertium-createmodes.awk: modes/kaz-kir-autoseq.mode seen twice | |
apertium-createmodes.awk: modes/@kaz-kir-autoseq.mode seen twice | |
apertium-createmodes.awk: modes/kir-kaz-autoseq.mode seen twice | |
apertium-createmodes.awk: modes/@kir-kaz-autoseq.mode seen twice | |
bible coverage kaz -> kir | |
Number of tokenised words in the corpus: 214330 | |
Coverage: 92.64% | |
Top unknown words in the corpus: | |
66 яһудилер | |
65 парызшылдар | |
63 немесе | |
53 сиынып | |
50 сеніп | |
50 Пилат | |
49 өтінді | |
49 Жохан | |
48 бетер | |
44 Аумин | |
43 Ирод | |
43 ертіп | |
41 Яһудея | |
39 әзәзіл | |
36 яһудилердің | |
35 адалдығын | |
35 дүниелік | |
34 Матай | |
34 гөр | |
32 Ғалилея | |
Translation time: 6.111989498138428 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-kir.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> kir | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2937 | |
Coverage: 90.19% | |
Top unknown words in the corpus: | |
5 ның | |
3 ге | |
3 одақтық | |
3 қалыптасқан | |
3 оңт | |
2 Қызылқұм | |
2 мыңжылдық | |
2 тайпалық | |
2 ғұндар | |
2 ғ | |
2 Оғыз | |
2 жоспарлық | |
2 өнеркәсіптік | |
2 өндірушісі | |
2 Беловеж | |
2 ны | |
2 сессиясында | |
2 құрлығының | |
2 с | |
2 қоңыржай | |
Translation time: 0.20651888847351074 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-kir.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage kir -> kaz | |
Number of tokenised words in the corpus: 203725 | |
Coverage: 89.17% | |
Top unknown words in the corpus: | |
1279 Ыйса | |
946 Кудай | |
597 Кудайдын | |
380 Машаяк | |
362 Ыйсанын | |
305 Кудайга | |
208 Ыйсаны | |
184 Ыйсага | |
174 Машаяктын | |
163 Пабыл | |
94 Кудайды | |
92 улам | |
90 Кудайдан | |
83 Жакыя | |
68 таалим | |
66 иудей | |
65 динкызматчылар | |
64 Машаякка | |
63 Пабылдын | |
62 фарисейлер | |
Translation time: 5.053615570068359 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kir-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kir -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 9337 | |
Coverage: 85.91% | |
Top unknown words in the corpus: | |
15 С | |
10 К | |
10 көл | |
10 Көлдүн | |
8 б | |
8 Б | |
7 комплекстик | |
7 Н | |
7 Көл | |
6 дээрлик | |
6 закон | |
6 СССРдин | |
6 ИАнын | |
6 Борбордук | |
6 Кыргызжер | |
6 Сулайман | |
5 П | |
5 В | |
5 ландшафт | |
5 ээлеген | |
Translation time: 0.25955748558044434 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kir-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kaz kum | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 061a225d1c6d235e04fd492f6064fa7616409281 | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-kum from ../../apertium-languages/apertium-kum/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-kum.autobil.bin kum-kaz.autobil.bin kaz-kum.automorf.bin kaz-kum.autopgen.bin kaz-kum.autogen.bin kaz-kum.t1x.bin kaz-kum.t2x.bin kaz-kum.rlx.bin kum-kaz.rlx.bin kaz-kum.lrx.bin " || rm -f kaz-kum.autobil.bin kum-kaz.autobil.bin kaz-kum.automorf.bin kaz-kum.autopgen.bin kaz-kum.autogen.bin kaz-kum.t1x.bin kaz-kum.t2x.bin kaz-kum.rlx.bin kum-kaz.rlx.bin kaz-kum.lrx.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kaz-kum.kaz-kum.dix | |
lt-comp lr apertium-kaz-kum.kaz-kum.dix kaz-kum.autobil.bin | |
main@standard 1671 2288 | |
apertium-validate-dictionary apertium-kaz-kum.kaz-kum.dix | |
lt-comp rl apertium-kaz-kum.kaz-kum.dix kum-kaz.autobil.bin | |
main@standard 1653 2265 | |
if [ ! -d .deps ]; then mkdir .deps; fi | |
touch .deps/.d | |
lt-print kaz-kum.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-kum.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-kum.autobil.att > .deps/kaz-kum.autobil.hfst | |
hfst-project -p upper .deps/kaz-kum.autobil.hfst > .deps/kaz-kum.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-kum.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-kum.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-kum.autobil.prefixes -o .deps/kaz-kum.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<ltr>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-kum.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-kum.automorf.trimmed -o .deps/kaz-kum.automorf.trimmed.att | |
lt-comp lr .deps/kaz-kum.automorf.trimmed.att kaz-kum.automorf.bin | |
main@standard 38123 86166 | |
final@inconditional 2616 7439 | |
apertium-validate-dictionary ../../apertium-languages/apertium-kaz//apertium-kaz.post-kaz.dix | |
lt-comp lr ../../apertium-languages/apertium-kaz//apertium-kaz.post-kaz.dix kaz-kum.autopgen.bin | |
main@standard 10 149 | |
cp ../../apertium-languages/apertium-kum//kum.autogen.bin kaz-kum.autogen.bin | |
apertium-validate-transfer apertium-kaz-kum.kaz-kum.t1x | |
apertium-preprocess-transfer apertium-kaz-kum.kaz-kum.t1x kaz-kum.t1x.bin | |
apertium-validate-transfer apertium-kaz-kum.kaz-kum.t2x | |
apertium-preprocess-transfer apertium-kaz-kum.kaz-kum.t2x kaz-kum.t2x.bin | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-kum.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
cg-comp ../../apertium-languages/apertium-kum//apertium-kum.kum.rlx kum-kaz.rlx.bin | |
Sections: 1, Rules: 6, Sets: 20, Tags: 32 | |
lrx-comp apertium-kaz-kum.kaz-kum.lrx kaz-kum.lrx.bin | |
2: 36@40 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
cp *.mode modes/ | |
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden | |
make: *** [Makefile:781: modes/kaz-kum.mode] Fehler 1 | |
bible coverage kaz -> kum | |
Number of tokenised words in the corpus: 175579 | |
Coverage: 56.36% | |
Top unknown words in the corpus: | |
1268 Иса | |
411 туралы | |
383 сендер | |
371 рухани | |
349 Себебі | |
339 арқылы | |
323 Мәсіх | |
309 Киелі | |
308 сендерге | |
284 Исаның | |
270 Иеміз | |
246 Мәсіхтің | |
238 Сондықтан | |
219 әрі | |
211 Ізгі | |
211 күні | |
196 сияқты | |
195 діни | |
194 біз | |
188 Алайда | |
Translation time: 3.2530195713043213 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-kum.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> kum | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2675 | |
Coverage: 48.64% | |
Top unknown words in the corpus: | |
11 км | |
10 бойынша | |
8 КСРО | |
8 оңт | |
7 негізгі | |
7 тайпалар | |
6 Қазақ | |
6 экономикалық | |
6 туралы | |
6 жылғы | |
6 желтоқсанда | |
6 басшылары | |
5 бөлігін | |
5 ның | |
5 феодалдық | |
5 Украина | |
5 солт | |
4 арқылы | |
4 оңтүстік | |
4 Елдің | |
Translation time: 0.08241939544677734 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-kum.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage kum -> kaz | |
[Errno 2] No such file or directory: 'kum-kaz.automorf.bin' | |
wikipedia coverage kum -> kaz | |
[Errno 2] No such file or directory: '../../apertium-languages/apertium-kum/wiki.destxt' | |
kaz sah | |
Bereits auf 'master' | |
M ap_include.am | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 176f11224e72a9789db879fe7e88ebaf93d124db | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-sah from ../../apertium-languages/apertium-sah/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-sah.automorf.bin kaz-sah.prob kaz-sah.rlx.bin kaz-sah.autobil.bin kaz-sah.autolex.bin kaz-sah.autogen.bin kaz-sah.autopgen.bin kaz-sah.t1x.bin kaz-sah.t2x.bin kaz-sah.t3x.bin kaz-sah.t4x.bin sah-kaz.automorf.bin sah-kaz.prob sah-kaz.rlx.bin sah-kaz.autobil.bin sah-kaz.autolex.bin sah-kaz.autogen.bin sah-kaz.autopgen.bin sah-kaz.t1x.bin sah-kaz.t2x.bin sah-kaz.t3x.bin" || rm -f kaz-sah.automorf.bin kaz-sah.prob kaz-sah.rlx.bin kaz-sah.autobil.bin kaz-sah.autolex.bin kaz-sah.autogen.bin kaz-sah.autopgen.bin kaz-sah.t1x.bin kaz-sah.t2x.bin kaz-sah.t3x.bin kaz-sah.t4x.bin sah-kaz.automorf.bin sah-kaz.prob sah-kaz.rlx.bin sah-kaz.autobil.bin sah-kaz.autolex.bin sah-kaz.autogen.bin sah-kaz.autopgen.bin sah-kaz.t1x.bin sah-kaz.t2x.bin sah-kaz.t3x.bin | |
rm -rf .deps modes | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
/bin/zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
apertium-validate-dictionary apertium-kaz-sah.kaz-sah.dix | |
lt-comp lr apertium-kaz-sah.kaz-sah.dix kaz-sah.autobil.bin | |
main@standard 8508 11300 | |
lt-print kaz-sah.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-sah.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-sah.autobil.att > .deps/kaz-sah.autobil.hfst | |
hfst-project -p upper .deps/kaz-sah.autobil.hfst > .deps/kaz-sah.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-sah.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-sah.autobil.prefixes | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-sah.autobil.prefixes -o .deps/kaz-sah.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<ltr>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-sah.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-sah.automorf.trimmed -o .deps/kaz-sah.automorf.trimmed.att | |
lt-comp lr .deps/kaz-sah.automorf.trimmed.att kaz-sah.automorf.bin | |
main@standard 86196 189326 | |
final@inconditional 28 38 | |
cp ../../apertium-languages/apertium-kaz//kaz.prob kaz-sah.prob | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-sah.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
lrx-comp apertium-kaz-sah.kaz-sah.lrx kaz-sah.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-sah//sah.autogen.bin kaz-sah.autogen.bin | |
cp ../../apertium-languages/apertium-sah//sah.autopgen.bin kaz-sah.autopgen.bin | |
apertium-validate-transfer apertium-kaz-sah.kaz-sah.t1x | |
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t1x kaz-sah.t1x.bin | |
apertium-validate-interchunk apertium-kaz-sah.kaz-sah.t2x | |
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t2x kaz-sah.t2x.bin | |
apertium-validate-postchunk apertium-kaz-sah.kaz-sah.t3x | |
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t3x kaz-sah.t3x.bin | |
apertium-validate-transfer apertium-kaz-sah.kaz-sah.t4x | |
apertium-preprocess-transfer apertium-kaz-sah.kaz-sah.t4x kaz-sah.t4x.bin | |
/bin/zcat ../../apertium-languages/apertium-sah//sah.automorf.att.gz | hfst-txt2fst > .deps/sah.automorf.hfst | |
apertium-validate-dictionary apertium-kaz-sah.kaz-sah.dix | |
lt-comp rl apertium-kaz-sah.kaz-sah.dix sah-kaz.autobil.bin | |
main@standard 8502 11291 | |
lt-print sah-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/sah-kaz.autobil.att | |
hfst-txt2fst -e ε < .deps/sah-kaz.autobil.att > .deps/sah-kaz.autobil.hfst | |
hfst-project -p upper .deps/sah-kaz.autobil.hfst > .deps/sah-kaz.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/sah-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/sah-kaz.autobil.prefixes | |
hfst-compose-intersect -1 .deps/sah.automorf.hfst -2 .deps/sah-kaz.autobil.prefixes -o .deps/sah-kaz.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<apos>") in | |
transducer in file .deps/sah.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/sah-kaz.autobil.prefixes. | |
hfst-fst2txt -i .deps/sah-kaz.automorf.trimmed -o .deps/sah-kaz.automorf.trimmed.att | |
lt-comp lr .deps/sah-kaz.automorf.trimmed.att sah-kaz.automorf.bin | |
main@standard 17257 40258 | |
final@inconditional 549 1631 | |
cp ../../apertium-languages/apertium-sah//sah.prob sah-kaz.prob | |
cg-comp ../../apertium-languages/apertium-sah//apertium-sah.sah.rlx sah-kaz.rlx.bin | |
Sections: 1, Rules: 2, Sets: 7, Tags: 17 | |
1 rules cannot be skipped by index. | |
lrx-comp apertium-kaz-sah.sah-kaz.lrx sah-kaz.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin sah-kaz.autogen.bin | |
cp ../../apertium-languages/apertium-kaz//kaz.autopgen.bin sah-kaz.autopgen.bin | |
apertium-validate-transfer apertium-kaz-sah.sah-kaz.t1x | |
apertium-preprocess-transfer apertium-kaz-sah.sah-kaz.t1x sah-kaz.t1x.bin | |
apertium-validate-interchunk apertium-kaz-sah.sah-kaz.t2x | |
apertium-preprocess-transfer apertium-kaz-sah.sah-kaz.t2x sah-kaz.t2x.bin | |
apertium-validate-postchunk apertium-kaz-sah.sah-kaz.t3x | |
apertium-preprocess-transfer apertium-kaz-sah.sah-kaz.t3x sah-kaz.t3x.bin | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
lt-comp lr .deps/kaz.automorf.bin.att .deps/kaz.automorf.bin | |
main@standard 380438 893117 | |
final@inconditional 2645 7326 | |
lt-comp lr .deps/sah.automorf.bin.att .deps/sah.automorf.bin | |
main@standard 17256 40256 | |
final@inconditional 543 1625 | |
bible coverage kaz -> sah | |
Number of tokenised words in the corpus: 174579 | |
Coverage: 67.93% | |
Top unknown words in the corpus: | |
1268 Иса | |
825 Құдайдың | |
762 Құдай | |
324 1 | |
323 Мәсіх | |
306 2 | |
298 Құдайға | |
284 3 | |
284 Исаның | |
279 4 | |
276 5 | |
272 6 | |
269 7 | |
269 10 | |
267 8 | |
267 9 | |
267 11 | |
265 12 | |
264 13 | |
252 14 | |
Translation time: 4.182401418685913 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-sah.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> sah | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2675 | |
Coverage: 71.93% | |
Top unknown words in the corpus: | |
11 1991 | |
8 1 | |
8 оңт | |
7 тайпалар | |
5 2 | |
5 3 | |
5 феодалдық | |
5 30 | |
5 10 | |
5 солт | |
4 шығысында | |
4 70 | |
4 60 | |
4 салдарынан | |
4 мыңдаған | |
3 ге | |
3 созылып | |
3 өкілдері | |
3 16 | |
3 яғни | |
Translation time: 0.13700127601623535 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-sah.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage sah -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 1107 | |
Coverage: 91.06% | |
Top unknown words in the corpus: | |
5 Апостоллар | |
3 Евангелие | |
2 Спасскай | |
2 миссионердар | |
2 Аланд | |
1 Annotation | |
1 НОВЫЙ | |
1 ЗАВЕТ | |
1 якутском | |
1 языке | |
1 in | |
1 c | |
1 эҕэрдэлиибин | |
1 Тэнгри | |
1 чочуобунаны | |
1 сүрэхтэнэр | |
1 бэргэһэлэнэр | |
1 Дежнев | |
1 Абакайааданы | |
1 бэргэһэлээбит | |
Translation time: 0.04111599922180176 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./sah-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage sah -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 3672 | |
Coverage: 90.36% | |
Top unknown words in the corpus: | |
5 Орест | |
4 якутского | |
4 языка | |
3 Вейсенбург | |
2 Ромулус | |
2 киириитиэр | |
2 саарар | |
2 фон | |
2 монастырыгар | |
2 рукопись | |
2 этилэр | |
2 биллибитэ | |
2 К | |
2 Пеллерин | |
2 Кустуктуурап | |
2 буоланнар | |
2 Максимовы | |
2 Маҥаачыйа | |
2 Поликарпов | |
2 сорохторун | |
Translation time: 0.08243060111999512 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./sah-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kaz tat | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit ea9afd606afe03df1f9c7c6adc2affd0ef72500a | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-tat from ../../apertium-languages/apertium-tat/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-tat.autobil.bin tat-kaz.autobil.bin kaz-tat.automorf.bin kaz-tat.autopgen.bin kaz-tat.autogen.bin kaz-tat.t1x.bin kaz-tat.t2x.bin tat-kaz.automorf.bin tat-kaz.autopgen.bin tat-kaz.autogen.bin tat-kaz.t1x.bin tat-kaz.t2x.bin kaz-tat.rlx.bin tat-kaz.rlx.bin kaz-tat.lrx.bin tat-kaz.lrx.bin" || rm -f kaz-tat.autobil.bin tat-kaz.autobil.bin kaz-tat.automorf.bin kaz-tat.autopgen.bin kaz-tat.autogen.bin kaz-tat.t1x.bin kaz-tat.t2x.bin tat-kaz.automorf.bin tat-kaz.autopgen.bin tat-kaz.autogen.bin tat-kaz.t1x.bin tat-kaz.t2x.bin kaz-tat.rlx.bin tat-kaz.rlx.bin kaz-tat.lrx.bin tat-kaz.lrx.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kaz-tat.kaz-tat.dix | |
lt-comp lr apertium-kaz-tat.kaz-tat.dix kaz-tat.autobil.bin | |
main@standard 18888 36358 | |
apertium-validate-dictionary apertium-kaz-tat.kaz-tat.dix | |
lt-comp rl apertium-kaz-tat.kaz-tat.dix tat-kaz.autobil.bin | |
main@standard 18854 36285 | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
lt-print kaz-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-tat.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-tat.autobil.att > .deps/kaz-tat.autobil.hfst | |
hfst-project -p upper .deps/kaz-tat.autobil.hfst > .deps/kaz-tat.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-tat.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-tat.autobil.prefixes -o .deps/kaz-tat.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<percent>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-tat.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-tat.automorf.trimmed -o .deps/kaz-tat.automorf.trimmed.att | |
lt-comp lr .deps/kaz-tat.automorf.trimmed.att kaz-tat.automorf.bin | |
main@standard 210972 478879 | |
final@inconditional 2596 7002 | |
apertium-validate-dictionary apertium-kaz-tat.post-kaz.dix | |
lt-comp lr apertium-kaz-tat.post-kaz.dix kaz-tat.autopgen.bin | |
main@standard 10 149 | |
cp ../../apertium-languages/apertium-tat//tat.autogen.bin kaz-tat.autogen.bin | |
apertium-validate-transfer apertium-kaz-tat.kaz-tat.t1x | |
apertium-preprocess-transfer apertium-kaz-tat.kaz-tat.t1x kaz-tat.t1x.bin | |
apertium-validate-transfer apertium-kaz-tat.kaz-tat.t2x | |
apertium-preprocess-transfer apertium-kaz-tat.kaz-tat.t2x kaz-tat.t2x.bin | |
lt-print tat-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-kaz.autobil.att | |
hfst-txt2fst -e ε < .deps/tat-kaz.autobil.att > .deps/tat-kaz.autobil.hfst | |
hfst-project -p upper .deps/tat-kaz.autobil.hfst > .deps/tat-kaz.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tat-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-kaz.autobil.prefixes | |
zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst | |
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-kaz.autobil.prefixes -o .deps/tat-kaz.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<punct>") in | |
transducer in file .deps/tat.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tat-kaz.autobil.prefixes. | |
hfst-fst2txt -i .deps/tat-kaz.automorf.trimmed -o .deps/tat-kaz.automorf.trimmed.att | |
lt-comp lr .deps/tat-kaz.automorf.trimmed.att tat-kaz.automorf.bin | |
main@standard 97321 178518 | |
final@inconditional 755 1606 | |
apertium-validate-dictionary apertium-kaz-tat.post-tat.dix | |
lt-comp lr apertium-kaz-tat.post-tat.dix tat-kaz.autopgen.bin | |
main@standard 16 356 | |
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin tat-kaz.autogen.bin | |
apertium-validate-transfer apertium-kaz-tat.tat-kaz.t1x | |
apertium-preprocess-transfer apertium-kaz-tat.tat-kaz.t1x tat-kaz.t1x.bin | |
apertium-validate-transfer apertium-kaz-tat.tat-kaz.t2x | |
apertium-preprocess-transfer apertium-kaz-tat.tat-kaz.t2x tat-kaz.t2x.bin | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-tat.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-kaz.rlx.bin | |
Sections: 11, Rules: 123, Sets: 154, Tags: 194 | |
lrx-comp apertium-kaz-tat.kaz-tat.lrx kaz-tat.lrx.bin | |
43: 1009@1120 | |
lrx-comp apertium-kaz-tat.tat-kaz.lrx tat-kaz.lrx.bin | |
3: 49@52 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
bible coverage kaz -> tat | |
Number of tokenised words in the corpus: 214397 | |
Coverage: 95.03% | |
Top unknown words in the corpus: | |
66 яһудилер | |
65 парызшылдар | |
63 немесе | |
50 Пилат | |
49 Жохан | |
44 Аумин | |
43 Ирод | |
41 Яһудея | |
39 әзәзіл | |
36 яһудилердің | |
35 дүниелік | |
34 гөр | |
32 Ғалилея | |
31 уағыздап | |
29 екеуі | |
29 кейбіреулері | |
29 Саул | |
29 Қорынттықтарга | |
27 Лұқа | |
26 ұлылығын | |
Translation time: 7.922478675842285 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> tat | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2937 | |
Coverage: 92.17% | |
Top unknown words in the corpus: | |
5 ның | |
3 ге | |
3 одақтық | |
3 оңт | |
2 Қызылқұм | |
2 мыңжылдық | |
2 тайпалық | |
2 ғұндар | |
2 Оғыз | |
2 жоспарлық | |
2 өнеркәсіптік | |
2 Беловеж | |
2 ны | |
2 сессиясында | |
2 құрлығының | |
2 қоңыржай | |
2 респ | |
2 жоғ | |
2 өкілеттігі | |
2 мореналық | |
Translation time: 0.23727869987487793 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage tat -> kaz | |
Number of tokenised words in the corpus: 194164 | |
Coverage: 93.57% | |
Top unknown words in the corpus: | |
190 Паул | |
159 Петер | |
112 яһүдләр | |
108 берсе | |
91 яһүд | |
90 канун | |
80 әллә | |
74 карата | |
73 бөек | |
66 Шимун | |
60 Пилат | |
57 каршында | |
55 Яһүд | |
52 явыз | |
52 фарисейләр | |
49 Һируд | |
49 һәммәсе | |
49 хачка | |
47 Аннары | |
47 канунчылар | |
Translation time: 5.087080955505371 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tat -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 26 | |
Coverage: 65.38% | |
Top unknown words in the corpus: | |
1 Tatarça | |
1 İnternet | |
1 tulısınça | |
1 İnternetı | |
1 Respublikası | |
1 däwlät | |
1 tellärendä | |
1 tatar | |
1 häm | |
Translation time: 0.05028939247131348 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kaz tur | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 5939a3b8ca9a9331bc8eb1c9ec9e3824e0fa2aaa | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-tur from ../../apertium-languages/apertium-tur/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-tur.automorf.bin kaz-tur.prob kaz-tur.rlx.bin kaz-tur.autobil.bin kaz-tur.autolex.bin kaz-tur.autogen.bin kaz-tur.autopgen.bin kaz-tur.t1x.bin kaz-tur.t2x.bin kaz-tur.t3x.bin kaz-tur.t4x.bin tur-kaz.automorf.bin tur-kaz.prob tur-kaz.rlx.bin tur-kaz.autobil.bin tur-kaz.autolex.bin tur-kaz.autogen.bin tur-kaz.t1x.bin tur-kaz.t2x.bin tur-kaz.t3x.bin" || rm -f kaz-tur.automorf.bin kaz-tur.prob kaz-tur.rlx.bin kaz-tur.autobil.bin kaz-tur.autolex.bin kaz-tur.autogen.bin kaz-tur.autopgen.bin kaz-tur.t1x.bin kaz-tur.t2x.bin kaz-tur.t3x.bin kaz-tur.t4x.bin tur-kaz.automorf.bin tur-kaz.prob tur-kaz.rlx.bin tur-kaz.autobil.bin tur-kaz.autolex.bin tur-kaz.autogen.bin tur-kaz.t1x.bin tur-kaz.t2x.bin tur-kaz.t3x.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kaz-tur.kaz-tur.dix | |
lt-comp lr apertium-kaz-tur.kaz-tur.dix kaz-tur.autobil.bin | |
main@standard 20029 27244 | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
lt-print kaz-tur.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-tur.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-tur.autobil.att > .deps/kaz-tur.autobil.hfst | |
hfst-project -p upper .deps/kaz-tur.autobil.hfst > .deps/kaz-tur.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-tur.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-tur.autobil.prefixes | |
/bin/zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-tur.autobil.prefixes -o .deps/kaz-tur.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<ltr>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-tur.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-tur.automorf.trimmed -o .deps/kaz-tur.automorf.trimmed.att | |
lt-comp lr .deps/kaz-tur.automorf.trimmed.att kaz-tur.automorf.bin | |
main@standard 162122 359659 | |
final@inconditional 41 68 | |
cp ../../apertium-languages/apertium-kaz//kaz.prob kaz-tur.prob | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-tur.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
lrx-comp apertium-kaz-tur.kaz-tur.lrx kaz-tur.autolex.bin | |
95: 2190@2458 | |
cp ../../apertium-languages/apertium-tur//tur.autogen.bin kaz-tur.autogen.bin | |
cp ../../apertium-languages/apertium-tur//tur.autopgen.bin kaz-tur.autopgen.bin | |
apertium-validate-transfer apertium-kaz-tur.kaz-tur.t1x | |
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t1x kaz-tur.t1x.bin | |
Warning (717): Paths to rule 5 blocked by rule 4. | |
Warning (958): Paths to rule 13 blocked by rule 12. | |
Warning (1602): Paths to rule 34 blocked by rule 33. | |
Warning (1710): Paths to rule 36 blocked by rule 35. | |
Warning (2020): Paths to rule 46 blocked by rule 45. | |
Warning (2080): Paths to rule 48 blocked by rule 47. | |
Warning (2839): Paths to rule 71 blocked by rule 70. | |
Warning (2839): Paths to rule 71 blocked by rule 70. | |
apertium-validate-interchunk apertium-kaz-tur.kaz-tur.t2x | |
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t2x kaz-tur.t2x.bin | |
apertium-validate-postchunk apertium-kaz-tur.kaz-tur.t3x | |
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t3x kaz-tur.t3x.bin | |
apertium-validate-transfer apertium-kaz-tur.kaz-tur.t4x | |
apertium-preprocess-transfer apertium-kaz-tur.kaz-tur.t4x kaz-tur.t4x.bin | |
apertium-validate-dictionary apertium-kaz-tur.kaz-tur.dix | |
lt-comp rl apertium-kaz-tur.kaz-tur.dix tur-kaz.autobil.bin | |
main@standard 19995 27192 | |
lt-print tur-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tur-kaz.autobil.att | |
hfst-txt2fst -e ε < .deps/tur-kaz.autobil.att > .deps/tur-kaz.autobil.hfst | |
hfst-project -p upper .deps/tur-kaz.autobil.hfst > .deps/tur-kaz.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tur-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tur-kaz.autobil.prefixes | |
/bin/zcat ../../apertium-languages/apertium-tur//tur.automorf.att.gz | hfst-txt2fst > .deps/tur.automorf.hfst | |
hfst-compose-intersect -1 .deps/tur.automorf.hfst -2 .deps/tur-kaz.autobil.prefixes -o .deps/tur-kaz.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<quot>") in | |
transducer in file .deps/tur.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tur-kaz.autobil.prefixes. | |
hfst-fst2txt -i .deps/tur-kaz.automorf.trimmed -o .deps/tur-kaz.automorf.trimmed.att | |
lt-comp lr .deps/tur-kaz.automorf.trimmed.att tur-kaz.automorf.bin | |
main@standard 12675 24541 | |
final@inconditional 4052 7570 | |
cp ../../apertium-languages/apertium-tur//tur.prob tur-kaz.prob | |
cg-comp ../../apertium-languages/apertium-tur//apertium-tur.tur.rlx tur-kaz.rlx.bin | |
Sections: 4, Rules: 102, Sets: 129, Tags: 127 | |
2 rules cannot be skipped by index. | |
lrx-comp apertium-kaz-tur.tur-kaz.lrx tur-kaz.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin tur-kaz.autogen.bin | |
apertium-validate-transfer apertium-kaz-tur.tur-kaz.t1x | |
apertium-preprocess-transfer apertium-kaz-tur.tur-kaz.t1x tur-kaz.t1x.bin | |
apertium-validate-interchunk apertium-kaz-tur.tur-kaz.t2x | |
apertium-preprocess-transfer apertium-kaz-tur.tur-kaz.t2x tur-kaz.t2x.bin | |
apertium-validate-postchunk apertium-kaz-tur.tur-kaz.t3x | |
apertium-preprocess-transfer apertium-kaz-tur.tur-kaz.t3x tur-kaz.t3x.bin | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
bible coverage kaz -> tur | |
Number of tokenised words in the corpus: 214376 | |
Coverage: 89.05% | |
Top unknown words in the corpus: | |
1268 Иса | |
323 Мәсіх | |
309 Киелі | |
284 Исаның | |
246 Мәсіхтің | |
211 Ізгі | |
175 Исаға | |
151 Исаны | |
150 Петір | |
136 Пауыл | |
129 Таурат | |
127 шынайы | |
106 күнәкар | |
103 Мәсіхке | |
89 киелі | |
88 яғни | |
83 Жақия | |
83 әркім | |
79 әділ | |
79 Мұса | |
Translation time: 7.062980890274048 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-tur.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> tur | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2936 | |
Coverage: 88.28% | |
Top unknown words in the corpus: | |
8 оңт | |
5 феодалдық | |
5 солт | |
4 мыңдаған | |
3 ге | |
3 Тянь | |
3 Шань | |
3 Еділ | |
3 яғни | |
3 VI | |
3 Социалистік | |
3 жж | |
3 одақтық | |
3 ядролық | |
3 м | |
3 континенттік | |
2 Қызылқұм | |
2 тайпалық | |
2 ғұндар | |
2 әкімшілік | |
Translation time: 0.20586729049682617 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-tur.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage tur -> kaz | |
Number of tokenised words in the corpus: 493813 | |
Coverage: 82.25% | |
Top unknown words in the corpus: | |
1782 Tanrı | |
1686 Çünkü | |
1562 nın | |
1150 ın | |
1044 a | |
912 ki | |
832 Davut | |
620 üzerine | |
585 Yahuda | |
553 Ey | |
505 Yeruşalim | |
487 Egemen | |
448 Musa | |
409 na | |
390 la | |
377 Tanrısı | |
376 ı | |
362 i | |
355 Saul | |
340 dan | |
Translation time: 7.328187942504883 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tur-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tur -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 16959 | |
Coverage: 77.57% | |
Top unknown words in the corpus: | |
141 ın | |
124 Temuçin | |
53 a | |
41 ı | |
40 i | |
40 nin | |
34 Camuka | |
34 nın | |
33 Jin | |
33 Tuğrul | |
29 Cuci | |
28 Kırım | |
27 soyundan | |
27 Harezmşah | |
24 üzerine | |
22 Cebe | |
22 Hanlığı | |
17 Mukhulai | |
17 Subutay | |
16 Yesügey | |
Translation time: 0.4011809825897217 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tur-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kaz tyv | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit ba80cf81d1ca88b2b35fb961f2d746f8f28e42a2 | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-tyv from ../../apertium-languages/apertium-tyv/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-tyv.automorf.bin kaz-tyv.prob kaz-tyv.rlx.bin kaz-tyv.autobil.bin kaz-tyv.autolex.bin kaz-tyv.autogen.bin kaz-tyv.autopgen.bin kaz-tyv.t1x.bin kaz-tyv.t2x.bin kaz-tyv.t3x.bin kaz-tyv.t4x.bin tyv-kaz.automorf.bin tyv-kaz.prob tyv-kaz.rlx.bin tyv-kaz.autobil.bin tyv-kaz.autolex.bin tyv-kaz.autogen.bin tyv-kaz.autopgen.bin tyv-kaz.t1x.bin tyv-kaz.t2x.bin tyv-kaz.t3x.bin" || rm -f kaz-tyv.automorf.bin kaz-tyv.prob kaz-tyv.rlx.bin kaz-tyv.autobil.bin kaz-tyv.autolex.bin kaz-tyv.autogen.bin kaz-tyv.autopgen.bin kaz-tyv.t1x.bin kaz-tyv.t2x.bin kaz-tyv.t3x.bin kaz-tyv.t4x.bin tyv-kaz.automorf.bin tyv-kaz.prob tyv-kaz.rlx.bin tyv-kaz.autobil.bin tyv-kaz.autolex.bin tyv-kaz.autogen.bin tyv-kaz.autopgen.bin tyv-kaz.t1x.bin tyv-kaz.t2x.bin tyv-kaz.t3x.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kaz-tyv.kaz-tyv.dix | |
lt-comp lr apertium-kaz-tyv.kaz-tyv.dix kaz-tyv.autobil.bin | |
main@standard 465 671 | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
lt-print kaz-tyv.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-tyv.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-tyv.autobil.att > .deps/kaz-tyv.autobil.hfst | |
hfst-project -p upper .deps/kaz-tyv.autobil.hfst > .deps/kaz-tyv.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-tyv.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-tyv.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-tyv.autobil.prefixes -o .deps/kaz-tyv.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<ltr>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-tyv.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-tyv.automorf.trimmed -o .deps/kaz-tyv.automorf.trimmed.att | |
lt-comp lr .deps/kaz-tyv.automorf.trimmed.att kaz-tyv.automorf.bin | |
main@standard 21219 48771 | |
final@inconditional 2584 6986 | |
cp ../../apertium-languages/apertium-kaz//kaz.prob kaz-tyv.prob | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-tyv.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
lrx-comp apertium-kaz-tyv.kaz-tyv.lrx kaz-tyv.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-tyv//tyv.autogen.bin kaz-tyv.autogen.bin | |
cp ../../apertium-languages/apertium-tyv//tyv.autopgen.bin kaz-tyv.autopgen.bin | |
apertium-validate-transfer apertium-kaz-tyv.kaz-tyv.t1x | |
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t1x kaz-tyv.t1x.bin | |
apertium-validate-interchunk apertium-kaz-tyv.kaz-tyv.t2x | |
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t2x kaz-tyv.t2x.bin | |
apertium-validate-postchunk apertium-kaz-tyv.kaz-tyv.t3x | |
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t3x kaz-tyv.t3x.bin | |
apertium-validate-transfer apertium-kaz-tyv.kaz-tyv.t4x | |
apertium-preprocess-transfer apertium-kaz-tyv.kaz-tyv.t4x kaz-tyv.t4x.bin | |
apertium-validate-dictionary apertium-kaz-tyv.kaz-tyv.dix | |
lt-comp rl apertium-kaz-tyv.kaz-tyv.dix tyv-kaz.autobil.bin | |
main@standard 465 671 | |
lt-print tyv-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tyv-kaz.autobil.att | |
hfst-txt2fst -e ε < .deps/tyv-kaz.autobil.att > .deps/tyv-kaz.autobil.hfst | |
hfst-project -p upper .deps/tyv-kaz.autobil.hfst > .deps/tyv-kaz.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tyv-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tyv-kaz.autobil.prefixes | |
zcat ../../apertium-languages/apertium-tyv//tyv.automorf.att.gz | hfst-txt2fst > .deps/tyv.automorf.hfst | |
hfst-compose-intersect -1 .deps/tyv.automorf.hfst -2 .deps/tyv-kaz.autobil.prefixes -o .deps/tyv-kaz.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<subst>") in | |
transducer in file .deps/tyv.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tyv-kaz.autobil.prefixes. | |
hfst-fst2txt -i .deps/tyv-kaz.automorf.trimmed -o .deps/tyv-kaz.automorf.trimmed.att | |
lt-comp lr .deps/tyv-kaz.automorf.trimmed.att tyv-kaz.automorf.bin | |
main@standard 1721 4129 | |
final@inconditional 307 799 | |
cp ../../apertium-languages/apertium-tyv//tyv.prob tyv-kaz.prob | |
cg-comp ../../apertium-languages/apertium-tyv//apertium-tyv.tyv.rlx tyv-kaz.rlx.bin | |
Sections: 2, Rules: 34, Sets: 60, Tags: 102 | |
1 rules cannot be skipped by index. | |
lrx-comp apertium-kaz-tyv.tyv-kaz.lrx tyv-kaz.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin tyv-kaz.autogen.bin | |
cp ../../apertium-languages/apertium-kaz//kaz.autopgen.bin tyv-kaz.autopgen.bin | |
apertium-validate-transfer apertium-kaz-tyv.tyv-kaz.t1x | |
apertium-preprocess-transfer apertium-kaz-tyv.tyv-kaz.t1x tyv-kaz.t1x.bin | |
apertium-validate-interchunk apertium-kaz-tyv.tyv-kaz.t2x | |
apertium-preprocess-transfer apertium-kaz-tyv.tyv-kaz.t2x tyv-kaz.t2x.bin | |
apertium-validate-postchunk apertium-kaz-tyv.tyv-kaz.t3x | |
apertium-preprocess-transfer apertium-kaz-tyv.tyv-kaz.t3x tyv-kaz.t3x.bin | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
bible coverage kaz -> tyv | |
Number of tokenised words in the corpus: 217646 | |
Coverage: 57.56% | |
Top unknown words in the corpus: | |
1268 Иса | |
825 Құдайдың | |
808 үшін | |
762 Құдай | |
434 Сонда | |
414 осы | |
411 туралы | |
383 сендер | |
371 рухани | |
351 өз | |
349 Себебі | |
339 арқылы | |
323 Мәсіх | |
309 Киелі | |
308 сендерге | |
298 Құдайға | |
284 Исаның | |
270 Иеміз | |
246 Мәсіхтің | |
240 қатты | |
Translation time: 2.413213014602661 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-tyv.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> tyv | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2980 | |
Coverage: 40.77% | |
Top unknown words in the corpus: | |
51 Қазақстан | |
11 км | |
10 бойынша | |
8 мемлекет | |
8 Қазақстанның | |
8 КСРО | |
8 Орта | |
8 оңт | |
7 ең | |
7 негізгі | |
7 өз | |
7 тайпалар | |
6 Республикасы | |
6 орналасқан | |
6 Қазақ | |
6 шығыс | |
6 экономикалық | |
6 туралы | |
6 ірі | |
6 республика | |
Translation time: 0.06718015670776367 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-tyv.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage tyv -> kaz | |
Number of tokenised words in the corpus: 227032 | |
Coverage: 59.05% | |
Top unknown words in the corpus: | |
1547 даа | |
1179 Бурганның | |
1101 Иисус | |
703 мынча | |
678 бүгү | |
558 Бурган | |
545 силерге | |
543 Дээрги | |
532 Мен | |
501 силер | |
475 мен | |
447 дег | |
442 ла | |
430 чедип | |
423 Мээң | |
393 өске | |
373 дугайында | |
360 катап | |
321 ле | |
318 бис | |
Translation time: 1.5751702785491943 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tyv-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tyv -> kaz | |
Number of tokenised words in the corpus: 433 | |
Coverage: 49.19% | |
Top unknown words in the corpus: | |
4 В | |
4 quot | |
4 Кезер | |
4 Даңгына | |
3 Азия | |
3 Хемниң | |
3 Ачыты | |
3 Мерген | |
3 бурят | |
2 Азияның | |
2 төвү | |
2 Азий | |
2 Төвү | |
2 Тываның | |
2 тураскаал | |
2 төвүнде | |
2 он | |
2 ла | |
2 илереткен | |
2 Куулар | |
Translation time: 0.008584737777709961 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tyv-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kaz uig | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 27242d1bc93089f2430d555817239e064530f2d1 | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kaz from ../../apertium-languages/apertium-kaz/ | |
Using apertium-uig from ../../apertium-languages/apertium-uig/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kaz-uig.autobil.bin uig-kaz.autobil.bin kaz-uig.automorf.bin kaz-uig.autopgen.bin kaz-uig.autogen.bin kaz-uig.t1x.bin kaz-uig.t2x.bin uig-kaz.automorf.bin uig-kaz.autopgen.bin uig-kaz.autogen.bin uig-kaz.t1x.bin uig-kaz.t2x.bin kaz-uig.rlx.bin uig-kaz.rlx.bin kaz-uig.lrx.bin uig-kaz.lrx.bin" || rm -f kaz-uig.autobil.bin uig-kaz.autobil.bin kaz-uig.automorf.bin kaz-uig.autopgen.bin kaz-uig.autogen.bin kaz-uig.t1x.bin kaz-uig.t2x.bin uig-kaz.automorf.bin uig-kaz.autopgen.bin uig-kaz.autogen.bin uig-kaz.t1x.bin uig-kaz.t2x.bin kaz-uig.rlx.bin uig-kaz.rlx.bin kaz-uig.lrx.bin uig-kaz.lrx.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kaz-uig.kaz-uig.dix | |
lt-comp lr apertium-kaz-uig.kaz-uig.dix kaz-uig.autobil.bin | |
main@standard 6798 9416 | |
apertium-validate-dictionary apertium-kaz-uig.kaz-uig.dix | |
lt-comp rl apertium-kaz-uig.kaz-uig.dix uig-kaz.autobil.bin | |
main@standard 6786 9401 | |
if [ ! -d .deps ]; then mkdir .deps; fi | |
touch .deps/.d | |
lt-print kaz-uig.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaz-uig.autobil.att | |
hfst-txt2fst -e ε < .deps/kaz-uig.autobil.att > .deps/kaz-uig.autobil.hfst | |
hfst-project -p upper .deps/kaz-uig.autobil.hfst > .deps/kaz-uig.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaz-uig.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaz-uig.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kaz//kaz.automorf.att.gz | hfst-txt2fst > .deps/kaz.automorf.hfst | |
hfst-compose-intersect -1 .deps/kaz.automorf.hfst -2 .deps/kaz-uig.autobil.prefixes -o .deps/kaz-uig.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<ltr>") in | |
transducer in file .deps/kaz.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaz-uig.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaz-uig.automorf.trimmed -o .deps/kaz-uig.automorf.trimmed.att | |
lt-comp lr .deps/kaz-uig.automorf.trimmed.att kaz-uig.automorf.bin | |
main@standard 104981 233480 | |
final@inconditional 2589 6991 | |
apertium-validate-dictionary apertium-kaz-uig.post-kaz.dix | |
lt-comp lr apertium-kaz-uig.post-kaz.dix kaz-uig.autopgen.bin | |
main@standard 10 149 | |
cp ../../apertium-languages/apertium-uig//uig.autogen.bin kaz-uig.autogen.bin | |
apertium-validate-transfer apertium-kaz-uig.kaz-uig.t1x | |
apertium-preprocess-transfer apertium-kaz-uig.kaz-uig.t1x kaz-uig.t1x.bin | |
apertium-validate-transfer apertium-kaz-uig.kaz-uig.t2x | |
apertium-preprocess-transfer apertium-kaz-uig.kaz-uig.t2x kaz-uig.t2x.bin | |
lt-print uig-kaz.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/uig-kaz.autobil.att | |
hfst-txt2fst -e ε < .deps/uig-kaz.autobil.att > .deps/uig-kaz.autobil.hfst | |
hfst-project -p upper .deps/uig-kaz.autobil.hfst > .deps/uig-kaz.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/uig-kaz.autobil.upper -2 .deps/any-symbol.hfst -o .deps/uig-kaz.autobil.prefixes | |
zcat ../../apertium-languages/apertium-uig//uig.automorf.att.gz | hfst-txt2fst > .deps/uig.automorf.hfst | |
hfst-compose-intersect -1 .deps/uig.automorf.hfst -2 .deps/uig-kaz.autobil.prefixes -o .deps/uig-kaz.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<barb>") in | |
transducer in file .deps/uig.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/uig-kaz.autobil.prefixes. | |
hfst-fst2txt -i .deps/uig-kaz.automorf.trimmed -o .deps/uig-kaz.automorf.trimmed.att | |
lt-comp lr .deps/uig-kaz.automorf.trimmed.att uig-kaz.automorf.bin | |
main@standard 7086 37292 | |
final@inconditional 17 38 | |
apertium-validate-dictionary apertium-kaz-uig.post-uig.dix | |
lt-comp lr apertium-kaz-uig.post-uig.dix uig-kaz.autopgen.bin | |
main@standard 9 114 | |
cp ../../apertium-languages/apertium-kaz//kaz.autogen.bin uig-kaz.autogen.bin | |
apertium-validate-transfer apertium-kaz-uig.uig-kaz.t1x | |
apertium-preprocess-transfer apertium-kaz-uig.uig-kaz.t1x uig-kaz.t1x.bin | |
apertium-validate-transfer apertium-kaz-uig.uig-kaz.t2x | |
apertium-preprocess-transfer apertium-kaz-uig.uig-kaz.t2x uig-kaz.t2x.bin | |
cg-comp ../../apertium-languages/apertium-kaz//apertium-kaz.kaz.rlx kaz-uig.rlx.bin | |
Sections: 3, Rules: 150, Sets: 204, Tags: 234 | |
1 rules cannot be skipped by index. | |
cg-comp ../../apertium-languages/apertium-uig//apertium-uig.uig.rlx uig-kaz.rlx.bin | |
Sections: 1, Rules: 55, Sets: 81, Tags: 147 | |
lrx-comp apertium-kaz-uig.kaz-uig.lrx kaz-uig.lrx.bin | |
6: 99@109 | |
lrx-comp apertium-kaz-uig.uig-kaz.lrx uig-kaz.lrx.bin | |
1: 19@19 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
cp *.mode modes/ | |
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden | |
make: *** [Makefile:779: modes/kaz-uig.mode] Fehler 1 | |
bible coverage kaz -> uig | |
Number of tokenised words in the corpus: 215836 | |
Coverage: 79.13% | |
Top unknown words in the corpus: | |
1268 Иса | |
462 былай | |
434 Сонда | |
323 Мәсіх | |
284 Исаның | |
270 Иеміз | |
246 Мәсіхтің | |
238 Сондықтан | |
211 Ізгі | |
208 Содан | |
208 айтып | |
205 кезде | |
188 Алайда | |
181 етіп | |
175 Исаға | |
174 барып | |
166 жерде | |
151 Исаны | |
150 Петір | |
141 Сонымен | |
Translation time: 4.965975522994995 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-uig.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaz -> uig | |
Error: Malformed input stream.Number of tokenised words in the corpus: 2966 | |
Coverage: 70.23% | |
Top unknown words in the corpus: | |
8 КСРО | |
8 оңт | |
7 тайпалар | |
7 жерінде | |
6 Республикасы | |
6 Қазақ | |
6 шығыс | |
6 жер | |
6 республика | |
6 желтоқсанда | |
6 басшылары | |
6 республиканың | |
5 ның | |
5 батыс | |
5 Украина | |
5 Республикасының | |
5 солт | |
4 шығысында | |
4 тау | |
4 Каспий | |
Translation time: 0.15818142890930176 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaz-uig.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage uig -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 692001 | |
Coverage: 57.33% | |
Top unknown words in the corpus: | |
5391 ۋە | |
4124 بۇ | |
4115 ئۇ | |
3007 بىر | |
2610 مەن | |
2541 ئۇالر | |
2289 دەپ | |
2189 ئۈچۈن | |
2173 دېدى | |
2159 ئەيسا | |
2014 ھەزرىتى | |
1875 پەرۋەردىگار | |
1704 قىلىپ | |
1656 بولۇپ | |
1454 ئۆز | |
1379 چۈنكى | |
1377 سىلەر | |
1345 ئۇالرنىڭ | |
1297 بولغان | |
1296 قىلغان | |
Translation time: 4.557683944702148 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./uig-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage uig -> kaz | |
Error: Malformed input stream.Number of tokenised words in the corpus: 194 | |
Coverage: 41.24% | |
Top unknown words in the corpus: | |
3 ئۇيغۇر | |
3 كومپۇتەر | |
2 ۋە | |
2 بولۇپ | |
2 بیزنیڭ | |
2 ئاز | |
2 كیشیلیریمیز | |
2 جۇڭخۇا | |
2 جۇمھۇرىيىتى | |
2 شەھىرى | |
1 ئۇيغۇرچە | |
1 ۋىكىپىدىيە | |
1 خەلقئارالىق | |
1 ئۇچۇر | |
1 بېتى | |
1 ۋىكىپېدىيەنىڭ | |
1 نۇسخاسىغا | |
1 خوش | |
1 كېلىپسىز | |
1 تاللانغان | |
Translation time: 0.015642166137695312 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./uig-kaz.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
kir uzb | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 0bd73de9fd7a7b50bfb4d95ec7c3837a7c25a164 | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-kir from ../../apertium-languages/apertium-kir/ | |
Using apertium-uzb from ../../apertium-languages/apertium-uzb/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "kir-uzb.autobil.bin uzb-kir.autobil.bin kir-uzb.automorf.bin kir-uzb.autopgen.bin kir-uzb.autogen.bin kir-uzb.t1x.bin kir-uzb.t2x.bin uzb-kir.automorf.bin uzb-kir.autopgen.bin uzb-kir.autogen.bin uzb-kir.t1x.bin uzb-kir.t2x.bin kir-uzb.rlx.bin uzb-kir.rlx.bin kir-uzb.autolex.bin uzb-kir.autolex.bin" || rm -f kir-uzb.autobil.bin uzb-kir.autobil.bin kir-uzb.automorf.bin kir-uzb.autopgen.bin kir-uzb.autogen.bin kir-uzb.t1x.bin kir-uzb.t2x.bin uzb-kir.automorf.bin uzb-kir.autopgen.bin uzb-kir.autogen.bin uzb-kir.t1x.bin uzb-kir.t2x.bin kir-uzb.rlx.bin uzb-kir.rlx.bin kir-uzb.autolex.bin uzb-kir.autolex.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-kir-uzb.kir-uzb.dix | |
lt-comp lr apertium-kir-uzb.kir-uzb.dix kir-uzb.autobil.bin | |
main@standard 838 1151 | |
apertium-validate-dictionary apertium-kir-uzb.kir-uzb.dix | |
lt-comp rl apertium-kir-uzb.kir-uzb.dix uzb-kir.autobil.bin | |
main@standard 838 1151 | |
if [ ! -d .deps ]; then mkdir .deps; fi | |
touch .deps/.d | |
lt-print kir-uzb.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kir-uzb.autobil.att | |
hfst-txt2fst -e ε < .deps/kir-uzb.autobil.att > .deps/kir-uzb.autobil.hfst | |
hfst-project -p upper .deps/kir-uzb.autobil.hfst > .deps/kir-uzb.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kir-uzb.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kir-uzb.autobil.prefixes | |
zcat ../../apertium-languages/apertium-kir//kir.automorf.att.gz | hfst-txt2fst > .deps/kir.automorf.hfst | |
hfst-compose-intersect -1 .deps/kir.automorf.hfst -2 .deps/kir-uzb.autobil.prefixes -o .deps/kir-uzb.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<quot>") in | |
transducer in file .deps/kir.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kir-uzb.autobil.prefixes. | |
hfst-fst2fst -O -i .deps/kir-uzb.automorf.trimmed -o kir-uzb.automorf.bin | |
hfst-fst2txt -i .deps/kir-uzb.automorf.trimmed -o .deps/kir-uzb.automorf.trimmed.att | |
lt-comp lr .deps/kir-uzb.automorf.trimmed.att kir-uzb.automorf.bin | |
main@standard 6684 15957 | |
final@inconditional 827 2299 | |
cp ../../apertium-languages/apertium-kir//kir.autopgen.bin kir-uzb.autopgen.bin | |
cp ../../apertium-languages/apertium-uzb//uzb.autogen.bin kir-uzb.autogen.bin | |
apertium-validate-transfer apertium-kir-uzb.kir-uzb.t1x | |
apertium-preprocess-transfer apertium-kir-uzb.kir-uzb.t1x kir-uzb.t1x.bin | |
apertium-validate-transfer apertium-kir-uzb.kir-uzb.t2x | |
apertium-preprocess-transfer apertium-kir-uzb.kir-uzb.t2x kir-uzb.t2x.bin | |
lt-print uzb-kir.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/uzb-kir.autobil.att | |
hfst-txt2fst -e ε < .deps/uzb-kir.autobil.att > .deps/uzb-kir.autobil.hfst | |
hfst-project -p upper .deps/uzb-kir.autobil.hfst > .deps/uzb-kir.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/uzb-kir.autobil.upper -2 .deps/any-symbol.hfst -o .deps/uzb-kir.autobil.prefixes | |
zcat ../../apertium-languages/apertium-uzb//uzb.automorf.att.gz | hfst-txt2fst > .deps/uzb.automorf.hfst | |
hfst-compose-intersect -1 .deps/uzb.automorf.hfst -2 .deps/uzb-kir.autobil.prefixes -o .deps/uzb-kir.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("{🂡}") in | |
transducer in file .deps/uzb.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/uzb-kir.autobil.prefixes. | |
hfst-fst2txt -i .deps/uzb-kir.automorf.trimmed -o .deps/uzb-kir.automorf.trimmed.att | |
lt-comp lr .deps/uzb-kir.automorf.trimmed.att uzb-kir.automorf.bin | |
main@standard 1109 1924 | |
final@inconditional 21 94 | |
apertium-validate-dictionary ../../apertium-languages/apertium-uzb//apertium-uzb.post-uzb.dix | |
lt-comp lr ../../apertium-languages/apertium-uzb//apertium-uzb.post-uzb.dix uzb-kir.autopgen.bin | |
main@standard 16 356 | |
cp ../../apertium-languages/apertium-kir//kir.autogen.bin uzb-kir.autogen.bin | |
apertium-validate-transfer apertium-kir-uzb.uzb-kir.t1x | |
apertium-preprocess-transfer apertium-kir-uzb.uzb-kir.t1x uzb-kir.t1x.bin | |
apertium-validate-transfer apertium-kir-uzb.uzb-kir.t2x | |
apertium-preprocess-transfer apertium-kir-uzb.uzb-kir.t2x uzb-kir.t2x.bin | |
cg-comp ../../apertium-languages/apertium-kir//apertium-kir.kir.rlx kir-uzb.rlx.bin | |
Sections: 3, Rules: 71, Sets: 102, Tags: 126 | |
cg-comp ../../apertium-languages/apertium-uzb//apertium-uzb.uzb.rlx uzb-kir.rlx.bin | |
Sections: 0, Rules: 62, Sets: 54, Tags: 104 | |
lrx-comp apertium-kir-uzb.kir-uzb.lrx kir-uzb.autolex.bin | |
1: 19@19 | |
lrx-comp apertium-kir-uzb.uzb-kir.lrx uzb-kir.autolex.bin | |
1: 19@19 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
cp *.mode modes/ | |
cp: der Aufruf von stat für '*.mode' ist nicht möglich: Datei oder Verzeichnis nicht gefunden | |
make: *** [Makefile:774: modes/kir-uzb.mode] Fehler 1 | |
bible coverage kir -> uzb | |
Number of tokenised words in the corpus: 205768 | |
Coverage: 64.63% | |
Top unknown words in the corpus: | |
1279 Ыйса | |
946 Кудай | |
597 Кудайдын | |
582 алып | |
380 Машаяк | |
362 Ыйсанын | |
325 өз | |
305 Кудайга | |
284 Ыйык | |
264 Анан | |
259 Эгебиз | |
246 баары | |
237 берди | |
229 ар | |
225 киши | |
208 Ыйсаны | |
204 Өз | |
189 керек | |
188 көп | |
187 эл | |
Translation time: 2.4062106609344482 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kir-uzb.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kir -> uzb | |
Error: Malformed input stream.Number of tokenised words in the corpus: 9480 | |
Coverage: 44.46% | |
Top unknown words in the corpus: | |
51 Кыргыз | |
29 Кыргызстандын | |
29 Республикасынын | |
28 табигый | |
28 географиялык | |
27 География | |
25 кылымдын | |
24 ж | |
23 илимий | |
20 ар | |
20 жылы | |
19 жайгашкан | |
18 география | |
18 кыргыз | |
18 тоо | |
17 Географиялык | |
17 А | |
16 Кыргызстан | |
15 экономикалык | |
15 С | |
Translation time: 0.09597134590148926 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kir-uzb.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage uzb -> kir | |
Number of tokenised words in the corpus: 215561 | |
Coverage: 51.41% | |
Top unknown words in the corpus: | |
3577 bo | |
3488 o | |
2129 ko | |
1423 Iso | |
1162 O | |
985 g | |
925 qo | |
854 so | |
755 yo | |
741 Xudo | |
735 to | |
715 z | |
553 Xudoning | |
450 lib | |
395 lgan | |
391 Masih | |
365 zi | |
352 har | |
345 lsa | |
333 shunday | |
Translation time: 0.743370771408081 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./uzb-kir.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage uzb -> kir | |
Error: Malformed input stream.Number of tokenised words in the corpus: 4189 | |
Coverage: 41.27% | |
Top unknown words in the corpus: | |
32 X | |
27 Oʻzbekiston | |
22 av | |
21 Xorazm | |
15 qad | |
14 boʻlgan | |
14 mil | |
12 qalʼa | |
12 Mil | |
11 asr | |
11 yasalgan | |
10 boʻlib | |
10 xom | |
10 oʻlka | |
10 ning | |
10 shim | |
10 da | |
9 jan | |
9 madaniyati | |
8 qismi | |
Translation time: 0.02355480194091797 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./uzb-kir.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
nog kaz | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 64776015694b4e339eab1cf9b23ae9f4c6c9cb28 | |
bible coverage nog -> kaz | |
[Errno 2] No such file or directory: 'nog-kaz.automorf.bin' | |
wikipedia coverage nog -> kaz | |
[Errno 2] No such file or directory: '../../apertium-languages/apertium-nog/wiki.destxt' | |
bible coverage kaz -> nog | |
[Errno 2] No such file or directory: 'kaz-nog.automorf.bin' | |
wikipedia coverage kaz -> nog | |
[Errno 2] No such file or directory: 'kaz-nog.automorf.bin' | |
tat bak | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 94b66d3c663e88ad5263734620780b2eeea80c16 | |
configure.ac:4: warning: AM_INIT_AUTOMAKE: two- and three-arguments forms are deprecated. For more info, see: | |
configure.ac:4: https://www.gnu.org/software/automake/manual/automake.html#Modernize-AM_005fINIT_005fAUTOMAKE-invocation | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-tat from ../../apertium-languages/apertium-tat/ | |
Using apertium-bak from ../../apertium-languages/apertium-bak/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "tat-bak.autobil.bin bak-tat.autobil.bin tat-bak.automorf.bin tat-bak.autopgen.bin tat-bak.autogen.bin tat-bak.t1x.bin tat-bak.t2x.bin bak-tat.automorf.bin bak-tat.autopgen.bin bak-tat.autogen.bin bak-tat.t1x.bin bak-tat.t2x.bin tat-bak.rlx.bin bak-tat.rlx.bin tat-bak.lrx.bin bak-tat.lrx.bin" || rm -f tat-bak.autobil.bin bak-tat.autobil.bin tat-bak.automorf.bin tat-bak.autopgen.bin tat-bak.autogen.bin tat-bak.t1x.bin tat-bak.t2x.bin bak-tat.automorf.bin bak-tat.autopgen.bin bak-tat.autogen.bin bak-tat.t1x.bin bak-tat.t2x.bin tat-bak.rlx.bin bak-tat.rlx.bin tat-bak.lrx.bin bak-tat.lrx.bin | |
rm -rf .deps modes | |
apertium-validate-dictionary apertium-tat-bak.tat-bak.dix | |
lt-comp lr apertium-tat-bak.tat-bak.dix tat-bak.autobil.bin | |
main@standard 71611 117353 | |
apertium-validate-dictionary apertium-tat-bak.tat-bak.dix | |
lt-comp rl apertium-tat-bak.tat-bak.dix bak-tat.autobil.bin | |
main@standard 71609 117346 | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
lt-print tat-bak.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-bak.autobil.att | |
hfst-txt2fst -e ε < .deps/tat-bak.autobil.att > .deps/tat-bak.autobil.hfst | |
hfst-project -p upper .deps/tat-bak.autobil.hfst > .deps/tat-bak.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tat-bak.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-bak.autobil.prefixes | |
zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst | |
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-bak.autobil.prefixes -o .deps/tat-bak.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<punct>") in | |
transducer in file .deps/tat.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tat-bak.autobil.prefixes. | |
hfst-fst2txt -i .deps/tat-bak.automorf.trimmed -o .deps/tat-bak.automorf.trimmed.att | |
lt-comp lr .deps/tat-bak.automorf.trimmed.att tat-bak.automorf.bin | |
main@standard 225878 445718 | |
final@inconditional 38 64 | |
apertium-validate-dictionary apertium-tat-bak.post-tat.dix | |
lt-comp lr apertium-tat-bak.post-tat.dix tat-bak.autopgen.bin | |
main@standard 16 356 | |
cp ../../apertium-languages/apertium-bak//bak.autogen.bin tat-bak.autogen.bin | |
apertium-validate-transfer apertium-tat-bak.tat-bak.t1x | |
apertium-preprocess-transfer apertium-tat-bak.tat-bak.t1x tat-bak.t1x.bin | |
apertium-validate-transfer apertium-tat-bak.tat-bak.t2x | |
apertium-preprocess-transfer apertium-tat-bak.tat-bak.t2x tat-bak.t2x.bin | |
lt-print bak-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/bak-tat.autobil.att | |
hfst-txt2fst -e ε < .deps/bak-tat.autobil.att > .deps/bak-tat.autobil.hfst | |
hfst-project -p upper .deps/bak-tat.autobil.hfst > .deps/bak-tat.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/bak-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/bak-tat.autobil.prefixes | |
zcat ../../apertium-languages/apertium-bak//bak.automorf.att.gz | hfst-txt2fst > .deps/bak.automorf.hfst | |
hfst-compose-intersect -1 .deps/bak.automorf.hfst -2 .deps/bak-tat.autobil.prefixes -o .deps/bak-tat.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<punct>") in | |
transducer in file .deps/bak.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/bak-tat.autobil.prefixes. | |
hfst-fst2txt -i .deps/bak-tat.automorf.trimmed -o .deps/bak-tat.automorf.trimmed.att | |
lt-comp lr .deps/bak-tat.automorf.trimmed.att bak-tat.automorf.bin | |
main@standard 78313 141455 | |
final@inconditional 15 35 | |
apertium-validate-dictionary apertium-tat-bak.post-bak.dix | |
lt-comp lr apertium-tat-bak.post-bak.dix bak-tat.autopgen.bin | |
main@standard 10 149 | |
cp ../../apertium-languages/apertium-tat//tat.autogen.bin bak-tat.autogen.bin | |
apertium-validate-transfer apertium-tat-bak.bak-tat.t1x | |
apertium-preprocess-transfer apertium-tat-bak.bak-tat.t1x bak-tat.t1x.bin | |
apertium-validate-transfer apertium-tat-bak.bak-tat.t2x | |
apertium-preprocess-transfer apertium-tat-bak.bak-tat.t2x bak-tat.t2x.bin | |
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-bak.rlx.bin | |
Sections: 11, Rules: 123, Sets: 154, Tags: 194 | |
cg-comp ../../apertium-languages/apertium-bak//apertium-bak.bak.rlx bak-tat.rlx.bin | |
Sections: 1, Rules: 5, Sets: 25, Tags: 44 | |
lrx-comp apertium-tat-bak.tat-bak.lrx tat-bak.lrx.bin | |
2: 34@36 | |
lrx-comp apertium-tat-bak.bak-tat.lrx bak-tat.lrx.bin | |
2: 31@33 | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
bible coverage tat -> bak | |
Number of tokenised words in the corpus: 196787 | |
Coverage: 97.34% | |
Top unknown words in the corpus: | |
57 каршында | |
52 явыз | |
52 фарисейләр | |
49 Һируд | |
49 хачка | |
47 канунчылар | |
36 Имандашлар | |
33 савыктыра | |
33 Барнаб | |
30 кайберләре | |
29 Шаул | |
29 Corinthians | |
28 Matthew | |
28 дучар | |
28 беркайчан | |
28 John | |
28 Acts | |
27 имандаш | |
26 Гәлиләя | |
26 чумдырылу | |
Translation time: 6.27307653427124 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-bak.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tat -> bak | |
Error: Malformed input stream.Number of tokenised words in the corpus: 26 | |
Coverage: 46.15% | |
Top unknown words in the corpus: | |
3 Tatnet | |
1 Tatarça | |
1 İnternet | |
1 tulısınça | |
1 Tatar | |
1 İnternetı | |
1 Tatarstan | |
1 Respublikası | |
1 däwlät | |
1 tellärendä | |
1 tatar | |
1 häm | |
Translation time: 0.12012624740600586 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-bak.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage bak -> tat | |
Number of tokenised words in the corpus: 197387 | |
Coverage: 94.05% | |
Top unknown words in the corpus: | |
176 алдында | |
144 Һөйөнөслө | |
114 китте | |
94 имандаштар | |
75 үҙҙәре | |
71 шундай | |
63 алдына | |
58 ҡыуып | |
54 арҡысаҡҡа | |
53 киткән | |
52 фарисейҙар | |
51 бөтөнөһө | |
50 ҡисса | |
49 дусар | |
49 өҫтөнән | |
48 Ирод | |
48 береһенә | |
48 Имандаштар | |
46 Йәһүҙә | |
46 халҡы | |
Translation time: 4.23078179359436 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./bak-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage bak -> tat | |
Error: Malformed input stream.Number of tokenised words in the corpus: 474 | |
Coverage: 96.20% | |
Top unknown words in the corpus: | |
4 власы | |
2 ө | |
2 н | |
1 ноябрендә | |
1 октябрендә | |
1 суверенитеты | |
1 февраленән | |
1 ТӨРКСОЙ | |
1 Халҡы | |
1 ын | |
1 тауҙарының | |
1 Ямантау | |
1 мәмерйәләре | |
Translation time: 0.06259441375732422 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./bak-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
tat kaa | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit e685b6d852eb648f87d89649c331bc75898cc1ce | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-tat from ../../apertium-languages/apertium-tat/ | |
Using apertium-kaa from ../../apertium-languages/apertium-kaa/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |
config.status: creating Makefile | |
test -z "tat-kaa.automorf.bin tat-kaa.prob tat-kaa.rlx.bin tat-kaa.autobil.bin tat-kaa.autolex.bin tat-kaa.autogen.bin tat-kaa.autopgen.bin tat-kaa.t1x.bin tat-kaa.t2x.bin tat-kaa.t3x.bin kaa-tat.automorf.bin kaa-tat.rlx.bin kaa-tat.autobil.bin kaa-tat.autolex.bin kaa-tat.autogen.bin kaa-tat.autopgen.bin kaa-tat.t1x.bin kaa-tat.t2x.bin kaa-tat.t3x.bin" || rm -f tat-kaa.automorf.bin tat-kaa.prob tat-kaa.rlx.bin tat-kaa.autobil.bin tat-kaa.autolex.bin tat-kaa.autogen.bin tat-kaa.autopgen.bin tat-kaa.t1x.bin tat-kaa.t2x.bin tat-kaa.t3x.bin kaa-tat.automorf.bin kaa-tat.rlx.bin kaa-tat.autobil.bin kaa-tat.autolex.bin kaa-tat.autogen.bin kaa-tat.autopgen.bin kaa-tat.t1x.bin kaa-tat.t2x.bin kaa-tat.t3x.bin | |
rm -rf .deps modes | |
/bin/mkdir -p .deps | |
touch .deps/.d | |
/bin/zcat ../../apertium-languages/apertium-tat//tat.automorf.att.gz | hfst-txt2fst > .deps/tat.automorf.hfst | |
apertium-validate-dictionary apertium-tat-kaa.tat-kaa.dix | |
lt-comp lr apertium-tat-kaa.tat-kaa.dix tat-kaa.autobil.bin | |
main@standard 9 17 | |
lt-print tat-kaa.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/tat-kaa.autobil.att | |
hfst-txt2fst -e ε < .deps/tat-kaa.autobil.att > .deps/tat-kaa.autobil.hfst | |
hfst-project -p upper .deps/tat-kaa.autobil.hfst > .deps/tat-kaa.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/tat-kaa.autobil.upper -2 .deps/any-symbol.hfst -o .deps/tat-kaa.autobil.prefixes | |
hfst-compose-intersect -1 .deps/tat.automorf.hfst -2 .deps/tat-kaa.autobil.prefixes -o .deps/tat-kaa.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<punct>") in | |
transducer in file .deps/tat.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/tat-kaa.autobil.prefixes. | |
hfst-fst2txt -i .deps/tat-kaa.automorf.trimmed -o .deps/tat-kaa.automorf.trimmed.att | |
lt-comp lr .deps/tat-kaa.automorf.trimmed.att tat-kaa.automorf.bin | |
main@standard 351 668 | |
final@inconditional 8 12 | |
cp ../../apertium-languages/apertium-tat//tat.prob tat-kaa.prob | |
cg-comp ../../apertium-languages/apertium-tat//apertium-tat.tat.rlx tat-kaa.rlx.bin | |
Sections: 11, Rules: 123, Sets: 154, Tags: 194 | |
lrx-comp apertium-tat-kaa.tat-kaa.lrx tat-kaa.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-kaa//kaa.autogen.bin tat-kaa.autogen.bin | |
cp ../../apertium-languages/apertium-kaa//kaa.autopgen.bin tat-kaa.autopgen.bin | |
apertium-validate-transfer apertium-tat-kaa.tat-kaa.t1x | |
apertium-preprocess-transfer apertium-tat-kaa.tat-kaa.t1x tat-kaa.t1x.bin | |
apertium-validate-interchunk apertium-tat-kaa.tat-kaa.t2x | |
apertium-preprocess-transfer apertium-tat-kaa.tat-kaa.t2x tat-kaa.t2x.bin | |
apertium-validate-postchunk apertium-tat-kaa.tat-kaa.t3x | |
apertium-preprocess-transfer apertium-tat-kaa.tat-kaa.t3x tat-kaa.t3x.bin | |
/bin/zcat ../../apertium-languages/apertium-kaa//kaa.automorf.att.gz | hfst-txt2fst > .deps/kaa.automorf.hfst | |
apertium-validate-dictionary apertium-tat-kaa.tat-kaa.dix | |
lt-comp rl apertium-tat-kaa.tat-kaa.dix kaa-tat.autobil.bin | |
main@standard 9 17 | |
lt-print kaa-tat.autobil.bin | sed 's/ /@_SPACE_@/g' > .deps/kaa-tat.autobil.att | |
hfst-txt2fst -e ε < .deps/kaa-tat.autobil.att > .deps/kaa-tat.autobil.hfst | |
hfst-project -p upper .deps/kaa-tat.autobil.hfst > .deps/kaa-tat.autobil.upper | |
echo " ?* " | hfst-regexp2fst > .deps/any-symbol.hfst | |
hfst-concatenate -1 .deps/kaa-tat.autobil.upper -2 .deps/any-symbol.hfst -o .deps/kaa-tat.autobil.prefixes | |
hfst-compose-intersect -1 .deps/kaa.automorf.hfst -2 .deps/kaa-tat.autobil.prefixes -o .deps/kaa-tat.automorf.trimmed | |
hfst-compose-intersect: warning: | |
Found output multi-char symbols ("<apos>") in | |
transducer in file .deps/kaa.automorf.hfst which are not found on the | |
input tapes of transducers in file .deps/kaa-tat.autobil.prefixes. | |
hfst-fst2txt -i .deps/kaa-tat.automorf.trimmed -o .deps/kaa-tat.automorf.trimmed.att | |
lt-comp lr .deps/kaa-tat.automorf.trimmed.att kaa-tat.automorf.bin | |
main@standard 183 359 | |
final@inconditional 7 12 | |
cg-comp ../../apertium-languages/apertium-kaa//apertium-kaa.kaa.rlx kaa-tat.rlx.bin | |
Sections: 1, Rules: 1, Sets: 5, Tags: 23 | |
lrx-comp apertium-tat-kaa.kaa-tat.lrx kaa-tat.autolex.bin | |
1: 28@29 | |
cp ../../apertium-languages/apertium-tat//tat.autogen.bin kaa-tat.autogen.bin | |
cp ../../apertium-languages/apertium-tat//tat.autopgen.bin kaa-tat.autopgen.bin | |
apertium-validate-transfer apertium-tat-kaa.kaa-tat.t1x | |
apertium-preprocess-transfer apertium-tat-kaa.kaa-tat.t1x kaa-tat.t1x.bin | |
apertium-validate-interchunk apertium-tat-kaa.kaa-tat.t2x | |
apertium-preprocess-transfer apertium-tat-kaa.kaa-tat.t2x kaa-tat.t2x.bin | |
apertium-validate-postchunk apertium-tat-kaa.kaa-tat.t3x | |
apertium-preprocess-transfer apertium-tat-kaa.kaa-tat.t3x kaa-tat.t3x.bin | |
apertium-validate-modes modes.xml | |
apertium-gen-modes modes.xml | |
lt-comp lr .deps/tat.automorf.bin.att .deps/tat.automorf.bin | |
main@standard 242055 497437 | |
final@inconditional 805 1769 | |
lt-comp lr .deps/kaa.automorf.bin.att .deps/kaa.automorf.bin | |
main@standard 22375 47983 | |
final@inconditional 443 1599 | |
bible coverage tat -> kaa | |
Number of tokenised words in the corpus: 178385 | |
Coverage: 19.96% | |
Top unknown words in the corpus: | |
3525 һәм | |
1964 белән | |
1351 Гайсә | |
1335 дип | |
1279 өчен | |
1202 дә | |
1126 Аллаһы | |
1109 да | |
1044 Ул | |
711 Мин | |
710 ул | |
630 бер | |
622 Аның | |
607 алар | |
587 иде | |
551 сез | |
533 бу | |
516 диде | |
515 итеп | |
511 ә | |
Translation time: 0.3744645118713379 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-kaa.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage tat -> kaa | |
Error: Malformed input stream.Number of tokenised words in the corpus: 17 | |
Coverage: 17.65% | |
Top unknown words in the corpus: | |
2 Tatnet | |
1 ^Tatnet | |
1 Tatarça | |
1 İnternet | |
1 tulısınça | |
1 Tatar | |
1 İnternetı | |
1 Tatarstan | |
1 Respublikası | |
1 däwlät | |
1 tellärendä | |
1 tatar | |
1 häm | |
Translation time: 0.0061550140380859375 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./tat-kaa.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
bible coverage kaa -> tat | |
Number of tokenised words in the corpus: 172711 | |
Coverage: 16.31% | |
Top unknown words in the corpus: | |
2075 hám | |
1625 menen | |
1303 ushın | |
1223 İysa | |
1223 de | |
1134 O | |
1111 bir | |
1060 da | |
1038 dep | |
1032 dedi | |
876 edi | |
817 Qudaydıń | |
807 Ol | |
710 Biraq | |
645 Quday | |
629 adam | |
620 Men | |
563 bul | |
520 Muxaddes | |
515 etip | |
Translation time: 0.3134338855743408 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaa-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
wikipedia coverage kaa -> tat | |
Error: Malformed input stream.Number of tokenised words in the corpus: 3 | |
Coverage: 33.33% | |
Top unknown words in the corpus: | |
1 ^Bas | |
1 bet | |
Translation time: 0.004499197006225586 seconds | |
Generating hitparade (might take a bit)! | |
Could not open transducer file ./kaa-tat.automorf.hfst | |
TOP UNKNOWN WORDS: | |
coverage: 0 / 0 (Error 10002) | |
remaining unknown forms: 0 | |
tat kir | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 56e673ad16a30e2a0eb0015015455265b66a3560 | |
bible coverage tat -> kir | |
[Errno 2] No such file or directory: 'tat-kir.automorf.bin' | |
wikipedia coverage tat -> kir | |
[Errno 2] No such file or directory: 'tat-kir.automorf.bin' | |
bible coverage kir -> tat | |
[Errno 2] No such file or directory: 'kir-tat.automorf.bin' | |
wikipedia coverage kir -> tat | |
[Errno 2] No such file or directory: 'kir-tat.automorf.bin' | |
tuk tur | |
Bereits auf 'master' | |
Ihr Branch ist auf demselben Stand wie 'origin/master'. | |
Bereits aktuell. | |
commit 9447fb2278ed49b2dd982d6a3871e0cc5c250bd1 | |
checking for a BSD-compatible install... /usr/bin/install -c | |
checking whether build environment is sane... yes | |
checking for a thread-safe mkdir -p... /bin/mkdir -p | |
checking for gawk... gawk | |
checking whether make sets $(MAKE)... yes | |
checking whether make supports nested variables... yes | |
checking whether ln -s works... yes | |
checking for gawk... (cached) gawk | |
checking for pkg-config... /usr/bin/pkg-config | |
checking pkg-config is at least version 0.9.0... yes | |
checking for APERTIUM... yes | |
checking for hfst-lexc... /usr/bin/hfst-lexc | |
checking for hfst-twolc... /usr/bin/hfst-twolc | |
checking for cg-comp... /usr/bin/cg-comp | |
checking for cg-proc... /usr/bin/cg-proc | |
checking for lrx-comp... /usr/bin/lrx-comp | |
checking for lrx-proc... /usr/bin/lrx-proc | |
checking for gzcat... no | |
checking for zcat... /bin/zcat | |
Using apertium-tuk from ../../apertium-languages/apertium-tuk/ | |
Using apertium-tur from ../../apertium-languages/apertium-tur/ | |
checking that generated files are newer than configure... done | |
configure: creating ./config.status | |