Difference between revisions of "UDPipe"

From Apertium
Jump to navigation Jump to search
Line 6: Line 6:
git clone https://github.com/UniversalDependencies/UD_Norwegian-Bokmaal
git clone https://github.com/UniversalDependencies/UD_Norwegian-Bokmaal
cd UD_Norwegian-Bokmaal
cd UD_Norwegian-Bokmaal
cat no-ud-train.conllu |../udpipe --train nob.udpipe
cat no_bokmaal-ud-train.conllu |../udpipe --train nob.udpipe
</pre>
</pre>


test:
test:
<pre>
<pre>
cat no-ud-test.conllu |cut -f1-6 | sed 's/$/\t_\t_\t_\t_/g' | sed 's/^\t.*//g'|../udpipe --parse nob.udpipe > output
cat no_bokmaal-ud-test.conllu |cut -f1-6 | sed 's/$/\t_\t_\t_\t_/g' | sed 's/^\t.*//g'|../udpipe --parse nob.udpipe > output
</pre>
</pre>



Revision as of 17:35, 5 March 2017

train (build UDPipe, then train a model on the UD Norwegian Bokmål treebank):

git clone https://github.com/ufal/udpipe
cd udpipe/src
make
git clone https://github.com/UniversalDependencies/UD_Norwegian-Bokmaal
cd UD_Norwegian-Bokmaal
cat no_bokmaal-ud-train.conllu |../udpipe  --train nob.udpipe                  

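test (parser only: the first six CoNLL-U columns of the test set are kept, the remaining four are reset to "_" and then re-predicted):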

cat no_bokmaal-ud-test.conllu  |cut -f1-6 | sed 's/$/\t_\t_\t_\t_/g' | sed 's/^\t.*//g'|../udpipe --parse nob.udpipe    > output               

test (with tokeniser):

echo "Det ligger en bok på bordet." | ../udpipe --tokenize --tag --parse nob.udpipe