Difference between revisions of "Talk:Apertium New Language Pair HOWTO"
Jump to navigation
Jump to search
m (New page: Possibly, at the very end, one could mention the possibility of typing <code>make sh-en.t1x.bin</code> etc. instead of all those different commands, for the language pairs priviliged en...) |
|||
Line 5: | Line 5: | ||
etc. instead of all those different commands, for the language pairs priviliged enough to have fancy makefiles. |
etc. instead of all those different commands, for the language pairs priviliged enough to have fancy makefiles. |
||
--[[User:Unhammer|Unhammer]] |
--[[User:Unhammer|Unhammer]] |
||
==Files== |
|||
apertium-sh-en.sh-en.dix |
|||
<pre> |
|||
<?xml version="1.0" encoding="UTF-8"?> |
|||
<dictionary> |
|||
<alphabet/> |
|||
<sdefs> |
|||
<sdef n="n"/> |
|||
<sdef n="sg"/> |
|||
<sdef n="pl"/> |
|||
<sdef n="vblex"/> |
|||
</sdefs> |
|||
<section id="main" type="standard"> |
|||
<e><p><l>gramofon<s n="n"/></l><r>gramophone<s n="n"/></r></p></e> |
|||
<e><p><l>videti<s n="vblex"/></l><r>see<s n="vblex"/></r></p></e> |
|||
</section> |
|||
</dictionary> |
|||
</pre> |
|||
apertium-sh-en.sh.dix |
|||
<pre> |
|||
<?xml version="1.0" encoding="ISO-8859-2"?> |
|||
<dictionary> |
|||
<alphabet>ABCCCDDzZEFGHIJKLLjMNNjOPRSŠTUVZŽabc??ddž?efghijklljmnnjoprsštuvzž</alphabet> |
|||
<sdefs> |
|||
<sdef n="n"/> |
|||
<sdef n="sg"/> |
|||
<sdef n="pl"/> |
|||
<sdef n="vblex"/> |
|||
<sdef n="p1"/> |
|||
<sdef n="pri"/> |
|||
</sdefs> |
|||
<pardefs> |
|||
<pardef n="gramofon__n"> |
|||
<e> |
|||
<p> |
|||
<l/> |
|||
<r><s n="n"/><s n="sg"/></r> |
|||
</p> |
|||
</e> |
|||
<e> |
|||
<p> |
|||
<l>i</l> |
|||
<r><s n="n"/><s n="pl"/></r> |
|||
</p> |
|||
</e> |
|||
</pardef> |
|||
<pardef n="vid/eti__vblex"> |
|||
<e> |
|||
<p> |
|||
<l>im</l> |
|||
<r>eti<s n="vblex"/><s n="pri"/><s n="p1"/><s n="sg"/></r> |
|||
</p> |
|||
</e> |
|||
<e> |
|||
<p> |
|||
<l>imo</l> |
|||
<r>eti<s n="vblex"/><s n="pri"/><s n="p1"/><s n="pl"/></r> |
|||
</p> |
|||
</e> |
|||
</pardef> |
|||
</pardefs> |
|||
<section id="main" type="standard"> |
|||
<e lm="gramofon"><i>gramofon</i><par n="gramofon__n"/></e> |
|||
<e lm="videti"><i>vid</i><par n="vid/eti__vblex"/></e> |
|||
</section> |
|||
</dictionary> |
|||
</pre> |
|||
apertium-sh-en.sh-en.t1x |
|||
<pre> |
|||
<?xml version="1.0" encoding="UTF-8"?> |
|||
<transfer> |
|||
<section-def-cats> |
|||
<def-cat n="nom"> |
|||
<cat-item tags="n.*"/> |
|||
</def-cat> |
|||
<def-cat n="vrb"> |
|||
<cat-item tags="vblex.*"/> |
|||
</def-cat> |
|||
<def-cat n="prpers"> |
|||
<cat-item lemma="prpers" tags="prn.*"/> |
|||
</def-cat> |
|||
</section-def-cats> |
|||
<section-def-attrs> |
|||
<def-attr n="nbr"> |
|||
<attr-item tags="sg"/> |
|||
<attr-item tags="pl"/> |
|||
</def-attr> |
|||
<def-attr n="a_nom"> |
|||
<attr-item tags="n"/> |
|||
</def-attr> |
|||
<def-attr n="temps"> |
|||
<attr-item tags="pri"/> |
|||
</def-attr> |
|||
<def-attr n="pers"> |
|||
<attr-item tags="p1"/> |
|||
</def-attr> |
|||
<def-attr n="a_verb"> |
|||
<attr-item tags="vblex"/> |
|||
</def-attr> |
|||
<def-attr n="tipus_prn"> |
|||
<attr-item tags="prn.subj"/> |
|||
<attr-item tags="prn.obj"/> |
|||
</def-attr> |
|||
</section-def-attrs> |
|||
<section-def-vars> |
|||
<def-var n="number"/> |
|||
</section-def-vars> |
|||
<section-rules> |
|||
<rule> |
|||
<pattern> |
|||
<pattern-item n="nom"/> |
|||
</pattern> |
|||
<action> |
|||
<out> |
|||
<lu> |
|||
<clip pos="1" side="tl" part="lem"/> |
|||
<clip pos="1" side="tl" part="a_nom"/> |
|||
<clip pos="1" side="tl" part="nbr"/> |
|||
</lu> |
|||
</out> |
|||
</action> |
|||
</rule> |
|||
<rule> |
|||
<pattern> |
|||
<pattern-item n="vrb"/> |
|||
</pattern> |
|||
<action> |
|||
<out> |
|||
<lu> |
|||
<lit v="prpers"/> |
|||
<lit-tag v="prn"/> |
|||
<lit-tag v="subj"/> |
|||
<clip pos="1" side="tl" part="lem"/> |
|||
<clip pos="1" side="tl" part="pers"/> |
|||
<clip pos="1" side="tl" part="nbr"/> |
|||
</lu> |
|||
<b/> |
|||
<lu> |
|||
<clip pos="1" side="tl" part="lem"/> |
|||
<clip pos="1" side="tl" part="a_verb"/> |
|||
<clip pos="1" side="tl" part="temps"/> |
|||
</lu> |
|||
</out> |
|||
</action> |
|||
</rule> |
|||
</section-rules> |
|||
</transfer> |
|||
</pre> |
|||
apertium-sh-en.en.dix |
|||
<pre> |
|||
<?xml version="1.0" encoding="ISO-8859-2"?> |
|||
<dictionary> |
|||
<alphabet>ABCCCDDzZEFGHIJKLLjMNNjOPRSŠTUVZŽabc??ddž?efghijklljmnnjoprsštuvzž</alphabet> |
|||
<sdefs> |
|||
<sdef n="n"/> |
|||
<sdef n="sg"/> |
|||
<sdef n="pl"/> |
|||
<sdef n="vblex"/> |
|||
<sdef n="p1"/> |
|||
<sdef n="pri"/> |
|||
<sdef n="prn"/> |
|||
<sdef n="subj"/> |
|||
</sdefs> |
|||
<pardefs> |
|||
<pardef n="gramofon__n"> |
|||
<e> |
|||
<p> |
|||
<l/> |
|||
<r><s n="n"/><s n="sg"/></r> |
|||
</p> |
|||
</e> |
|||
<e> |
|||
<p> |
|||
<l>s</l> |
|||
<r><s n="n"/><s n="pl"/></r> |
|||
</p> |
|||
</e> |
|||
</pardef> |
|||
<pardef n="s/ee__vblex"> |
|||
<e> |
|||
<p> |
|||
<l>ee</l> |
|||
<r>ee<s n="vblex"/><s n="pri"/></r> |
|||
</p> |
|||
</e> |
|||
</pardef> |
|||
<pardef n="prsubj__prn"> |
|||
<e> |
|||
<p> |
|||
<l>I</l> |
|||
<r>prpers<s n="prn"/><s n="subj"/><s n="p1"/><s n="sg"/></r> |
|||
</p> |
|||
</e> |
|||
</pardef> |
|||
</pardefs> |
|||
<section id="main" type="standard"> |
|||
<e lm="gramophone"><i>gramophone</i><par n="gramofon__n"/></e> |
|||
<e lm="see"><i>s</i><par n="s/ee__vblex"/></e> |
|||
<e lm="personal subject pronouns"><i/><par n="prsubj__prn"/></e> |
|||
<e lm="record player"><i>record<b/>player</i><par n="gramofon__n"/></e> |
|||
</section> |
|||
</dictionary> |
|||
</pre> |
Revision as of 22:15, 29 April 2009
Possibly, at the very end, one could mention the possibility of typing
make sh-en.t1x.bin
etc. instead of all those different commands, for the language pairs priviliged enough to have fancy makefiles. --Unhammer
Files
apertium-sh-en.sh-en.dix
<?xml version="1.0" encoding="UTF-8"?> <dictionary> <alphabet/> <sdefs> <sdef n="n"/> <sdef n="sg"/> <sdef n="pl"/> <sdef n="vblex"/> </sdefs> <section id="main" type="standard"> <e><p><l>gramofon<s n="n"/></l><r>gramophone<s n="n"/></r></p></e> <e><p><l>videti<s n="vblex"/></l><r>see<s n="vblex"/></r></p></e> </section> </dictionary>
apertium-sh-en.sh.dix
<?xml version="1.0" encoding="ISO-8859-2"?> <dictionary> <alphabet>ABCCCDDzZEFGHIJKLLjMNNjOPRSŠTUVZŽabc??ddž?efghijklljmnnjoprsštuvzž</alphabet> <sdefs> <sdef n="n"/> <sdef n="sg"/> <sdef n="pl"/> <sdef n="vblex"/> <sdef n="p1"/> <sdef n="pri"/> </sdefs> <pardefs> <pardef n="gramofon__n"> <e> <p> <l/> <r><s n="n"/><s n="sg"/></r> </p> </e> <e> <p> <l>i</l> <r><s n="n"/><s n="pl"/></r> </p> </e> </pardef> <pardef n="vid/eti__vblex"> <e> <p> <l>im</l> <r>eti<s n="vblex"/><s n="pri"/><s n="p1"/><s n="sg"/></r> </p> </e> <e> <p> <l>imo</l> <r>eti<s n="vblex"/><s n="pri"/><s n="p1"/><s n="pl"/></r> </p> </e> </pardef> </pardefs> <section id="main" type="standard"> <e lm="gramofon"><i>gramofon</i><par n="gramofon__n"/></e> <e lm="videti"><i>vid</i><par n="vid/eti__vblex"/></e> </section> </dictionary>
apertium-sh-en.sh-en.t1x
<?xml version="1.0" encoding="UTF-8"?> <transfer> <section-def-cats> <def-cat n="nom"> <cat-item tags="n.*"/> </def-cat> <def-cat n="vrb"> <cat-item tags="vblex.*"/> </def-cat> <def-cat n="prpers"> <cat-item lemma="prpers" tags="prn.*"/> </def-cat> </section-def-cats> <section-def-attrs> <def-attr n="nbr"> <attr-item tags="sg"/> <attr-item tags="pl"/> </def-attr> <def-attr n="a_nom"> <attr-item tags="n"/> </def-attr> <def-attr n="temps"> <attr-item tags="pri"/> </def-attr> <def-attr n="pers"> <attr-item tags="p1"/> </def-attr> <def-attr n="a_verb"> <attr-item tags="vblex"/> </def-attr> <def-attr n="tipus_prn"> <attr-item tags="prn.subj"/> <attr-item tags="prn.obj"/> </def-attr> </section-def-attrs> <section-def-vars> <def-var n="number"/> </section-def-vars> <section-rules> <rule> <pattern> <pattern-item n="nom"/> </pattern> <action> <out> <lu> <clip pos="1" side="tl" part="lem"/> <clip pos="1" side="tl" part="a_nom"/> <clip pos="1" side="tl" part="nbr"/> </lu> </out> </action> </rule> <rule> <pattern> <pattern-item n="vrb"/> </pattern> <action> <out> <lu> <lit v="prpers"/> <lit-tag v="prn"/> <lit-tag v="subj"/> <clip pos="1" side="tl" part="lem"/> <clip pos="1" side="tl" part="pers"/> <clip pos="1" side="tl" part="nbr"/> </lu> <b/> <lu> <clip pos="1" side="tl" part="lem"/> <clip pos="1" side="tl" part="a_verb"/> <clip pos="1" side="tl" part="temps"/> </lu> </out> </action> </rule> </section-rules> </transfer>
apertium-sh-en.en.dix
<?xml version="1.0" encoding="ISO-8859-2"?> <dictionary> <alphabet>ABCCCDDzZEFGHIJKLLjMNNjOPRSŠTUVZŽabc??ddž?efghijklljmnnjoprsštuvzž</alphabet> <sdefs> <sdef n="n"/> <sdef n="sg"/> <sdef n="pl"/> <sdef n="vblex"/> <sdef n="p1"/> <sdef n="pri"/> <sdef n="prn"/> <sdef n="subj"/> </sdefs> <pardefs> <pardef n="gramofon__n"> <e> <p> <l/> <r><s n="n"/><s n="sg"/></r> </p> </e> <e> <p> <l>s</l> <r><s n="n"/><s n="pl"/></r> </p> </e> </pardef> <pardef n="s/ee__vblex"> <e> <p> <l>ee</l> <r>ee<s n="vblex"/><s n="pri"/></r> </p> </e> </pardef> <pardef n="prsubj__prn"> <e> <p> <l>I</l> <r>prpers<s n="prn"/><s n="subj"/><s n="p1"/><s n="sg"/></r> </p> </e> </pardef> </pardefs> <section id="main" type="standard"> <e lm="gramophone"><i>gramophone</i><par n="gramofon__n"/></e> <e lm="see"><i>s</i><par n="s/ee__vblex"/></e> <e lm="personal subject pronouns"><i/><par n="prsubj__prn"/></e> <e lm="record player"><i>record<b/>player</i><par n="gramofon__n"/></e> </section> </dictionary>