Skip to content

Commit

Permalink
[ca] improve rules
Browse files Browse the repository at this point in the history
  • Loading branch information
jaumeortola committed Sep 1, 2024
1 parent f3f71a6 commit ada7463
Show file tree
Hide file tree
Showing 3 changed files with 76 additions and 38 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -368,19 +368,19 @@ Copyright (C) 2012 Jaume Ortolà i Font
<pattern>
<token><exception postag="D..MS." postag_regexp="yes"/></token>
<marker>
<token>peça</token>
<token>peça</token>
</marker>
</pattern>
<disambig action="replace" postag="NCFS000"></disambig>
<disambig action="replace" postag="NCFS000"/>
</rule>
<rule>
<pattern>
<token><exception postag="D..MP." postag_regexp="yes"/></token>
<marker>
<token>peces</token>
<token>peces</token>
</marker>
</pattern>
<disambig action="replace" postag="NCFP000"></disambig>
<disambig action="replace" postag="NCFP000"/>
</rule>
</rulegroup>
<rulegroup id="PUNTUACIO" name="signes de puntuació">
Expand Down Expand Up @@ -19117,22 +19117,17 @@ Copyright (C) 2012 Jaume Ortolà i Font
<token>hi</token>
<token inflected="yes" regexp="yes">anar|venir|pujar</token>
</antipattern>
<antipattern>
<token inflected="yes">venir</token>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
</antipattern>
<antipattern>
<token postag="_GV_"/>
<token inflected="yes">venir</token>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
</antipattern>
<antipattern>
<!--<antipattern>
<token inflected="yes">venir</token>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
</antipattern>
</antipattern>-->
<antipattern>
<token postag="_GV_"/>
<token inflected="yes">venir</token>
Expand Down Expand Up @@ -20087,22 +20082,53 @@ Copyright (C) 2012 Jaume Ortolà i Font
<wd lemma="endurar"/>
</disambig>
</rule>
<rule id="venir_vendre" name="venir/vendre">
<pattern>
<marker>
<and>
<token postag="_reflexiu"/>
<token inflected="yes">venir</token>
<token inflected="yes">vendre</token>
</and>
</marker>
<token min="0">a</token>
<token regexp="yes">sobre|damunt</token>
</pattern>
<disambig action="remove">
<wd lemma="vendre"/>
</disambig>
</rule>
<rulegroup id="venir_vendre" name="venir/vendre">
<rule>
<pattern>
<marker>
<and>
<token postag="_reflexiu"/>
<token inflected="yes">venir</token>
<token inflected="yes">vendre</token>
</and>
</marker>
<token min="0">a</token>
<token regexp="yes">sobre|damunt</token>
</pattern>
<disambig action="remove">
<wd lemma="vendre"/>
</disambig>
</rule>
<rule>
<pattern>
<marker>
<and>
<token inflected="yes">venir</token>
<token inflected="yes">vendre</token>
</and>
</marker>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
</pattern>
<disambig action="remove">
<wd lemma="vendre"/>
</disambig>
</rule>
<rule>
<pattern>
<marker>
<and>
<token inflected="yes">venir</token>
<token inflected="yes">vendre</token>
</and>
</marker>
<token>amb</token>
</pattern>
<disambig action="remove">
<wd lemma="vendre"/>
</disambig>
</rule>
</rulegroup>
<rulegroup id="femeni_inusual" name="femení inusual: amor, color...">
<rule>
<pattern>
Expand Down Expand Up @@ -20405,7 +20431,7 @@ Copyright (C) 2012 Jaume Ortolà i Font
<pattern>
<marker>
<token regexp="yes">seguit|bunga</token>
<token><match no="0"></match></token>
<token><match no="0"/></token>
</marker>
</pattern>
<disambig action="add">
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -196,7 +196,7 @@
<!--|utilitzar|usar|emprar-->
<!ENTITY verbs_colloquials "digue|vulgue|estigue|sigue|tingue|sàpigue|dugue">
<!ENTITY verbs_balears_ES "adès|avès|exprès|ingrès|procès|profès|progrès|regrès|reingrès|revès|travès">
<!ENTITY vocabulari_menjar "xocolata|xocolate|allioli|aliment|all|amanida|arròs|bolet|carn|carxofa|cep|coriandre|fava|fetge|foie|formatge|gamba|j[ou]livert|llamàntol|llobregant|lluç|macarró|magret|mandonguilla|mango|menjar|mongeta|p[éè]sol|pa|pastís|porc|r[eo]nyó|safrà|tofu|verdura|vi|ànec|gelat|llimona|maduixa|paella|fideu|orxata">
<!ENTITY vocabulari_menjar "xocolata|xocolate|allioli|aliment|all|amanida|ensalada|arròs|bolet|carn|carxofa|cep|coriandre|fava|fetge|foie|formatge|gamba|j[ou]livert|llamàntol|llobregant|lluç|macarró|magret|mandonguilla|mango|menjar|mongeta|p[éè]sol|pa|pastís|porc|r[eo]nyó|safrà|tofu|verdura|vi|xampany|cava|ànec|gelat|llimona|llima|llimó|maduixa|paella|fideu|fideuada|fideuà|orxata|mortadel·la|pernil|fuet|llonganissa|sobrassada|xoriço|oliva|oli|salsa|ametll?a|cacauet">
<!ENTITY pronom_feble "P0.{6}|PP3CN000|PP3NN000|PP3..A00|PP[123]CP000|PP3CSD00">
<!ENTITY pronom_no_determinant "et|em|es|li|ens|us|vos|hi|m'|t'|s'">
<!ENTITY os_animal "caverna|bru|grizzly|polar|hibern.*">
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -100319,7 +100319,7 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
</marker>
<token inflected="yes" regexp="yes">&vocabulari_menjar;</token>
</pattern>
<message>¿Volíeu dir <suggestion><match no="1" postag="(V.*)" postag_regexp="yes" postag_replace="$1">tastar</match></suggestion> en lloc de "<match no="1"/>"?</message>
<message>Referit a menjars o begudes, cal dir <suggestion><match no="1" postag="(V.*)" postag_regexp="yes" postag_replace="$1">tastar</match></suggestion> en lloc de "<match no="1"/>".</message>
<short>Possible confusió</short>
<example correction="tastar">No va voler <marker>provar</marker> la carn.</example>
<example correction="tastar">Vols <marker>provar</marker> el de llimona?</example>
Expand All @@ -100332,7 +100332,7 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
<token postag="V.*" postag_regexp="yes" inflected="yes">provar<exception postag="_GN_.*" postag_regexp="yes"/></token>
</marker>
</pattern>
<message>¿Volíeu dir <suggestion><match no="2" postag="(V.*)" postag_regexp="yes" postag_replace="$1">tastar</match></suggestion> en lloc de "<match no="2"/>"?</message>
<message>Referit a menjars o begudes, cal dir <suggestion><match no="2" postag="(V.*)" postag_regexp="yes" postag_replace="$1">tastar</match></suggestion> en lloc de "<match no="2"/>".</message>
<short>Possible confusió</short>
<example correction="tastà">El vi no el <marker>provà</marker>.</example>
<example>El bon vi va provar que tenia raó.</example>
Expand Down Expand Up @@ -123811,7 +123811,7 @@ No t'ho explicaré, no cal que em burxis més-->
<token><exception>a</exception></token>
</antipattern>
<antipattern>
<token inflected="yes" regexp="yes">anar|venir|pujar</token>
<token inflected="yes" regexp="yes">anar|pujar</token>
<token postag="P0.*" postag_regexp="yes" spacebefore="no" min="0"/>
<token>a</token>
<token regexp="yes">&verbs_reflexius_potencials;|&verbs_reflexius;|veure|buscar|cercar|fer</token>
Expand Down Expand Up @@ -123858,12 +123858,6 @@ No t'ho explicaré, no cal que em burxis més-->
<token regexp="yes" skip="1">es|se|s'</token>
<token inflected="yes">pujar</token>
</antipattern>
<antipattern>
<token inflected="yes" skip="5">venir</token>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
<example>Gràcies per haver-me vingut una vegada més a visitar.</example>
</antipattern>
<rule>
<pattern>
<token postag="V.[NGM].*" postag_regexp="yes" inflected="yes" regexp="yes">anar|pujar|venir<exception inflected="yes">vendre</exception></token>
Expand Down Expand Up @@ -123903,6 +123897,11 @@ No t'ho explicaré, no cal que em burxis més-->
<example>Van't Hoff.</example>
</rule>
<rule>
<antipattern>
<token inflected="yes" skip="5">venir</token>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
</antipattern>
<pattern>
<token postag="V.[NGM].*" postag_regexp="yes" regexp="yes" inflected="yes">anar|pujar|venir<exception inflected="yes">vendre</exception></token>
<token postag="P0.*" postag_regexp="yes" spacebefore="no" regexp="yes">.*[^e]</token>
Expand Down Expand Up @@ -124016,6 +124015,8 @@ No t'ho explicaré, no cal que em burxis més-->
<example correction="se'ns en venen|ens venen">Els problemes que <marker>se'ns venen</marker> a sobre.</example>
<example correction="ens n'anem|anem">Per començar <marker>ens anem</marker> a 1914.</example>
<example correction="se me n'havia pujat|m'havia pujat">La ciutat <marker>se m'havia pujat</marker> al cap.</example>
<example correction="Te'n vens|Vens"><marker>Et vens</marker> amb mi?</example>
<example correction="Te'n vens|Vens"><marker>Et vens</marker> a embolar un bou amb nosaltres?</example>
<example>Es pensava que les coses es venien soles.</example>
<example>Em venc la moto.</example>
<example>Joan se'n va a casa.</example>
Expand Down Expand Up @@ -124130,6 +124131,12 @@ No t'ho explicaré, no cal que em burxis més-->
<antipattern>
<token chunk="GV" regexp="yes">haver|havent</token>
</antipattern>
<antipattern>
<token inflected="yes" skip="5">venir</token>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
<example>Gràcies per haver-me vingut una vegada més a visitar.</example>
</antipattern>
<pattern>
<token regexp="yes">haver|havent</token>
<token regexp="yes">-me|-te|-se</token>
Expand All @@ -124146,6 +124153,11 @@ No t'ho explicaré, no cal que em burxis més-->
<antipattern>
<token chunk="GV" regexp="yes">haver|havent</token>
</antipattern>
<antipattern>
<token inflected="yes" skip="5">venir</token>
<token>a</token>
<token postag="V.N.*" postag_regexp="yes"/>
</antipattern>
<pattern>
<token regexp="yes">haver|havent</token>
<token regexp="yes">-nos|-vos</token>
Expand Down

0 comments on commit ada7463

Please sign in to comment.