org.languagetool.resource.ca.disambiguation.xml Maven / Gradle / Ivy
<?xml version="1.0" encoding="utf-8"?> <?xml-stylesheet type="text/xsl" href="../../../../../../../../../languagetool-core/src/main/resources/org/languagetool/rules/print.xsl" title="Pretty print" ?> <?xml-stylesheet type="text/css" href="../../../../../../../../../languagetool-core/src/main/resources/org/languagetool/rules/rules.css" title="Easy editing stylesheet" ?> <!-- Catalan Disambiguation Rules for LanguageTool Copyright (C) 2012 Jaume Ortolà i Font --> <!DOCTYPE rules [ <!ENTITY % entities SYSTEM "../../resource/ca/entities.ent" > %entities; ]> <rules lang="ca" xsi:noNamespaceSchemaLocation="../../../../../../../../../languagetool-core/src/main/resources/org/languagetool/resource/disambiguation.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xs="http://www.w3.org/2001/XMLSchema"> <unification feature="nombre"> <equivalence type="S"> <token postag="(PX..|N.{2}|[ADP].{3}|V.{4})[SN0].*|RG.*|CC|_PUNCT_CONT" postag_regexp="yes"/> </equivalence> <equivalence type="P"> <token postag="(PX..|N.{2}|[ADP].{3}|V.{4})[PN0].*|RG.*|CC|_PUNCT_CONT" postag_regexp="yes"/> </equivalence> </unification> <unification feature="genere"> <equivalence type="M"> <token postag="(PX.|N.|[ADP].{2}|V.{5})[MC].*|RG.*|CC|_PUNCT_CONT" postag_regexp="yes"/> </equivalence> <equivalence type="F"> <token postag="(PX.|N.|[ADP].{2}|V.{5})[FC].*|RG.*|CC|_PUNCT_CONT" postag_regexp="yes"/> </equivalence> </unification> <unification feature="persona"> <equivalence type="primera"> <token postag="(P.|V.{3})[10].*" postag_regexp="yes"/> </equivalence> <equivalence type="segona"> <token postag="(P.|V.{3})[20].*" postag_regexp="yes"/> </equivalence> <equivalence type="tercera"> <token postag="(P.|V.{3})[30].*" postag_regexp="yes"/> </equivalence> </unification> <rule id="genitiu_saxo" name="permet el genitiu saxó"> <pattern> <token regexp="yes">\p{Lu}.+</token> <marker> <token spacebefore="no" regexp="yes">[’']s</token> </marker> </pattern> <disambig action="add"> <wd 
pos="allow_saxon_genitive"/> </disambig> </rule> <rulegroup id="IGNORE_ENGLISH_WORDS" name="etiqueta paraules angleses"> <antipattern> <token regexp="yes">the|than</token> <token postag="V.P.*" postag_regexp="yes"/> </antipattern> <rule> <pattern> <token postag="UNKNOWN" regexp="yes">&english_common;|&english_common_casesensitive;</token> <token regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception></token> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:2"/> <disambig action="add"> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <token postag="_english_ignore_"/> <marker> <token regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception><exception postag="_english_ignore_"/></token> </marker> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:2"/> <disambig action="add"> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception></token> <token postag="UNKNOWN" regexp="yes">&english_common;|&english_common_casesensitive;<exception>in</exception></token> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:1"/> <disambig action="add"> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception><exception postag="_english_ignore_"/></token> </marker> <token postag="_english_ignore_|allow_saxon_genitive" postag_regexp="yes"/> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:1"/> <disambig action="add"> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <token>to</token> <token regexp="yes">[a-z]+</token> </pattern> <filter 
class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:2 postags:VB"/> <disambig action="add"> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <token case_sensitive="yes">I</token> <token regexp="yes">[a-z]+<exception>buffet</exception><exception regexp="yes">&english_no;</exception></token> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:2 postags:VB[PD]"/> <disambig action="add"> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <token postag="_english_ignore_|UNKNOWN" postag_regexp="yes" regexp="yes">[a-z]+<exception regexp="yes">saint|anti|&english_no;</exception></token> <token spacebefore="no">-</token> <token spacebefore="no" regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception></token> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:1,3"/> <disambig action="add"> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">[a-z]+<exception regexp="yes">saint|anti|&english_no;</exception></token> <token spacebefore="no">-</token> <token postag="_english_ignore_|UNKNOWN" postag_regexp="yes" spacebefore="no" regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception></token> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:1,3"/> <disambig action="add"> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> <wd pos="_english_ignore_"/> </disambig> </rule> <rule> <pattern> <token postag="_english_ignore_"/> <marker> <token regexp="yes">a|to</token> <token regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception><exception postag="_english_ignore_"/></token> </marker> </pattern> <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:3"/> 
<disambig action="add">
        <wd pos="_english_ignore_"/>
        <wd pos="_english_ignore_"/>
      </disambig>
    </rule>
    <!-- "a" or "to" standing between two tokens already tagged _english_ignore_ receives the same tag. -->
    <rule>
      <pattern>
        <token postag="_english_ignore_"/>
        <marker>
          <token regexp="yes">a|to</token>
        </marker>
        <token postag="_english_ignore_"/>
      </pattern>
      <disambig action="add">
        <wd pos="_english_ignore_"/>
      </disambig>
    </rule>
    <!-- "from X to": tags the "to" that follows "from" plus exactly one arbitrary token. -->
    <rule>
      <pattern>
        <token>from</token>
        <token/>
        <marker>
          <token>to</token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_english_ignore_"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- Second group with the same purpose: spreads the _english_ignore_ tag to a lowercase
       neighbour (or a "'s") of an already-tagged token, subject to IsEnglishWordFilter. -->
  <rulegroup id="IGNORE_ENGLISH_WORDS2" name="etiqueta paraules angleses">
    <!-- Tagged token on the left: tag the word (or 's) to its right. -->
    <rule>
      <pattern>
        <token postag="_english_ignore_"/>
        <marker>
          <token regexp="yes">[a-z]+|'s<exception regexp="yes">&english_no;|&english_forward;</exception><exception postag="_english_ignore_"/></token>
        </marker>
      </pattern>
      <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:2"/>
      <disambig action="add">
        <wd pos="_english_ignore_"/>
      </disambig>
    </rule>
    <!-- Tagged token on the right: tag the word to its left. -->
    <rule>
      <pattern>
        <marker>
          <token regexp="yes">[a-z]+<exception regexp="yes">&english_no;|&english_forward;</exception><exception postag="_english_ignore_"/></token>
        </marker>
        <token postag="_english_ignore_"/>
      </pattern>
      <filter class="org.languagetool.rules.IsEnglishWordFilter" args="formPositions:1"/>
      <disambig action="add">
        <wd pos="_english_ignore_"/>
      </disambig>
    </rule>
  </rulegroup>
  <rulegroup id="FIX_DICTIONARY" name="fix some problems in dictionaries">
    <!-- Can be removed once the dictionary is fixed. -->
    <rule>
      <pattern>
        <token>imprimí</token>
      </pattern>
      <disambig action="remove">
        <wd lemma="imprimar"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- Context handled by both rules of this group: a single capital letter, a period attached
       to it, and then a capitalised word (preceded by a space) tagged V/A/D/S/C that is not a
       proper noun. The first rule adds SENT_START, the second adds SENT_END on the period. -->
  <rulegroup id="FIX_SENTENCE_TOKENIZATION" name="fix problems with sentence tokenization">
    <!-- The marker sits on the capitalised word, so SENT_START lands on the first word of the
         new sentence. Previously the marker was on the period, which then received both
         SENT_START and SENT_END while the following word was never marked. -->
    <rule>
      <pattern>
        <token case_sensitive="yes" regexp="yes">[A-Z]</token>
        <token spacebefore="no">.</token>
        <marker>
          <token spacebefore="yes" postag="[VADSC].*" postag_regexp="yes" regexp="yes">\p{Lu}.*<exception postag="NP.*" postag_regexp="yes"/></token>
        </marker>
      </pattern>
      <disambig
action="add"> <wd pos="SENT_START"/> </disambig> </rule> <rule> <pattern> <token case_sensitive="yes" regexp="yes">[A-Z]</token> <marker> <token spacebefore="no">.</token> </marker> <token spacebefore="yes" postag="[VADSC].*" postag_regexp="yes" regexp="yes">\p{Lu}.*<exception postag="NP.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="SENT_END"/> </disambig> </rule> </rulegroup> <rulegroup id="PUNTUACIO" name="signes de puntuació"> <rule> <pattern> <token regexp="yes">[.;:!?…()\[\]‒–—―•\-]<exception postag="LOC_.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_PUNCT"/> </disambig> </rule> <rule id="PUNTUACIO2" name="signes de puntuació que no trenquen els sintagmes"> <pattern> <token regexp="yes">[,'"‘’“”«»¡¿]</token> </pattern> <disambig action="add"> <wd pos="_PUNCT_CONT"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">[mntsld]'</token> <marker> <token regexp="yes">[“‘«'"]</token> </marker> </pattern> <disambig action="add"> <wd pos="_QM_OPEN"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes" spacebefore="yes">['"]</token> </marker> <token spacebefore="no"><exception postag="_PUNCT.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_QM_OPEN"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes" spacebefore="yes">[“‘«]</token> </marker> </pattern> <disambig action="add"> <wd pos="_QM_OPEN"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START"/> <marker> <token regexp="yes">[“‘«]</token> </marker> </pattern> <disambig action="add"> <wd pos="_QM_OPEN"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes" spacebefore="no">['"’”»]<exception postag="_QM_OPEN"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_QM_CLOSE"/> </disambig> </rule> <rule id="tres_punts" name="punts suspensius"> <pattern> <token>.</token> <token>.</token> <token>.</token> </pattern> <disambig action="add"> <wd pos="_trespunts"/> 
<wd pos="_trespunts"/>
        <wd pos="_trespunts"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- "b" after "la", "lletra" or a feminine demonstrative / "una": add a feminine singular noun reading. -->
  <rule id="lletra_b" name="LLETRA B">
    <pattern>
      <token regexp="yes">la|lletra|aquesta|esta|eixa|aqueixa|aquella|una</token>
      <marker>
        <token>b</token>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="NCFS000"/>
    </disambig>
  </rule>
  <!-- "la lies": drop the NCMN000 reading of "lies". -->
  <rule id="la_lies" name="la lies">
    <pattern>
      <token>la</token>
      <marker>
        <token>lies</token>
      </marker>
    </pattern>
    <disambig action="remove" postag="NCMN000"/>
  </rule>
  <!-- Capital "M" followed by a period and a capitalised word: add a proper-noun reading to "M".
       The tag is written in the seven-character form also used by the EN_PITU rule below
       (NPMSSP0); the previous value NPCNSP00 carried an extra trailing 0.
       NOTE(review): confirm against the Catalan tagset that NPCNSP0 is the intended tag. -->
  <rule id="M_nompropi" name="M. en nom propis">
    <pattern>
      <marker>
        <token case_sensitive="yes">M</token>
      </marker>
      <token>.</token>
      <token regexp="yes">\p{Lu}.*</token>
    </pattern>
    <disambig action="add">
      <wd lemma="M" pos="NPCNSP0"/>
    </disambig>
  </rule>
  <!-- "en Pitu": add a masculine singular proper-noun reading to "Pitu". -->
  <rule id="EN_PITU" name="en Pitu">
    <pattern>
      <token>en</token>
      <marker>
        <token case_sensitive="yes">Pitu</token>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="NPMSSP0"/>
    </disambig>
  </rule>
  <!-- Single letters used as enumeration labels ("a)", "b.", "a, b i c"). -->
  <rulegroup id="ENUMERACIONS" name="enumeracions amb lletres: a)">
    <!-- Not an enumeration: "s" followed by a token made only of X, I, C, V. -->
    <antipattern>
      <token>s</token>
      <token regexp="yes">[XICV]+</token>
    </antipattern>
    <!-- Not an enumeration: "a" directly followed by "l"/"ls" with no space. -->
    <antipattern>
      <token>a</token>
      <token spacebefore="no" regexp="yes">ls?</token>
    </antipattern>
    <!-- letter , letter -->
    <rule>
      <pattern>
        <token regexp="yes">[a-z]</token>
        <token>,</token>
        <token regexp="yes" spacebefore="yes">[a-z]</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- letter , letter (i|o|,|ni) letter -->
    <rule>
      <pattern>
        <token regexp="yes">[a-z]</token>
        <token>,</token>
        <token regexp="yes">[a-z]</token>
        <token regexp="yes">i|o|,|ni</token>
        <token regexp="yes">[a-z]</token>
      </pattern>
      <disambig action="immunize"/>
    </rule>
    <!-- letter (i|o) letter -->
    <rule>
      <pattern>
        <token regexp="yes">[a-z]</token>
        <token regexp="yes">i|o</token>
        <token regexp="yes">[a-z]</token>
      </pattern>
      <disambig action="immunize"/>
    </rule>
    <!-- Letter glued after "<number or letter>." (e.g. "1.a"): tag the letter as an enumeration label. -->
    <rule>
      <pattern>
        <token regexp="yes">\d[\d\.]*|[a-z]</token>
        <token spacebefore="no">.</token>
        <marker>
          <token regexp="yes" spacebefore="no">[a-z]</token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_enumeracio"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
<marker> <token regexp="yes" spacebefore="no">[a-z]</token> </marker> <token spacebefore="no">.</token> <token regexp="yes" spacebefore="no">[a-z]</token> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[a-z]<exception postag="LOC_ADV"/></token> </marker> <token spacebefore="no" regexp="yes">[\)\.]</token> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START"/> <marker> <token regexp="yes">[a-z]</token> </marker> <token spacebefore="no" regexp="yes">[\)\.]|&dashes;</token> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">,|;|i|o|ni</token> <marker> <token regexp="yes">[a-z]</token> </marker> <token spacebefore="no" regexp="yes">[\)\.]|&dashes;</token> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[a-z]</token> </marker> <token spacebefore="no" regexp="yes">[\)\.]|&dashes;</token> <token spacebefore="no" regexp="yes">[\)\.]|&dashes;</token> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">lletra|secció|apartat|panell|bloc</token> <token regexp="yes">[a-z]</token> <token regexp="yes">,|i|o|ni</token> <marker> <token regexp="yes">[a-z]</token> </marker> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">lletra|secció|apartat|panell|bloc</token> <marker> <token regexp="yes">[a-z]</token> </marker> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <token inflected="yes">vocal</token> <marker> <token regexp="yes">[aeiou]</token> </marker> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">[\{\[\(]</token> <marker> 
<token regexp="yes" spacebefore="no">[a-z]</token> </marker> <token spacebefore="no" regexp="yes">[\)\}\]]</token> </pattern> <disambig action="add"> <wd pos="_enumeracio"/> </disambig> </rule> </rulegroup> <rulegroup id="tokenization_error" name="tokenization problem: Castella-la Manxa, D'Hondt"> <rule> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="V.[MGN].*" postag_regexp="yes"/></token> <marker> <token>-el</token> </marker> <token postag="N.[MC][SN].*" postag_regexp="yes"><exception postag="[CR].*|SP.*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="el" pos="DA0MS0"/> </disambig> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="V.[MGN].*" postag_regexp="yes"/></token> <marker> <token>-els</token> </marker> <token postag="N.[MC][PN].*" postag_regexp="yes"><exception postag="[CR].*|SP.*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="el" pos="DA0MP0"/> </disambig> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="V.[MGN].*" postag_regexp="yes"/></token> <marker> <token>-la</token> </marker> <token postag="N.[FC][SN].*" postag_regexp="yes"><exception postag="[CR].*|SP.*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="el" pos="DA0FS0"/> </disambig> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="V.[MGN].*" postag_regexp="yes"/></token> <marker> <token>-les</token> </marker> <token postag="N.[FC][PN].*" postag_regexp="yes"><exception postag="[CR].*|SP.*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="el" pos="DA0FP0"/> </disambig> </rule> <rule> <pattern> <token>d'</token> <marker> <token regexp="yes">Hond?t?</token> </marker> </pattern> <disambig action="add"> <wd pos="_possible_nompropi"/> </disambig> </rule> </rulegroup> <rulegroup id="coma_decimal" name="coma decimal"> <rule> <pattern> <token 
regexp="yes">\d+</token> <marker> <token spacebefore="no">,</token> </marker> <token spacebefore="no" regexp="yes">\d+</token> </pattern> <disambig action="remove"> <wd pos="_PUNCT_CONT"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">\d+</token> <marker> <token spacebefore="no">.</token> </marker> <token spacebefore="no" regexp="yes">\d+</token> </pattern> <disambig action="remove"> <wd pos="_PUNCT"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">\d+</token> <marker> <token spacebefore="no" regexp="yes">[,.]</token> </marker> <token spacebefore="no" regexp="yes">\d+</token> </pattern> <disambig action="add"> <wd pos="decimal_comma"/> </disambig> </rule> </rulegroup> <rulegroup id="NUMERALS" name="numerals i ordinals"> <antipattern> <token>R</token> <token>+</token> <token>D</token> </antipattern> <antipattern> <token>R</token> <token>+</token> <token>D</token> <token>+</token> <token>I</token> </antipattern> <rule> <pattern> <marker> <token>mil</token> <token>i</token> <token>un</token> </marker> </pattern> <disambig action="replace"> <wd pos="DN0MP0"/> <wd pos="DN0MP0"/> <wd pos="DN0MP0"/> </disambig> </rule> <rule> <pattern> <marker> <token>mil</token> <token>i</token> <token>una</token> </marker> </pattern> <disambig action="replace"> <wd pos="DN0FP0"/> <wd pos="DN0FP0"/> <wd pos="DN0FP0"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[1234567890][1234567890., ]+[1234567890]</token> </marker> </pattern> <disambig action="add"> <wd lemma="numeral" pos="NCCN000"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[1234567890][1234567890., ]+[1234567890]</token> </marker> </pattern> <disambig action="add"> <wd lemma="numeral" pos="DN0CP0"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[1234567890]{1,2}</token> </marker> </pattern> <disambig action="add"> <wd lemma="numeral" pos="NCCN000"/> </disambig> </rule> <rule> <pattern> <marker> <token 
regexp="yes">[1234567890]{1,2}<exception>1</exception></token> </marker> </pattern> <disambig action="add"> <wd lemma="numeral" pos="DN0CP0"/> </disambig> </rule> <rule> <pattern> <marker> <token spacebefore="yes">1</token> </marker> </pattern> <disambig action="add"> <wd lemma="numeral" pos="DN0CS0"/> </disambig> </rule> <rule> <pattern> <marker> <token spacebefore="yes">1</token> </marker> </pattern> <disambig action="remove"> <wd lemma="numeral" pos="DN0CP0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">[^.,]*</token> <marker> <token spacebefore="no">1</token> </marker> </pattern> <disambig action="add"> <wd lemma="numeral" pos="DN0CS0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">[^.,]*</token> <marker> <token spacebefore="no">1</token> </marker> </pattern> <disambig action="remove"> <wd lemma="numeral" pos="DN0CP0"/> </disambig> </rule> <!-- ordinals --> <rule> <pattern> <marker> <token regexp="yes">[1234567890]+[èé]<exception postag="AO.*" postag_regexp="yes"/><exception regexp="yes">[01234][èé]</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AO0MS0"/> </disambig> </rule> <rule> <pattern> <token>el</token> <marker> <token regexp="yes">[1234567890]+</token> </marker> </pattern> <disambig action="add"> <wd pos="AO0MS0"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[1234567890]+a<exception postag="AO.*" postag_regexp="yes"/><exception>0a</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AO0FS0"/> </disambig> </rule> <rule> <pattern> <token>la<exception scope="previous" postag="D..MS." 
postag_regexp="yes"/></token> <marker> <token regexp="yes">[1234567890]+</token> </marker> </pattern> <disambig action="add"> <wd pos="AO0FS0"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">[1234567890]+ns<exception postag="AO.*" postag_regexp="yes"/><exception regexp="yes">[01234]ns</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AO0MP0"/> </disambig> </rule> <!--<rule> <pattern> <token>els</token> <marker> <token regexp="yes">[1234567890]+</token> </marker> </pattern> <disambig action="add"><wd pos="AO0MP0"/></disambig> </rule>--> <rule> <pattern> <marker> <token regexp="yes">[1234567890]+es<exception postag="AO.*" postag_regexp="yes"/><exception>0es</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AO0FP0"/> </disambig> </rule> <rule> <pattern> <token>les</token> <marker> <token regexp="yes">[1234567890]+</token> </marker> </pattern> <disambig action="add"> <wd pos="AO0FP0"/> </disambig> </rule> <!-- romans--> <rule> <pattern case_sensitive="yes"> <marker> <token regexp="yes">(?=.)M{0,4}(CM|CD|D?C{0,3})(XC|XL|L?X{0,3})(IX|IV|V?I{0,3})<exception postag="_enumeracio"/></token> </marker> </pattern> <disambig action="add"> <wd pos="AO0CN0"/> </disambig> </rule> <rule> <antipattern> <token regexp="yes">[dl]</token> <token spacebefore="no" regexp="yes">['’]</token> </antipattern> <pattern case_sensitive="yes"> <marker> <token regexp="yes" spacebefore="yes">(?=.)m{0,4}(cm|cd|d?c{0,3})(xc|xl|l?x{0,3})(ix|iv|v?i{0,3})<exception regexp="yes">cm|mm</exception><exception postag="_enumeracio"/></token> </marker> </pattern> <disambig action="add"> <wd pos="AO0CN0"/> </disambig> </rule> <rule> <pattern case_sensitive="yes"> <token postag="SENT_START"/> <marker> <token regexp="yes">(?=.)m{0,4}(cm|cd|d?c{0,3})(xc|xl|l?x{0,3})(ix|iv|v?i{0,3})</token> </marker> </pattern> <disambig action="add"> <wd pos="AO0CN0"/> </disambig> </rule> <rule> <pattern case_sensitive="yes"> <token>-</token> <marker> <token 
regexp="yes">(?=.)m{0,4}(cm|cd|d?c{0,3})(xc|xl|l?x{0,3})(ix|iv|v?i{0,3})</token> </marker> </pattern> <disambig action="add"> <wd pos="AO0CN0"/> </disambig> </rule> <rule> <pattern case_sensitive="yes"> <marker> <token regexp="yes">(?=.)m{0,4}(cm|cd|d?c{0,3})(xc|xl|l?x{0,3})(ix|iv|v?i{0,3})</token> </marker> <token>)</token> </pattern> <disambig action="add"> <wd pos="AO0CN0"/> </disambig> </rule> <!-- excepcions als numerals romans --> <rule> <pattern case_sensitive="yes"> <token postag="SENT_START"/> <token min="0" max="3" postag="_PUNCT.*" postag_regexp="yes"/> <marker> <token>I</token> </marker> </pattern> <disambig action="remove"> <wd pos="AO0CN0"/> </disambig> </rule> <rule> <pattern case_sensitive="yes"> <marker> <token regexp="yes">i|li|mi|vi|di</token> </marker> </pattern> <disambig action="remove"> <wd pos="AO0CN0"/> </disambig> </rule> <rule> <pattern case_sensitive="yes"> <marker> <token>VII</token> </marker> </pattern> <disambig action="remove"> <wd pos="VMIP1S0B"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">[1234567890., ]+</token> <marker> <token>m</token> </marker> </pattern> <disambig action="replace" postag="NCMP000"/> </rule> <rule> <pattern> <token regexp="yes">1|/|per</token> <marker> <token>m</token> </marker> </pattern> <disambig action="replace" postag="NCMS000"/> </rule> <rule id="la_numero_dos" name="la número dos"> <pattern> <marker> <token regexp="yes">la|una|aquesta|esta|aqueixa|eixa|aquella</token> <token>número</token> <token postag="AO0C[NS]0|DN0[^F]P0" postag_regexp="yes"><exception regexp="yes">.*un</exception></token> </marker> </pattern> <disambig action="replace"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <rule id="la_numero_u" name="la número u"> <pattern> <marker> <token regexp="yes">la|una|aquesta|esta|aqueixa|eixa|aquella</token> <token>número</token> <token>1</token> </marker> </pattern> <disambig action="replace"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> 
</disambig>
    </rule>
    <!-- "aC" / "dC" (case-sensitive) right after a numeral: replace the reading with RG. -->
    <rule>
      <pattern>
        <token postag="DN.*" postag_regexp="yes"/>
        <marker>
          <token regexp="yes" case_sensitive="yes">aC|dC</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd pos="RG"/>
      </disambig>
    </rule>
    <!-- "en base" / "de base" + numeral: keep only the N.* readings of the numeral. -->
    <rule id="en_base" name="en base + numeral">
      <pattern>
        <token regexp="yes">en|de</token>
        <token>base</token>
        <marker>
          <token postag="DN.*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="filter" postag="N.*"/>
    </rule>
    <!-- "deu" after a feminine singular demonstrative: keep only the NCFS.* and VMI.* readings. -->
    <rule>
      <pattern>
        <token postag="DD.FS.*" postag_regexp="yes"/>
        <marker>
          <token>deu</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="NCFS.*|VMI.*"/>
    </rule>
    <!-- Percentages -->
    <rule id="percentatges" name="percentatges">
      <pattern>
        <token regexp="yes">[\d,. ]+[%‰‱]</token>
      </pattern>
      <disambig action="replace">
        <wd pos="NCMS000"/>
      </disambig>
    </rule>
    <!-- Number + degree/minute/second sign, optionally followed by a unit or compass letter: plural noun. -->
    <rule id="numero_graus" name="graus">
      <pattern>
        <token regexp="yes">([\d,. ]+[°′″‴])+[CFKNSEW]?</token>
      </pattern>
      <disambig action="replace">
        <wd pos="NCMP000"/>
      </disambig>
    </rule>
    <!-- Bare degree sign + unit or compass letter: number-invariable noun. -->
    <rule id="graus" name="graus">
      <pattern>
        <token regexp="yes">°[CFKNSEW]</token>
      </pattern>
      <disambig action="replace">
        <wd pos="NCMN000"/>
      </disambig>
    </rule>
    <!-- Exactly "1°" (+ optional letter): singular noun. This rule comes after numero_graus,
         whose pattern also matches "1°…" and tags it plural, so it must accept the same letter
         set. "K" was missing here, which left "1°K" tagged as plural. -->
    <rule id="un_grau" name="1 grau">
      <pattern>
        <token regexp="yes">1°[CFKNSEW]?</token>
      </pattern>
      <disambig action="replace">
        <wd pos="NCMS000"/>
      </disambig>
    </rule>
    <!-- "IX" (case-sensitive): keep only the adjective (ordinal) readings, not the verb. -->
    <rule id="IX" name="IX, ordinal no verb">
      <pattern case_sensitive="yes">
        <token>IX</token>
      </pattern>
      <disambig action="filter" postag="A.*"/>
    </rule>
    <!-- A token that is both NCCN000 and DN0CP0, placed before "aniversari", becomes a masculine singular ordinal. -->
    <rule id="vint_aniversari" name="vint aniversari">
      <pattern>
        <marker>
          <and>
            <token postag="NCCN000"/>
            <token postag="DN0CP0"/>
          </and>
        </marker>
        <token>aniversari</token>
      </pattern>
      <disambig action="replace" postag="AO0MS0"/>
    </rule>
  </rulegroup>
  <rulegroup id="MILIO_K" name="numerals especials: milió, coma">
    <rule>
      <antipattern>
        <!-- it is a year: el/en/l + four digits + "i mig" -->
        <token regexp="yes">el|en|l</token>
        <token regexp="yes">\d\d\d\d</token>
        <token>i</token>
        <token>mig</token>
      </antipattern>
      <pattern>
        <token postag="DN.[MC].."
postag_regexp="yes"/>
        <token>i</token>
        <marker>
          <token>mig</token>
        </marker>
      </pattern>
      <disambig action="replace" postag="DN0MP0"/>
    </rule>
    <!-- Plural numeral followed by milió / bilió / trilió / coma1 / zero / un (matched by lemma):
         add the K tag to the second word. The lemma was misspelled "trlió", so "trilió" and its
         inflected forms could never match. -->
    <rule>
      <pattern>
        <token postag="DN..P." postag_regexp="yes"/>
        <marker>
          <token regexp="yes" inflected="yes">milió|bilió|trilió|coma1|zero|un</token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="K"/>
      </disambig>
    </rule>
    <!-- Same words when they come before a plural numeral (same "trlió" spelling fix). -->
    <rule>
      <pattern>
        <marker>
          <token regexp="yes" inflected="yes">milió|bilió|trilió|coma1|zero|un</token>
        </marker>
        <token postag="DN..P." postag_regexp="yes"/>
      </pattern>
      <disambig action="add">
        <wd pos="K"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- Adds the PTime chunk to expressions built around a time noun (entities
       unitats_temps, periodes_temps, estacions, parts_dia; defined outside this file). -->
  <rulegroup id="PERIODES_DE_TEMPS" name="períodes de temps">
    <!-- Bare time noun ("segona"/"segones" excluded). -->
    <rule>
      <pattern>
        <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;<exception regexp="yes">segona|segones</exception></token>
      </pattern>
      <disambig action="addchunk">
        <wd pos="PTime"/>
      </disambig>
    </rule>
    <!-- Numeral or indefinite determiner (not "cada") + time noun. -->
    <rule>
      <pattern>
        <token postag="D[NI].*" postag_regexp="yes"><exception>cada</exception></token>
        <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;<exception regexp="yes">segona|segones</exception></token>
      </pattern>
      <disambig action="addchunk">
        <wd pos="PTime"/>
        <wd pos="PTime"/>
      </disambig>
    </rule>
    <!-- Two such determiners + time noun. -->
    <rule>
      <pattern>
        <token postag="D[NI].*" postag_regexp="yes"><exception>cada</exception></token>
        <token postag="D[NI].*" postag_regexp="yes"><exception>cada</exception></token>
        <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;<exception regexp="yes">segona|segones</exception></token>
      </pattern>
      <disambig action="addchunk">
        <wd pos="PTime"/>
        <wd pos="PTime"/>
        <wd pos="PTime"/>
      </disambig>
    </rule>
    <!-- "més de" / "menys de" in front of an existing PTime chunk joins the chunk. -->
    <rule>
      <pattern>
        <marker>
          <token regexp="yes">més|menys</token>
          <token regexp="yes">de|d'</token>
        </marker>
        <token chunk="PTime"/>
      </pattern>
      <disambig action="addchunk">
        <wd pos="PTime"/>
        <wd
pos="PTime"/> </disambig> </rule> <rule> <pattern> <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;</token> <token>i</token> <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;</token> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> <wd pos="PTime"/> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <token>anys</token> <token>i</token> <token>panys</token> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> <wd pos="PTime"/> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <token postag="DI.*" postag_regexp="yes"><exception>cada</exception></token> <token regexp="yes">de|d'</token> <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;<exception regexp="yes">segona|segones</exception></token> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> <wd pos="PTime"/> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <token postag="DI.*" postag_regexp="yes" inflected="yes" regexp="yes">un|tot</token> <token postag="D.*" postag_regexp="yes" inflected="yes" regexp="yes">quant|el</token> <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;<exception regexp="yes">segona|segones</exception></token> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> <wd pos="PTime"/> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">quasi|gairebé</token> </marker> <token chunk="PTime"/> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <token chunk="PTime"/> <marker> <token>i</token> <token regexp="yes">mig|mitja</token> </marker> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <token chunk="PTime"/> <marker> <token 
postag="CC"/> </marker> <token chunk="PTime"/> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <token chunk="PTime"/> <marker> <token regexp="yes">de|d'</token> <token regexp="yes">vida|servei|embaràs</token> </marker> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> <wd pos="PTime"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">portar|dur</token> <marker> <token>ja</token> </marker> <token chunk="PTime"/> </pattern> <disambig action="addchunk"> <wd pos="PTime"/> </disambig> </rule> </rulegroup> <rule id="PTIME_gerundi" name="període de temps + gerundi"> <pattern> <token chunk="PTime"><exception postag="D.*" postag_regexp="yes"/></token> <marker> <token postag="V.G.*" postag_regexp="yes"/> </marker> </pattern> <disambig postag="V.G.*" action="filter"/> </rule> <rule id="segon_ordinal" name="segon (ordinal) amb error de gènere"> <pattern> <marker> <token postag="A.*" postag_regexp="yes" regexp="yes" inflected="yes">segon|bo<exception>segons</exception></token> </marker> <!-- anàlisi, síndrome, casa... 
--> <token postag="NCF.*" postag_regexp="yes" regexp="yes">..+<exception postag="SPS00|C.*|P.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="A.*"/> </rule> <rulegroup id="casa_nom" name="casa (nom)"> <rule> <pattern> <token postag="A.*" postag_regexp="yes" regexp="yes" inflected="yes">segon|bo<exception>segons</exception></token> <marker> <token postag="NCF.*" postag_regexp="yes" inflected="yes">casa</token> </marker> </pattern> <disambig action="filter" postag="NCF.*"/> </rule> <rule> <pattern> <marker> <token postag="NCF.*" postag_regexp="yes" inflected="yes">casa<exception scope="previous" postag="&pronom_feble;" postag_regexp="yes"/></token> </marker> <token regexp="yes">de|d'</token> <token><exception regexp="yes">manera|forma</exception></token> </pattern> <disambig action="filter" postag="NCF.*"/> </rule> </rulegroup> <rule id="dos_o_mes" name="dos o més"> <pattern> <marker> <token postag="DN.*" postag_regexp="yes"/> </marker> <token>o</token> <token>més</token> <token postag="N..P.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="DN.*"/> </rule> <rule id="des_de" name="des de/que"> <pattern> <marker> <token>des</token> </marker> <token regexp="yes">d'|de|del|dels|que</token> </pattern> <disambig action="filter" postag="S.*"/> </rule> <rule id="deu_i_ajuda" name="Déu i ajuda (nom)"> <pattern> <token inflected="yes">costar</token> <token>Déu</token> <token>i</token> <marker> <token>ajuda</token> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="men_guard" name="me'n guard"> <pattern> <token regexp="yes">deu|déu</token> <token regexp="yes" min="1" max="2">me|em|te|et|el|la|vos|us|els|les|en|'n</token> <marker> <token>guard</token> </marker> </pattern> <disambig action="replace"> <wd lemma="guardar" pos="VMSP1S00"/> </disambig> </rule> <rule id="de_A" name="de A"> <antipattern> <token>a</token> <token regexp="yes" spacebefore="no">ls?</token> </antipattern> <pattern> <token 
postag="SPS00|LOC_PREP" postag_regexp="yes"/> <marker> <token case_sensitive="yes">A</token> </marker> </pattern> <disambig action="replace"> <wd lemma="A" pos="NCCS000"/> </disambig> </rule> <rulegroup id="any_en_xifres" name="El + any (en xifres)"> <antipattern> <token regexp="yes">\d+</token> <token>%</token> </antipattern> <rule> <pattern> <token regexp="yes">en|d?els?|anys?|dècada</token> <token regexp="yes">[12][0-9]{3}</token> <token>-</token> <marker> <token regexp="yes">[0-9]{1,4}</token> </marker> </pattern> <disambig action="replace" postag="_C_TEMPS"/> </rule> <rule> <pattern> <token postag="SENT_START"/> <token postag="_PUNCT.*" postag_regexp="yes"/> <marker> <token regexp="yes">[12][0-9]{3}</token> </marker> <token><exception postag="NC.[PN].*" postag_regexp="yes"/></token> </pattern> <disambig action="replace" postag="_C_TEMPS"/> </rule> <rule> <pattern> <token regexp="yes">anys?|mitjan|copyright</token> <marker> <token regexp="yes">[1-9][0-9]{0,3}</token> </marker> </pattern> <disambig action="replace" postag="_C_TEMPS"/> </rule> <rule> <pattern> <token postag="SENT_START"/> <token regexp="yes">en|el</token> <marker> <token regexp="yes">[1-2][0-9]{3}</token> </marker> </pattern> <disambig action="replace" postag="_C_TEMPS"/> </rule> <rule> <pattern> <token regexp="yes">en|el|l</token> <marker> <token regexp="yes">[1-2][0-9]{3}</token> </marker> </pattern> <disambig action="replace" postag="_C_TEMPS"/> </rule> <rule> <pattern> <token regexp="yes">en|el|l|l'</token> <marker> <token regexp="yes">[1-9][0-9]{0,3}</token> </marker> <token><exception postag="NC[MC]P.*|Y" postag_regexp="yes"/></token> </pattern> <disambig action="replace" postag="_C_TEMPS"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">llei|final|fi|principi|començament|inici|gener|febrer|març|abril|maig|juny|juliol|agost|setembre|octubre|novembre|desembre|des</token> <token>de</token> <marker> <token regexp="yes">[123456789][1234567890]{0,3}</token> </marker> </pattern> 
<disambig action="replace" postag="_C_TEMPS"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">llei|final|fi|principi|començament|inici|gener|febrer|març|abril|maig|juny|juliol|agost|setembre|octubre|novembre|desembre|des</token> <token>de</token> <token spacebefore="no">l</token> <marker> <token regexp="yes">[123456789][1234567890]{0,3}</token> </marker> </pattern> <disambig action="replace" postag="_C_TEMPS"/> </rule> </rulegroup> <rule id="bo" name="bo (no interjecció)"> <pattern> <token regexp="yes">bo|bona</token> </pattern> <disambig action="remove" postag="I"/> </rule> <rule id="bo_adj" name="bo (adjectiu)"> <pattern> <token postag="SPS00"/> <marker> <token>bo</token> </marker> </pattern> <disambig action="filter" postag="AQ0MS0"/> </rule> <rule id="ADVERBI_ANTEPOSAT" name="adverbi que es pot anteposar a adjectiu"> <pattern> <token postag="RG" regexp="yes">mal|.+ment|molt|poc|moltíssim|poquíssim|tantíssim|tant|tan|aleshores|alhora|almanco|almenys|aviat|bastant|ben|encara|força|gaire|gairebé|gens|inclús|ja|llavors|mai|massa|menys|mig|millor|més|no|només|pas|pitjor|potser|prompte|prou|quasi|quelcom|sempre|sobretot|sols|suara|també|tampoc|tanmateix|tostemps|tot|tothora|àdhuc</token> </pattern> <disambig action="add"> <wd pos="RG_anteposat"/> </disambig> </rule> <rule id="PROMPTE" name="prompte (adv)"> <pattern> <token>tan</token> <marker> <token>prompte</token> </marker> <token>com</token> </pattern> <disambig action="filter" postag="RG"/> </rule> <rulegroup id="CONTRACCIONS" name="contraccions"> <rule> <pattern> <marker> <token>pe</token> </marker> <token regexp="yes">ls?</token> </pattern> <disambig action="add"> <wd lemma="per" pos="SPS00"/> </disambig> </rule> <rule> <pattern> <marker> <token>pe</token> </marker> <token regexp="yes">ls?</token> </pattern> <disambig action="remove" postag="N.*"/> </rule> <rule> <pattern> <token regexp="yes">a|de|pe</token> <marker> <token spacebefore="no">l<exception postag=".*LOC_.*|NP.*" 
postag_regexp="yes"/></token> </marker> </pattern> <disambig action="replace"> <wd lemma="el" pos="DA0MS0"/> </disambig> </rule> <rule> <antipattern> <token regexp="yes">a|de|pe|ca</token> <token regexp="yes" spacebefore="no">ls?</token> </antipattern> <pattern> <token regexp="yes">ls?</token> </pattern> <disambig action="remove" postag="DA0M.0"/> </rule> <rule> <pattern> <token postag="SENT_START"/> <marker> <token regexp="yes">ls?</token> </marker> </pattern> <disambig action="remove" postag="DA0M.0"/> </rule> <rule> <pattern> <token regexp="yes">a|de|pe|ca</token> <marker> <token spacebefore="no">ls<exception postag="NP.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="replace"> <wd lemma="el" pos="DA0MP0"/> </disambig> </rule> <rule> <pattern> <marker> <token>l</token> </marker> <token spacebefore="no">'</token> <token spacebefore="no" regexp="yes">[1234567890]+</token> </pattern> <disambig action="replace"> <wd lemma="el" pos="DA0CS0"/> </disambig> </rule> <rule> <pattern> <token>ca</token> <marker> <token spacebefore="no">n</token> </marker> </pattern> <disambig action="add"> <wd lemma="can" pos="DA0CN0"/> </disambig> </rule> <rule> <pattern> <marker> <token>ca</token> </marker> <token spacebefore="no">n</token> </pattern> <disambig action="filter" postag="NCFS.*"/> </rule> <rule id="a_cal" name="a cal(s)"> <antipattern> <token>cal</token> <token postag="V.N.*" postag_regexp="yes"/> </antipattern> <pattern> <token regexp="yes">a|per|de</token> <marker> <token regexp="yes">cals?</token> </marker> </pattern> <disambig action="replace" postag="contraccio"/> </rule> <rule> <antipattern> <token>cal</token> <token postag="V.N.*" postag_regexp="yes"/> </antipattern> <pattern> <token regexp="yes">a|per|de</token> <marker> <token>cal</token> </marker> </pattern> <disambig action="add"> <wd lemma="el" pos="DA0MS0"/> </disambig> </rule> <rule> <pattern> <!-- <token regexp="yes">a|per|de</token> --> <marker> <token>cals</token> </marker> </pattern> 
<disambig action="add"> <wd lemma="el" pos="DA0MP0"/> </disambig> </rule> </rulegroup> <rulegroup id="secar" name="paraules coincidents amb el verb secar (només AVL)"> <rule> <pattern> <marker> <and> <token inflected="yes">secar<exception scope="previous" postag="P.*" postag_regexp="yes"/></token> <token negate="yes" inflected="yes">secar</token> </and> </marker> </pattern> <disambig action="remove"> <wd lemma="secar"/> </disambig> </rule> <rule> <pattern> <token>el</token> <marker> <token>secà</token> </marker> </pattern> <disambig action="remove"> <wd lemma="secar"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">el|mig|l</token> <marker> <token>sec</token> </marker> </pattern> <disambig action="remove"> <wd lemma="secar"/> </disambig> </rule> <rule> <pattern> <token>la</token> <marker> <token>seca</token> </marker> </pattern> <disambig action="remove"> <wd lemma="secar"/> </disambig> </rule> </rulegroup> <rule id="nAdj" name="no adjectiu"> <!-- paraules comunes que no solen ser adjectiu gairebé mai --> <pattern> <marker> <token regexp="yes">lluny|les|música|músiques|refés|manera|maneres|minve|minva</token> </marker> </pattern> <disambig action="filter" postag="[^A].*"/> </rule> <rule id="nombres" name="nombres (no femení)"> <pattern> <token regexp="yes">nombres|segles</token> </pattern> <disambig action="remove" postag="NCFP000"/> </rule> <rule id="noNom2" name="FA LA no nom"> <pattern> <token><exception postag="D[DAI]0MS0" postag_regexp="yes" regexp="yes">l|el|un|aquest|algun</exception></token> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">fa|la</token> </marker> <token><exception regexp="yes">menor|major|sostingut|bemoll|diesi|becaire|#|b</exception></token> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rulegroup id="ESTAR_IMPERATIU" name="formes del verb estar en imperatiu"> <rule> <pattern> <marker> <token>està</token> </marker> <token><exception spacebefore="no">-te</exception></token> </pattern> <disambig 
action="remove" postag="V.M.*"/> <example type="untouched">Està-te quiet.</example> </rule> <rule> <pattern> <marker> <token regexp="yes">esteu|estau</token> </marker> <token><exception spacebefore="no">-vos</exception></token> </pattern> <disambig action="remove" postag="V.M.*"/> </rule> <rule> <pattern> <marker> <token>estem</token> </marker> <token><exception spacebefore="no">-nos</exception></token> </pattern> <disambig action="remove" postag="V.M.*"/> </rule> </rulegroup> <rulegroup id="nom_vocals" name="el nom de les vocals"> <rule> <antipattern> <token postag="V.[MGN].*" postag_regexp="yes"/> <!-- falta un guionet --> <token>la</token> <token>a</token> <token postag="V.N.*|contraccio|D.*" postag_regexp="yes"/> </antipattern> <pattern> <token>la</token> <marker> <token regexp="yes">a|e|i|o|u</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token>l'</token> <token>una</token> <marker> <token>a</token> </marker> </pattern> <disambig action="filter" postag="SPS00"/> </rule> <rule> <pattern> <token>una<exception postag=".*LOC.*" postag_regexp="yes"/></token> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">a|e|u</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token postag="D..FS.|SPS00" postag_regexp="yes"/> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">i</token> </marker> <token regexp="yes">llarga|breu</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">[eo]</token> </marker> <token regexp="yes">tancada|oberta</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">es|os</token> </marker> <token regexp="yes">tancades|obertes</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> </rulegroup> <rule id="ha_hectarees" name="ha (hectàrees)"> 
<pattern> <token postag="DN.*" postag_regexp="yes"/> <marker> <token>ha</token> </marker> <token><exception postag="V.P..SM." postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule id="noNom" name="no nom"> <!-- paraules comunes que no solen ser noms gairebé mai (es,...) --> <antipattern> <token regexp="yes">\d[\d\.,]*</token> <token regexp="yes">fots?</token> </antipattern> <pattern> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">fot|fots|bon|creix|ros|se|es|de|i|o|a|he|ha|hem|més|en|per|ni|no|menys|fas|com</token> <token postag="N.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </pattern> <disambig action="remove" postag="N.*"/> </rule> <rule id="mans_lliures" name="mans lliures"> <pattern> <token postag="D..M[SP]." postag_regexp="yes"/> <marker> <token>mans</token> <token>lliures</token> </marker> </pattern> <disambig action="replace"> <wd lemma="mans lliures" pos="NCMN000"/> <wd lemma="mans lliures" pos="AQ0MN0"/> </disambig> </rule> <rule id="CARA" name="cara (adj/nom)"> <pattern> <marker> <token postag="NCFS000">cara</token> </marker> <token regexp="yes">amunt|avall|enfora|endins</token> </pattern> <disambig action="filter" postag="NCFS000"/> </rule> <rulegroup id="FRONTERA" name="frontera (adj/nom)"> <rule> <pattern> <marker> <token postag="NCF.*" postag_regexp="yes" inflected="yes">frontera</token> </marker> <token>enllà</token> </pattern> <disambig action="filter" postag="NCF.*"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">travessar|creuar</token> <marker> <token postag="NCF.*" postag_regexp="yes" inflected="yes">frontera</token> </marker> </pattern> <disambig action="filter" postag="NCF.*"/> </rule> </rulegroup> <rule id="A_TOCAR" name="a tocar"> <pattern> <token regexp="yes">tan|tant</token> <marker> <token>a</token> <token>tocar</token> </marker> </pattern> <disambig action="replace"> <wd lemma="a tocar" pos="LOC_ADV"/> <wd lemma="a tocar" pos="LOC_ADV"/> 
</disambig> </rule> <rule id="D_ACORD" name="d'acord (adv)"> <pattern> <token regexp="yes" inflected="yes">restar|quedar|estar|posar</token> <token min="0" max="3" postag="LOC_ADV|RG" postag_regexp="yes"/> <marker> <token>d'</token> <token>acord</token> </marker> </pattern> <disambig action="replace"> <wd lemma="d'acord" pos="LOC_ADV"/> <wd lemma="d'acord" pos="LOC_ADV"/> </disambig> </rule> <rule id="A_BAIX" name="a baix"> <pattern> <token>a</token> <token>baix</token> </pattern> <disambig action="replace"> <wd lemma="a baix" pos="LOC_ADV"/> <wd lemma="a baix" pos="LOC_ADV"/> </disambig> </rule> <rule id="A_DALT" name="a dalt"> <pattern> <token>a</token> <token>dalt</token> </pattern> <disambig action="replace"> <wd lemma="a dalt" pos="LOC_ADV"/> <wd lemma="a dalt" pos="LOC_ADV"/> </disambig> </rule> <rulegroup id="ALTRA_VEGADA" name="altra vegada (loc. adverbial)"> <rule> <pattern> <token>altre</token> <token regexp="yes">cop|pic|colp</token> </pattern> <disambig action="replace"> <wd lemma="altra vegada" pos="LOC_ADV"/> <wd lemma="altra vegada" pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token>altra</token> <token regexp="yes">vegada|volta</token> </pattern> <disambig action="replace"> <wd lemma="altra vegada" pos="LOC_ADV"/> <wd lemma="altra vegada" pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token>un</token> <token>altre</token> <token regexp="yes">cop|pic|colp</token> </pattern> <disambig action="replace"> <wd lemma="altra vegada" pos="LOC_ADV"/> <wd lemma="altra vegada" pos="LOC_ADV"/> <wd lemma="altra vegada" pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token>una</token> <token>altra</token> <token regexp="yes">vegada|volta</token> </pattern> <disambig action="replace"> <wd lemma="altra vegada" pos="LOC_ADV"/> <wd lemma="altra vegada" pos="LOC_ADV"/> <wd lemma="altra vegada" pos="LOC_ADV"/> </disambig> </rule> </rulegroup> <rulegroup id="LOCUCIONS" name="locucions adverbials, preposicionals, conjuntives"> <!-- locucions 
concretes-->
    <!-- "gota a gota": the three marked tokens are replaced by LOC_ADV readings,
         provided the preceding token has no D.* reading. -->
    <rule id="gota_a_gota" name="gota a gota (locució adverbial)">
      <pattern>
        <token><exception postag="D.*" postag_regexp="yes"/></token>
        <marker>
          <token>gota</token>
          <token>a</token>
          <token>gota</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd lemma="gota a gota" pos="LOC_ADV"/>
        <wd lemma="gota a gota" pos="LOC_ADV"/>
        <wd lemma="gota a gota" pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- "d'/per" + "una/altra" + "banda/part" with a comma on each side:
         the three marked tokens are replaced by LOC_CONJ readings. -->
    <rule id="duna_banda" name="d'una banda (locució conj.)">
      <pattern>
        <token>,</token>
        <marker>
          <token regexp="yes">d'|per</token>
          <token regexp="yes">una|altra</token>
          <token regexp="yes">banda|part</token>
        </marker>
        <token>,</token>
      </pattern>
      <disambig action="replace">
        <wd lemma="daltra_banda" pos="LOC_CONJ"/>
        <wd lemma="daltra_banda" pos="LOC_CONJ"/>
        <wd lemma="daltra_banda" pos="LOC_CONJ"/>
      </disambig>
    </rule>
    <!-- "temps ha" / "anys ha": replaced by LOC_ADV readings unless the next
         token has a V.P.* reading. -->
    <rule id="temps_ha" name="temps ha (locució adverbial)">
      <pattern>
        <marker>
          <token regexp="yes">temps|anys</token>
          <token>ha</token>
        </marker>
        <token><exception postag="V.P.*" postag_regexp="yes"/></token>
      </pattern>
      <disambig action="replace">
        <wd lemma="temps ha" pos="LOC_ADV"/>
        <wd lemma="temps ha" pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- "a espai" ("espai" is matched case-sensitively): not applied when the
         preceding token is an inflected form of com, per or dedicar. -->
    <rule id="a_espai" name="a espai (locució adverbial)">
      <pattern>
        <token><exception regexp="yes" inflected="yes">com|per|dedicar</exception></token>
        <marker>
          <token>a</token>
          <token case_sensitive="yes">espai</token>
        </marker>
        <token><exception postag="AQ0[MC][SN].|V.P..SM."
postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="a espai" pos="LOC_ADV"/> <wd lemma="a espai" pos="LOC_ADV"/> </disambig> </rule> <rule id="de_prop" name="de prop (locució adverbial)"> <antipattern> <token>prop</token> <token postag="PX.*" postag_regexp="yes"/> </antipattern> <pattern> <marker> <token>de</token> <token>prop</token> </marker> </pattern> <disambig action="replace"> <wd lemma="de prop" pos="LOC_ADV"/> <wd lemma="de prop" pos="LOC_ADV"/> </disambig> </rule> <rule id="venir_de_gust" name="venir de gust (locució adverbial)"> <pattern> <token inflected="yes">venir</token> <token min="0" max="3" postag="RG|LOC_ADV" postag_regexp="yes"/> <marker> <token>de</token> <token>gust</token> </marker> </pattern> <disambig action="replace"> <wd lemma="de gust" pos="LOC_ADV"/> <wd lemma="de gust" pos="LOC_ADV"/> </disambig> </rule> <rule id="en_va1" name="en va (locució adverbial)"> <pattern> <token><exception regexp="yes">'ls|'ns|us|hi</exception></token> <marker> <token>en</token> <token>va</token> </marker> <token><exception postag="V.[NG].*|A.*|V.P.*SM.?" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="en va" pos="LOC_ADV"/> <wd lemma="en va" pos="LOC_ADV"/> </disambig> </rule> <rule id="fa_poc" name="fa poc (locució adverbial)"> <pattern> <marker> <token>fa</token> <token>poc</token> </marker> <token><exception postag="A..[MC][SN].|V.P..SM." postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="fa poc" pos="LOC_ADV"/> <wd lemma="fa poc" pos="LOC_ADV"/> </disambig> </rule> <rule id="fa_molt_poc" name="fa molt poc (locució adverbial)"> <pattern> <marker> <token>fa<exception scope="previous">es</exception></token> <token>molt</token> <token>poc</token> </marker> <token><exception postag="A..[MC][SN].|V.P..SM." 
postag_regexp="yes"/></token>
      </pattern>
      <disambig action="replace">
        <wd lemma="fa molt poc" pos="LOC_ADV"/>
        <wd lemma="fa molt poc" pos="LOC_ADV"/>
        <wd lemma="fa molt poc" pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- "en realitat": both marked tokens are replaced by LOC_ADV readings unless
         the next token is "augmentada" or "virtual". The lemma is the locution
         itself ("en realitat"), as in the sibling rules of this group. -->
    <rule id="en_realitat" name="en realitat (locució adverbial)">
      <pattern>
        <marker>
          <token>en</token>
          <token>realitat</token>
        </marker>
        <token><exception regexp="yes">augmentada|virtual</exception></token>
      </pattern>
      <disambig action="replace">
        <wd lemma="en realitat" pos="LOC_ADV"/>
        <wd lemma="en realitat" pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- "com a màxim" / "com a mínim": replaced by LOC_ADV readings (lemma
         "com a mínim" for both variants) unless the next token matches
         AQ.[MC][SN]. or V.P..SM. -->
    <rule id="com_a_minim" name="com a mínim (locució adverbial)">
      <pattern>
        <marker>
          <token>com</token>
          <token>a</token>
          <token regexp="yes">màxim|mínim</token>
        </marker>
        <token><exception postag="AQ.[MC][SN].|V.P..SM." postag_regexp="yes"/></token>
      </pattern>
      <disambig action="replace">
        <wd lemma="com a mínim" pos="LOC_ADV"/>
        <wd lemma="com a mínim" pos="LOC_ADV"/>
        <wd lemma="com a mínim" pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- "un punt" between an N.* token and an A.* token (optionally preceded by
         "més"/"menys"); the A.* token must not be "estratègic". -->
    <rule id="un_punt" name="un punt (locució adverbial)">
      <!-- agreement checking would be needed here -->
      <pattern>
        <token postag="N.*" postag_regexp="yes"/>
        <marker>
          <token>un</token>
          <token>punt</token>
        </marker>
        <token min="0" regexp="yes">més|menys</token>
        <token postag="A.*" postag_regexp="yes"><exception>estratègic</exception></token>
      </pattern>
      <disambig action="replace">
        <wd lemma="un punt" pos="LOC_ADV"/>
        <wd lemma="un punt" pos="LOC_ADV"/>
      </disambig>
    </rule>
    <rule id="al_principi" name="al principi (locució adverbial)">
      <pattern>
        <marker>
          <token>a</token>
          <token>l</token>
          <token regexp="yes">principi|començament</token>
        </marker>
        <token postag="A..F..|A..MS.|V.P...F.|V.P..SM."
postag_regexp="yes"/> </pattern> <disambig action="replace"> <wd lemma="al principi" pos="LOC_ADV"/> <wd lemma="al principi" pos="LOC_ADV"/> <wd lemma="al principi" pos="LOC_ADV"/> </disambig> </rule> <rule id="de_primera" name="de primera (locució adverbial)"> <pattern> <marker> <token>de</token> <token>primera</token> </marker> <token><exception postag="NC[FC][SN].*" postag_regexp="yes"/><exception>ma</exception></token> </pattern> <disambig action="replace"> <wd lemma="de primera" pos="LOC_ADV"/> <wd lemma="de primera" pos="LOC_ADV"/> </disambig> </rule> <rule id="per_fi" name="per fi (locució adverbial)"> <pattern> <marker> <token>per</token> <token>fi</token> </marker> </pattern> <disambig action="replace"> <wd lemma="per fi" pos="LOC_ADV"/> <wd lemma="per fi" pos="LOC_ADV"/> </disambig> </rule> <rule id="de_moment" name="de moment (locució adverbial)"> <antipattern> <token>moment</token> <token regexp="yes">angular|lineal|dipolar|inercial|magnètic</token> </antipattern> <antipattern> <token>moment</token> <token>d'</token> <token>inèrcia</token> </antipattern> <pattern> <marker> <token>de</token> <token>moment</token> </marker> </pattern> <disambig action="replace"> <wd lemma="de moment" pos="LOC_ADV"/> <wd lemma="de moment" pos="LOC_ADV"/> </disambig> </rule> <rule id="de_moda" name="de moda (locució adj.)"> <pattern> <marker> <token>de</token> <token>moda</token> </marker> <token><exception postag="A..[FC][SN].|V.P..SF." postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="de moda" pos="LOC_ADJ"/> <wd lemma="de moda" pos="LOC_ADJ"/> </disambig> </rule> <rule id="de_mentida" name="de mentida (locució adj.)"> <pattern> <marker> <token>de</token> <token>mentida</token> </marker> <token><exception postag="A..[FC][SN].|V.P..SF." 
postag_regexp="yes"/></token>
      </pattern>
      <disambig action="replace">
        <wd lemma="de mentida" pos="LOC_ADJ"/>
        <wd lemma="de mentida" pos="LOC_ADJ"/>
      </disambig>
    </rule>
    <!-- "gràcies a": both tokens are replaced by LOC_PREP readings. The antipattern
         blocks the rule when a D.* token precedes "gràcies a", except when that
         token is an inflected form of tot or deu. The untouched example below
         relies on "Moltes" carrying a D.* reading (TODO confirm against the tagger). -->
    <rule id="gracies_a" name="gràcies a (locució preposicional)">
      <antipattern>
        <token postag="D.*" postag_regexp="yes"><exception inflected="yes" regexp="yes">tot|deu</exception></token>
        <token>gràcies</token>
        <token>a</token>
      </antipattern>
      <pattern>
        <marker>
          <token>gràcies</token>
          <token>a</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd lemma="gràcies a" pos="LOC_PREP"/>
        <wd lemma="gràcies a" pos="LOC_PREP"/>
      </disambig>
      <example type="untouched">Moltes <marker>gràcies a</marker> tots.</example>
    </rule>
    <!-- "llevat de/d'": replaced by LOC_PREP readings unless the preceding token
         is an inflected form of haver. -->
    <rule id="llevat_de" name="llevat de (locució preposicional)">
      <pattern>
        <token><exception inflected="yes">haver</exception></token>
        <marker>
          <token>llevat</token>
          <token regexp="yes">de|d'</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd lemma="llevat de" pos="LOC_PREP"/>
        <wd lemma="llevat de" pos="LOC_PREP"/>
      </disambig>
      <example type="untouched">Per fi, ens l'hem <marker>llevat de</marker> damunt.</example>
    </rule>
    <!-- "lluny de/d'": replaced by LOC_PREP readings unless the preceding token
         has an RG reading. -->
    <rule id="lluny_de" name="lluny de (locució preposicional)">
      <pattern>
        <token><exception postag="RG"/></token>
        <marker>
          <token>lluny</token>
          <token regexp="yes">de|d'</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd lemma="lluny de" pos="LOC_PREP"/>
        <wd lemma="lluny de" pos="LOC_PREP"/>
      </disambig>
    </rule>
    <!-- "abans de/d'": replaced by LOC_PREP readings unless the "de/d'" token
         already has a LOC_.* reading. -->
    <rule id="abans_de" name="abans de (locució preposicional)">
      <pattern>
        <marker>
          <token>abans</token>
          <token regexp="yes">de|d'<exception postag="LOC_.*" postag_regexp="yes"/></token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd lemma="abans de" pos="LOC_PREP"/>
        <wd lemma="abans de" pos="LOC_PREP"/>
      </disambig>
      <!-- Why doesn't it work? The full hybrid disambiguator is not applied?
<example type="untouched">Abans de tant en tant ho feia.</example> <example type="untouched">Abans de vegades ho feia.</example>--> </rule> <rule id="a_fi_de" name="a fi de (locució conjuntiva)"> <pattern> <marker> <token>a</token> <token>fi</token> <token regexp="yes">de|d'</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="replace"> <wd lemma="a fi de" pos="LOC_CONJ"/> <wd lemma="a fi de" pos="LOC_CONJ"/> <wd lemma="a fi de" pos="LOC_CONJ"/> </disambig> </rule> <rule id="entorn_de" name="a entorn de (locució prepositiva)"> <pattern> <token><exception postag="D..[MC]S." postag_regexp="yes"/></token> <marker> <token>entorn</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd lemma="entorn de" pos="LOC_PREP"/> <wd lemma="entorn de" pos="LOC_PREP"/> </disambig> </rule> <rule id="en_contra_de" name="en contra de (locució prepositiva)"> <pattern> <marker> <token>en</token> <token>contra</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd lemma="en contra de" pos="LOC_PREP"/> <wd lemma="en contra de" pos="LOC_PREP"/> <wd lemma="en contra de" pos="LOC_PREP"/> </disambig> </rule> <rule id="en_contra" name="en contra (locució adverbial)"> <pattern> <marker> <token>en<exception postag="LOC_PREP"/></token> <token>contra</token> </marker> </pattern> <disambig action="replace"> <wd lemma="en contra" pos="LOC_ADV"/> <wd lemma="en contra" pos="LOC_ADV"/> </disambig> </rule> <rule id="a_part_de" name="a part de (locució prepositiva)"> <pattern> <marker> <token>a</token> <token>part</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd lemma="a part de" pos="LOC_PREP"/> <wd lemma="a part de" pos="LOC_PREP"/> <wd lemma="a part de" pos="LOC_PREP"/> </disambig> </rule> <rule id="a_part" name="a part (locució adverbial)"> <pattern> <marker> <token>a<exception postag="LOC_PREP"/></token> <token>part</token> </marker> 
</pattern> <disambig action="replace"> <wd lemma="a part" pos="LOC_ADV"/> <wd lemma="a part" pos="LOC_ADV"/> </disambig> </rule> <rule id="damagat_de" name="d'amagat de (locució prepositiva)"> <pattern> <marker> <token>d'</token> <token>amagat</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd lemma="d'amagat de" pos="LOC_PREP"/> <wd lemma="d'amagat de" pos="LOC_PREP"/> <wd lemma="d'amagat de" pos="LOC_PREP"/> </disambig> </rule> <rule id="damagat" name="d'amagat (locució adverbial)"> <pattern> <marker> <token>d'<exception postag="LOC_PREP"/></token> <token>amagat</token> </marker> </pattern> <disambig action="replace"> <wd lemma="d'amagat" pos="LOC_ADV"/> <wd lemma="d'amagat" pos="LOC_ADV"/> </disambig> </rule> <rule id="al_capdamunt_de" name="al capdamunt de (locució prepositiva)"> <pattern> <marker> <token>a</token> <token spacebefore="no">l</token> <token regexp="yes">capdamunt|capdavall|capdavant</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd lemma="al capdamunt de" pos="LOC_PREP"/> <wd lemma="al capdamunt de" pos="LOC_PREP"/> <wd lemma="al capdamunt de" pos="LOC_PREP"/> <wd lemma="al capdamunt de" pos="LOC_PREP"/> </disambig> </rule> <rule id="al_capdamunt" name="al capdamunt (locució adverbial)"> <pattern> <marker> <token>a<exception postag="LOC_PREP"/></token> <token spacebefore="no">l</token> <token regexp="yes">capdamunt|capdavall|capdavant</token> </marker> </pattern> <disambig action="replace"> <wd lemma="al capdamunt" pos="LOC_ADV"/> <wd lemma="al capdamunt" pos="LOC_ADV"/> <wd lemma="al capdamunt" pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token><exception>el</exception></token> <marker> <token>primer</token> <token>de</token> <token>tot</token> </marker> </pattern> <disambig action="add"> <wd lemma="primer de tot" pos="LOC_ADV"/> <wd lemma="primer de tot" pos="LOC_ADV"/> <wd lemma="primer de tot" pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> 
<marker> <token>a</token> <token>la</token> <token regexp="yes">lleugera|valenta|llarga|callada|boja|clara|curta|descoberta|descosida|desesperada|destapada|fresca|impensada|menuda|antiga|quieta|regalada|sorda</token> </marker> <token><exception postag="NC[FC][SN].*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="a la lleugera" pos="LOC_ADV"/> <wd lemma="a la lleugera" pos="LOC_ADV"/> <wd lemma="a la lleugera" pos="LOC_ADV"/> </disambig> <example type="untouched">Es deu <marker>a la lleugera</marker> millora del mercat.</example> </rule> <rule> <pattern> <token>en</token> <token>contra</token> <token regexp="yes">[mts]e(u|ua|va)</token> </pattern> <disambig action="replace"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> </rule> <!--<rule> <pattern> <token>cada</token> <token regexp="yes">una?</token> </pattern> <disambig action="replace"> <wd pos="LOC_ADJ"/> <wd pos="LOC_ADJ"/> </disambig> </rule>--> <rule> <pattern> <token inflected="yes" skip="3" regexp="yes">girar|caure|tombar</token> <marker> <token>d'</token> <token>esquena</token> </marker> </pattern> <disambig action="replace"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> </rule> <rule id="de_nou" name="de nou"> <antipattern> <token>més</token> <token>de</token> <token>nou</token> </antipattern> <pattern> <marker> <token>de</token> <token>nou</token> </marker> <token><exception postag="NC[MC][SN].*|NC.[PN].*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> <example type="untouched">Amb la proposta <marker>de nou</marker> servidor</example> <example type="untouched">Amb un termini d'execució <marker>de nou</marker> mesos.</example> <example type="untouched">N'hi havia més <marker>de nou</marker>.</example> </rule> <rule id="de_veritat" name="de veritat"> <pattern> <marker> <token>de</token> <token>veritat</token> </marker> <token><exception postag="AQ.[FC][SN]." 
postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> <example type="untouched">Porcions <marker>de veritat</marker> absoluta.</example> </rule> <rule id="a_mes" name="a més"> <antipattern> <token inflected="yes">donar</token> <token>lloc</token> <token>a</token> </antipattern> <pattern> <token><exception regexp="yes" inflected="yes">per|fins|arribar|correspondre|situar|col·locar|ubicar</exception></token> <marker> <token>a<exception postag="LOC_ADV"/></token> <token>més</token> </marker> </pattern> <disambig action="replace"> <wd pos="LOC_ADV" lemma="a més"/> <wd pos="LOC_ADV" lemma="a més"/> </disambig> <example type="untouched">Per <marker>a més</marker> d'un dia.</example> </rule> <rule id="en_canvi" name="en canvi"> <pattern> <marker> <token regexp="yes">en|a</token> <token>canvi</token> </marker> <token><exception regexp="yes">de|d'</exception></token> </pattern> <disambig action="replace"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> <example type="untouched">Va dir que sí <marker>a canvi</marker> de diners.</example> </rule> <rule id="per_tant" name="per tant"> <pattern> <marker> <token>per</token> <token>tant</token> </marker> <token><exception regexp="yes">de|d'</exception><exception postag="NC[MC][SN].*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd lemma="per tant" pos="LOC_CONJ"/> <wd lemma="per tant" pos="LOC_CONJ"/> </disambig> <example type="untouched">I <marker>per tant</marker> honor.</example> </rule> <rule id="de_fiar" name="de fiar"> <pattern> <token postag="NC.*|AQ.*" postag_regexp="yes"/> <marker> <token>de</token> <token>fiar</token> </marker> <token><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">-.*</exception></token> </pattern> <disambig action="replace"> <wd pos="LOC_ADJ"/> <wd pos="LOC_ADJ"/> </disambig> <example type="untouched">No us heu <marker>de fiar</marker> de ningú.</example> </rule> <rule id="a_prop_de" 
name="a prop/sobre/damunt de"> <pattern> <token><exception regexp="yes">la|cap</exception></token> <marker> <token>a</token> <token regexp="yes">prop|sobre|sota|damunt|davall|començaments?|finals?|inicis?|principis?|tocar</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd pos="LOC_PREP"/> <wd pos="LOC_PREP"/> <wd pos="LOC_PREP"/> </disambig> </rule> <rule id="per_sobre_de" name="per sobre de"> <pattern> <marker> <token>per</token> <token regexp="yes">sobre|sota|damunt|davall</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd pos="LOC_PREP"/> <wd pos="LOC_PREP"/> <wd pos="LOC_PREP"/> </disambig> </rule> <rule id="a_la_recerca_de" name="a la recerca de"> <pattern> <token><exception>per</exception></token> <marker> <token>a</token> <token>la</token> <token>recerca</token> <token regexp="yes">de|d'</token> </marker> </pattern> <disambig action="replace"> <wd pos="LOC_PREP"/> <wd pos="LOC_PREP"/> <wd pos="LOC_PREP"/> <wd pos="LOC_PREP"/> </disambig> </rule> <rule id="a_prop" name="a prop/sobre/damunt"> <pattern> <token><exception>la</exception></token> <marker> <token>a</token> <token regexp="yes">prop|sobre|sota|damunt|davall|gust|pler|plaer</token> </marker> <token><exception regexp="yes">de|d'</exception><exception postag="PX.MS.*" postag_regexp="yes"/></token> </pattern> <disambig action="replace"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> <example type="untouched">És tan <marker>a prop</marker> meu.</example> </rule> <rule id="a_prop_seu" name="a prop/sobre/damunt... 
seu">
  <pattern>
    <token><exception>la</exception></token>
    <marker>
      <token>a</token>
      <token regexp="yes">prop|sobre|sota|damunt|davall|gust|pler|plaer</token>
      <token postag="PX.MS.*" postag_regexp="yes"/>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- "en forma" as an adverbial locution: marked pair becomes LOC_ADV.
     Antipattern: "en forma" + optional RG + token tagged AQ.[FC]S.* or VMP..SF.
     Also skipped when the next token is de / d' / part. -->
<rule id="en_forma" name="en forma">
  <antipattern>
    <token>en</token>
    <token>forma</token>
    <token postag="RG" min="0"/>
    <token postag="AQ.[FC]S.*|VMP..SF." postag_regexp="yes"/>
  </antipattern>
  <pattern>
    <marker>
      <token>en</token>
      <token>forma</token>
    </marker>
    <token><exception regexp="yes">de|d'|part</exception></token>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
  <example type="untouched">És <marker>en forma</marker> hexagonal.</example>
</rule>

<!-- "en perill" as an adverbial locution: marked pair becomes LOC_ADV.
     Antipattern: "en perill" + optional RG + token tagged AQ.[MC]S.* or VMP..SM. -->
<rule id="en_perill" name="en perill">
  <antipattern>
    <token>en</token>
    <token>perill</token>
    <token postag="RG" min="0"/>
    <token postag="AQ.[MC]S.*|VMP..SM." postag_regexp="yes"/>
  </antipattern>
  <pattern>
    <marker>
      <token>en</token>
      <token>perill</token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
  <example type="untouched">És <marker>en perill</marker> altament crític.</example>
</rule>

<!-- "en forma" read as SPS00 + NCFS000 when followed by a token tagged AQ.[FC]S.* or VMP..SF.
     (other than "part"); the disambiguation action is filterall. -->
<rule id="en_forma_n" name="en forma (nom)">
  <pattern>
    <marker>
      <token postag="SPS00">en</token>
      <token postag="NCFS000">forma</token>
    </marker>
    <token postag="AQ.[FC]S.*|VMP..SF." 
postag_regexp="yes"><exception>part</exception></token>
  </pattern>
  <disambig action="filterall"/>
  <example type="untouched">Ell <marker>en forma</marker> part.</example>
</rule>

<!-- "a la vora": three marked tokens become LOC_ADV unless followed by de / d' / dreta / esquerra. -->
<rule>
  <pattern>
    <marker>
      <token>a</token>
      <token>la</token>
      <token>vora</token>
    </marker>
    <token><exception regexp="yes">de|d'|dreta|esquerra</exception></token>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- "a fons": marked pair becomes LOC_ADV unless followed by perdut / públics. -->
<rule>
  <pattern>
    <marker>
      <token>a</token>
      <token>fons</token>
    </marker>
    <token><exception regexp="yes">perdut|públics</exception></token>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- adverbial locutions of time -->

<!-- "de X en X": the fourth token repeats token 1 via <match no="1"/>; token 1 is any token
     except those matching tant? / quant?. All four tokens become LOC_ADV. -->
<rule id="de_tant_en_tant" name="de tant en tant">
  <pattern>
    <marker>
      <token>de</token>
      <token><exception regexp="yes">tant?|quant?</exception></token>
      <token>en</token>
      <token><match no="1"/></token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- "N per/darrere/rere/a N" with the same noun repeated (<match no="0"/>): becomes LOC_ADV.
     Antipattern: de|a|el|l (inflected) + noun + "a". The noun may not be "de" or "gota". -->
<rule id="any_a_any" name="any a any">
  <antipattern>
    <token inflected="yes" regexp="yes">de|a|el|l</token>
    <token postag="N.*" postag_regexp="yes"/>
    <token>a</token>
  </antipattern>
  <pattern>
    <marker>
      <token postag="N.*" postag_regexp="yes"><exception regexp="yes">de|gota</exception></token>
      <token regexp="yes">per|darrere|rere|a</token>
      <token><match no="0"/></token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- "en" + a form of "poc" + plural time noun, unified on the nombre and genere features:
     the three marked tokens become LOC_ADV. -->
<rule id="en_pocs_anys" name="en pocs anys/dies/hores/minuts...">
  <pattern>
    <marker>
      <token>en</token>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token inflected="yes">poc</token>
        <token postag="NC.P.*" postag_regexp="yes" inflected="yes" regexp="yes">&unitats_temps;|&periodes_temps;</token>
      </unify>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd 
pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- "havent" + token tagged VMP00SM.?: marked pair becomes LOC_ADV_TEMP unless followed by "que". -->
<rule id="havent_dinat" name="havent dinat">
  <pattern>
    <marker>
      <token>havent</token>
      <token postag="VMP00SM.?" postag_regexp="yes"/>
    </marker>
    <token><exception>que</exception></token>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV_TEMP"/>
    <wd pos="LOC_ADV_TEMP"/>
  </disambig>
</rule>

<!-- Plural time unit + "i" + the same word again (<match no="0"/>): becomes LOC_ADV. -->
<rule id="anys_i_anys" name="anys i anys">
  <pattern>
    <marker>
      <token regexp="yes">hores|dies|setmanes|mesos|anys|dècades|segles</token>
      <token>i</token>
      <token><match no="0"/></token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- Same construction with "més" inserted: "anys i més anys". -->
<rule id="anys_i_anys2" name="anys i més anys">
  <pattern>
    <marker>
      <token regexp="yes">hores|dies|setmanes|mesos|anys|dècades|segles</token>
      <token>i</token>
      <token>més</token>
      <token><match no="0"/></token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- "entre" + noun + "i" + the same noun (<match no="1"/>): all four tokens become LOC_ADV. -->
<rule id="entre_classe_i_classe" name="entre classe i classe">
  <pattern>
    <marker>
      <token>entre</token>
      <token postag="N.*" postag_regexp="yes"/>
      <token>i</token>
      <token><match no="1"/></token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- Pronoun (P[P0].*) + verb (V.S.*) + "com" + the same two tokens repeated:
     no marker is used, so one LOC_ADV <wd> is listed for each of the five tokens. -->
<rule id="esdiguicomesdigui" name="es digui com es digui">
  <pattern>
    <token postag="P[P0].*" postag_regexp="yes"/>
    <token postag="V.S.*" postag_regexp="yes"/>
    <token>com</token>
    <token><match no="0"/></token>
    <token><match no="1"/></token>
  </pattern>
  <disambig action="replace">
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
    <wd pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- <rule id="cada_vegada" name="cada vegada"> <pattern> <token>cada</token> <marker> <token regexp="yes">hora|dia|mes|any|vegada|volta|cop|minut|segon|moment|setmana</token> </marker> <token regexp="yes">menors|majors</token> </pattern> <disambig 
action="filter" postag="[^N].*"/> </rule>-->

<!-- "per" + ordinal (AO.*) + vegada/volta/cop/colp, unified on nombre and genere:
     a LOC_ADV reading with the fixed lemma "per primera vegada" is added to each token. -->
<rule id="per_ultima_vegada" name="per última vegada">
  <pattern>
    <marker>
      <token>per</token>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token postag="AO.*" postag_regexp="yes"/>
        <token regexp="yes">vegada|volta|col?p</token>
      </unify>
    </marker>
  </pattern>
  <disambig action="add">
    <wd pos="LOC_ADV" lemma="per primera vegada"/>
    <wd pos="LOC_ADV" lemma="per primera vegada"/>
    <wd pos="LOC_ADV" lemma="per primera vegada"/>
  </disambig>
</rule>

<!-- Noun + "fruit de/d'": the marked pair becomes LOC_PREP with lemma "fruit de". -->
<rule id="fruit_de" name="fruit de">
  <pattern>
    <token postag="N.*" postag_regexp="yes"/>
    <marker>
      <token>fruit</token>
      <token regexp="yes">de|d'</token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd lemma="fruit de" pos="LOC_PREP"/>
    <wd lemma="fruit de" pos="LOC_PREP"/>
  </disambig>
</rule>

<!-- "d'esquena": only "d'" is marked; it gains a LOC_ADV reading with lemma "d'esquena". -->
<rule id="desquena" name="d'esquena">
  <pattern>
    <marker>
      <token>d'</token>
    </marker>
    <token>esquena</token>
  </pattern>
  <disambig action="add">
    <wd lemma="d'esquena" pos="LOC_ADV"/>
  </disambig>
</rule>

<!-- "donat que" / "atès que" after sentence start or punctuation: a LOC_CONJ reading
     (lemma "donat que") is added to both marked tokens. -->
<rule id="donat_que" name="donat que (loc conj)">
  <pattern>
    <token postag="SENT_START|_PUNCT.*" postag_regexp="yes"/>
    <marker>
      <token regexp="yes">donat|atès|atés</token>
      <!-- watch out for the accent variants -->
      <token>que</token>
    </marker>
  </pattern>
  <disambig action="add">
    <wd lemma="donat que" pos="LOC_CONJ"/>
    <wd lemma="donat que" pos="LOC_CONJ"/>
  </disambig>
</rule>

<!-- "els ets i els uts": the marked "ets" is replaced by NCMP000 with lemma "ets". -->
<rule id="els_ets_i_els_uts" name="els ets i els uts">
  <pattern>
    <token>els</token>
    <marker>
      <token>ets</token>
    </marker>
    <token>i</token>
    <token>els</token>
    <token>uts</token>
  </pattern>
  <disambig action="replace">
    <wd lemma="ets" pos="NCMP000"/>
  </disambig>
</rule>

<!-- "ets i uts": same replacement without the articles. -->
<rule id="ets_i_uts" name="ets i uts">
  <pattern>
    <marker>
      <token>ets</token>
    </marker>
    <token>i</token>
    <token>uts</token>
  </pattern>
  <disambig action="replace">
    <wd lemma="ets" pos="NCMP000"/>
  </disambig>
</rule>
</rulegroup>

<!-- Abbreviations. First rule: "p." followed by a spaced second abbreviation and its dot. -->
<rulegroup id="abreviacions" name="abreviacions">
  <rule>
    <pattern>
      <token>p</token>
      <token spacebefore="no">.</token>
      <token spacebefore="yes" 
regexp="yes">[adeopbnmi]|abs|ex</token>
      <token spacebefore="no">.</token>
    </pattern>
    <disambig action="add">
      <wd pos="LOC_ADV"/>
      <wd pos="LOC_ADV"/>
      <wd pos="LOC_ADV"/>
      <wd pos="LOC_ADV"/>
    </disambig>
  </rule>

  <!-- "p." followed by digits: "p" gains NCFS000 with lemma "pàgina". -->
  <rule>
    <pattern>
      <marker>
        <token>p</token>
      </marker>
      <token spacebefore="no">.</token>
      <token regexp="yes">\d+</token>
    </pattern>
    <disambig action="add">
      <wd pos="NCFS000" lemma="pàgina"/>
    </disambig>
  </rule>

  <!-- Digits followed by "p.": "p" gains NCFN000 with lemma "pàgina". -->
  <rule>
    <pattern>
      <token regexp="yes">\d+</token>
      <marker>
        <token>p</token>
      </marker>
      <token spacebefore="no">.</token>
    </pattern>
    <disambig action="add">
      <wd pos="NCFN000" lemma="pàgina"/>
    </disambig>
  </rule>

  <rule>
    <!-- 1a ed. -->
    <pattern>
      <token regexp="yes">\d+a</token>
      <marker>
        <token>ed</token>
      </marker>
      <token spacebefore="no">.</token>
    </pattern>
    <disambig action="add">
      <wd pos="NCFS000" lemma="edició"/>
    </disambig>
  </rule>

  <!-- "min." followed by digits: "min" gains an NCMN000 reading. -->
  <rule>
    <pattern>
      <marker>
        <token>min</token>
      </marker>
      <token spacebefore="no">.</token>
      <token regexp="yes">\d+</token>
    </pattern>
    <disambig action="add">
      <wd pos="NCMN000"/>
    </disambig>
  </rule>

  <!-- "n.": gains an NCCN000 reading; the digit requirement is commented out. -->
  <rule>
    <pattern>
      <marker>
        <token>n</token>
      </marker>
      <token spacebefore="no">.</token>
      <!--<token regexp="yes">\d+</token>-->
    </pattern>
    <disambig action="add">
      <wd pos="NCCN000"/>
    </disambig>
    <!-- stands for: nota, número, nom -->
  </rule>

  <!-- "hi ha" as pronoun + verb: filterall on both marked tokens. -->
  <rule>
    <pattern>
      <marker>
        <token postag="P.*" postag_regexp="yes">hi</token>
        <token postag="V.*" postag_regexp="yes">ha</token>
      </marker>
    </pattern>
    <disambig action="filterall"/>
  </rule>

  <!-- A token with a Y reading directly followed by a dot that is not tagged SENT_END:
       filter the marked token to Y. -->
  <rule id="abreviacions_punt" name="abreviacions seguides de punt">
    <pattern>
      <marker>
        <token postag="Y"/>
      </marker>
      <token spacebefore="no">.<exception postag="SENT_END"/></token>
    </pattern>
    <disambig action="filter" postag="Y"/>
  </rule>

  <!-- "loc." before a locution type name: "loc" gains NCFS000 with lemma "locució". -->
  <rule>
    <pattern>
      <marker>
        <token>loc</token>
      </marker>
      <token spacebefore="no">.</token>
      <token regexp="yes">comparativa|adjectival|distributiva|preposicional|conjuncional|adverbial</token>
    </pattern>
    <disambig action="add">
      <wd lemma="locució" pos="NCFS000"/>
    </disambig>
  </rule>

  <rule> 
<pattern>
      <marker>
        <token regexp="yes">v|adj|adv|f</token>
      </marker>
      <token spacebefore="no">.</token>
    </pattern>
    <disambig action="add">
      <wd lemma="cat_gramatical" pos="NCMN000"/>
    </disambig>
  </rule>
</rulegroup>

<!-- Abbreviated personal names: a single capital A-Z plus dot before a capitalised word
     (one or two initials). The marked initial is exempted from spell checking. -->
<rulegroup id="noms_persona" name="noms de persona abreviats">
  <rule>
    <pattern case_sensitive="yes">
      <marker>
        <token regexp="yes">[A-Z]</token>
      </marker>
      <token spacebefore="no">.</token>
      <token regexp="yes">\p{Lu}.*</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
  <rule>
    <pattern case_sensitive="yes">
      <marker>
        <token regexp="yes">[A-Z]</token>
      </marker>
      <token spacebefore="no">.</token>
      <token regexp="yes">[A-Z]</token>
      <token spacebefore="no">.</token>
      <token regexp="yes">\p{Lu}.*</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
</rulegroup>

<!-- Prefix directly followed by a hyphen: the prefix is retagged AQ0CN0. -->
<rule id="prefixos_amb_guionet" name="prefixos amb guionet: micro-, mini-">
  <pattern>
    <marker>
      <token regexp="yes">mini|micro|semi|multi|anti|super|re|pro|sots|sobre|co</token>
    </marker>
    <token spacebefore="no">-</token>
  </pattern>
  <disambig action="replace">
    <wd pos="AQ0CN0"/>
  </disambig>
</rule>

<!-- Listed prefix directly followed by a hyphen: exempt the prefix from spell checking. -->
<rule id="prefixos_ortografia" name="ignora l'ortografia de prefixos correctes">
  <pattern>
    <marker>
      <token regexp="yes">kilo|mini|micro|semi|multi|anti|super|re|pro|sots|arxi|bes|plus|per|post|pre|pseudo|quasi|sobre|sub|ultra|vice|auto|greco|gal·lo|inter|intra</token>
    </marker>
    <token spacebefore="no">-</token>
  </pattern>
  <disambig action="ignore_spelling"/>
</rule>

<!-- Spaced hyphen followed, without space, by a listed suffix: the suffix is immunized. -->
<rule id="sufixos_ortografia" name="ignora l'ortografia de sufixos">
  <pattern>
    <token spacebefore="yes">-</token>
    <marker>
      <token regexp="yes" spacebefore="no">indre|ldre|ns|scs|scos|igs|ix|eix|é|ena|è|it|ert|ir|ar|er|re</token>
    </marker>
  </pattern>
  <disambig action="immunize"/>
</rule>

<!-- "pre" + coordinating conjunction + word starting with "post": no spell check on "pre". -->
<rule id="pre_post" name="prefix pre- post">
  <pattern>
    <marker>
      <token>pre</token>
    </marker>
    <token postag="CC"/>
    <token regexp="yes">post.*</token>
  </pattern>
  <disambig action="ignore_spelling"/>
</rule>

<!-- Same idea for "inter" / "intra" coordinated with a word starting with the other prefix. -->
<rulegroup id="intra_inter" name="prefix 
inter- intra-">
  <rule>
    <pattern>
      <marker>
        <token>inter</token>
      </marker>
      <token postag="CC"/>
      <token regexp="yes">intra.*</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
  <rule>
    <pattern>
      <marker>
        <token>intra</token>
      </marker>
      <token postag="CC"/>
      <token regexp="yes">inter.*</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
</rulegroup>

<!-- "salve" not followed by a comma or exclamation mark: remove the I reading. -->
<rule id="no_ij" name="no interjecció">
  <pattern>
    <marker>
      <token>salve</token>
    </marker>
    <token><exception regexp="yes">,|!</exception></token>
  </pattern>
  <disambig action="remove" postag="I"/>
</rule>

<!-- Token tagged VSS.* + relative/interrogative + the same first token repeated
     (<match no="0"/>): a LOC_CONJ reading is added to every token of the match. -->
<rulegroup id="sigui_qui_sigui" name="sigui qui sigui">
  <rule>
    <pattern>
      <token postag="VSS.*" postag_regexp="yes"/>
      <token regexp="yes">què|qui|quin|quins|quina|quines</token>
      <token><match no="0"/></token>
    </pattern>
    <disambig action="add">
      <wd pos="LOC_CONJ"/>
      <wd pos="LOC_CONJ"/>
      <wd pos="LOC_CONJ"/>
    </disambig>
  </rule>
  <!-- Four-token variant with an article before que / qui. -->
  <rule>
    <pattern>
      <token postag="VSS.*" postag_regexp="yes"/>
      <token regexp="yes">el|la|els|les</token>
      <token regexp="yes">que|qui</token>
      <token><match no="0"/></token>
    </pattern>
    <disambig action="add">
      <wd pos="LOC_CONJ"/>
      <wd pos="LOC_CONJ"/>
      <wd pos="LOC_CONJ"/>
      <wd pos="LOC_CONJ"/>
    </disambig>
  </rule>
</rulegroup>

<!-- Verb form of "pujar" + i/o/ni (tagged CC) + verb form of "baixar": filterall on the three tokens. -->
<rule id="pujar_i_baixar" name="pujar i baixar (verbs)">
  <pattern>
    <marker>
      <token postag="V.*" postag_regexp="yes" inflected="yes">pujar</token>
      <token postag="CC" regexp="yes">i|o|ni</token>
      <token postag="V.*" postag_regexp="yes" inflected="yes">baixar</token>
    </marker>
  </pattern>
  <disambig action="filterall"/>
</rule>

<!-- "van" as part of a surname. First rule: "van" + one of a case-sensitive list of names;
     both tokens are retagged NPCNSP0. -->
<rulegroup id="VAN_GOGH" name="van Gogh">
  <rule>
    <pattern>
      <marker>
        <token>van</token>
        <token 
regexp="yes">(?-i)Aartsen|Agt|Allen|Asperen|Baaren|Basten|Beethoven|Beinum|Belin|Bommel|Bree|Buren|Campen|Dam|Delden|der|Dijk|Dine|Dong|Dyck|Egmond|Eyck|Gaal|Goethem|Gogh|Halen|Hauwe|Hemel|Immersel|Kempen|Lier|Maldere|Marwijk|Mill|Morrison|Nieuwkerk|Nistelrooy|Otterloo|Persie|Petegem|Ragin|Rensburg|Rompuy|Schalkwyk|Someren|Vaart|Val|Valen|Van|Vliet|Vlijmen|Wassenaer</token>
      </marker>
    </pattern>
    <disambig action="replace">
      <wd pos="NPCNSP0"/>
      <wd pos="NPCNSP0"/>
    </disambig>
  </rule>

  <!-- "van" between two tokens matching \p{Lu}.+ (the second one not tagged V.N.*):
       only "van" is retagged NPCNSP0. -->
  <rule>
    <pattern>
      <token regexp="yes">\p{Lu}.+</token>
      <marker>
        <token>van</token>
      </marker>
      <token regexp="yes">\p{Lu}.+<exception postag="V.N.*" postag_regexp="yes"/></token>
    </pattern>
    <disambig action="replace">
      <wd pos="NPCNSP0"/>
    </disambig>
  </rule>

  <!-- Same with "den" / "der" between "van" and the following name. -->
  <rule>
    <pattern>
      <token regexp="yes">\p{Lu}.+</token>
      <marker>
        <token>van</token>
      </marker>
      <token regexp="yes">den|der</token>
      <token regexp="yes">\p{Lu}.+</token>
    </pattern>
    <disambig action="replace">
      <wd pos="NPCNSP0"/>
    </disambig>
  </rule>
</rulegroup>

<!-- "da" + one of a case-sensitive list of names: both tokens are retagged NPCNSP0. -->
<rule id="DA_VINCI" name="da Vinci">
  <pattern>
    <marker>
      <token>da</token>
      <token regexp="yes">(?-i)Messina|Cividale|Morte|Costa|Lingua|Língua|Gagliano|Palestrina|Perugia|Silva|Cunha|Gama|Viadana|Vinci|Ponte</token>
    </marker>
  </pattern>
  <disambig action="replace">
    <wd pos="NPCNSP0"/>
    <wd pos="NPCNSP0"/>
  </disambig>
</rule>

<!-- riu/costa/baixada/escala(es) with an NC reading before amunt / avall: filter to NC.* -->
<rule id="RIU_AMUNT" name="riu amunt/avall">
  <pattern>
    <marker>
      <token postag="NC.*" postag_regexp="yes" regexp="yes">riu|costa|baixada|escala|escales</token>
    </marker>
    <token regexp="yes">amunt|avall</token>
  </pattern>
  <disambig action="filter" postag="NC.*"/>
</rule>

<!-- "curt": first rule removes the RG reading when the previous token is not tagged
     V.[MSI].* or _GV_; the second rule applies when the previous token is not a determiner. -->
<rulegroup id="CURT" name="curt no adverbi">
  <rule>
    <pattern>
      <token><exception postag="V.[MSI].*|_GV_" postag_regexp="yes"/></token>
      <marker>
        <token>curt</token>
      </marker>
    </pattern>
    <disambig action="remove">
      <wd pos="RG"/>
    </disambig>
  </rule>
  <rule>
    <pattern>
      <token><exception postag="D.*" postag_regexp="yes"/></token>
      <marker>
        <token inflected="yes">curt</token>
      </marker>
    </pattern>
    <disambig 
action="remove" postag="N.*"/>
  </rule>
</rulegroup>

<!-- Contexts in which "darrera" receives the extra tag _allow_darrera. -->
<rulegroup id="darrera" name="permet 'darrera' en alguns casos">
  <!-- ordinal (AO.*) + coordinating conjunction + darrera -->
  <rule>
    <pattern>
      <token postag="AO.*" postag_regexp="yes"/>
      <token postag="CC"/>
      <marker>
        <token>darrera</token>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="_allow_darrera"/>
    </disambig>
  </rule>
  <!-- ordinal + "(" or "," + coordinating conjunction + darrera -->
  <rule>
    <pattern>
      <token postag="AO.*" postag_regexp="yes"/>
      <token regexp="yes">[(,]</token>
      <token postag="CC"/>
      <marker>
        <token>darrera</token>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="_allow_darrera"/>
    </disambig>
  </rule>
  <!-- "següent" or a token ending in ª, at most one token skipped, + conjunction + darrera -->
  <rule>
    <pattern>
      <token skip="1" regexp="yes">següent|.*ª</token>
      <token postag="CC"/>
      <marker>
        <token>darrera</token>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="_allow_darrera"/>
    </disambig>
  </rule>
  <!-- "," or "i" + darrera + abans / després / que -->
  <rule>
    <pattern>
      <token regexp="yes">,|i</token>
      <marker>
        <token>darrera</token>
      </marker>
      <token regexp="yes">abans|després|que</token>
    </pattern>
    <disambig action="add">
      <wd pos="_allow_darrera"/>
    </disambig>
  </rule>
</rulegroup>

<!-- Verb form of valer/pagar + determiner "la" + noun "pena": filterall on the three tokens. -->
<rule id="valer_la_pena" name="valer la pena">
  <pattern>
    <marker>
      <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">valer|pagar</token>
      <token postag="D.*" postag_regexp="yes">la</token>
      <token postag="N.*" postag_regexp="yes">pena</token>
    </marker>
  </pattern>
  <disambig action="filterall"/>
</rule>

<!-- Verb form of posar + "fi" (NCFS000) + "a" (SPS00): filterall on the three tokens. -->
<rule id="posar_fi_a" name="posar fi a">
  <pattern>
    <marker>
      <token postag="V.*" postag_regexp="yes" inflected="yes">posar</token>
      <token postag="NCFS000">fi</token>
      <token postag="SPS00">a</token>
    </marker>
  </pattern>
  <disambig action="filterall"/>
</rule>

<!-- Determiner + form of "tenor" with a noun reading: keep only the N.* readings. -->
<rule id="tenor_nom" name="tenor, soprano (nom no adj)">
  <pattern>
    <token postag="D.*" postag_regexp="yes"/>
    <marker>
      <token postag_regexp="yes" postag="N.*" inflected="yes">tenor</token>
      <!-- soprano -->
    </marker>
  </pattern>
  <disambig action="filter" postag="N.*"/>
</rule>

<!-- "fi" (NCFS000) + de + optional determiner + festa/any/temporada/curs/lliga: filterall on "fi". -->
<rule id="fi_nom" name="fi de festa (nom no adj)">
  <pattern>
    <marker>
      <token postag="NCFS000">fi</token>
    </marker>
    <token 
inflected="yes">de</token>
    <token min="0" postag="D.*" postag_regexp="yes"/>
    <token regexp="yes" inflected="yes">festa|any|temporada|curs|lliga</token>
  </pattern>
  <disambig action="filterall"/>
</rule>

<!-- Form of "deixar" + a + banda/part, or + de + banda: the last word is filtered to LOC_ADV. -->
<rulegroup id="deixar_a_part" name="deixar a part, a banda, de banda">
  <rule>
    <pattern>
      <token inflected="yes">deixar</token>
      <token>a</token>
      <marker>
        <token regexp="yes">banda|part</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="LOC_ADV"/>
  </rule>
  <rule>
    <pattern>
      <token inflected="yes">deixar</token>
      <token>de</token>
      <marker>
        <token>banda</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="LOC_ADV"/>
  </rule>
</rulegroup>

<!-- "deixa" / "deixes" + de + token tagged V.N.*: keep only the verb readings of the marked word. -->
<rule id="deixar_de_fer" name="deixar de fer">
  <pattern>
    <marker>
      <token regexp="yes">deixa|deixes</token>
    </marker>
    <token inflected="yes">de</token>
    <token postag="V.N.*" postag_regexp="yes"/>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>

<rulegroup id="fa_entre" name="fa entre">
  <!-- Known problem: "que es feia entre quatre" -->
  <!-- Form of "fer" tagged V.I[PI]3S0. followed by "entre": "entre" is filtered to SPS00. -->
  <rule>
    <pattern>
      <token postag="V.I[PI]3S0." postag_regexp="yes" inflected="yes">fer</token>
      <marker>
        <token>entre</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="SPS00"/>
  </rule>
  <!-- <rule> <pattern> <marker> <token postag="V.I[PI]3S0." postag_regexp="yes" inflected="yes">fer</token> </marker> <token>entre</token> </pattern> <disambig action="filter" postag="LOC_ADV"></disambig> </rule> -->
  <!-- "de" / "entre" followed by such a form of "fer": the verb gains a LOC_ADV reading. -->
  <rule>
    <pattern>
      <token regexp="yes">de|entre</token>
      <marker>
        <token postag="V.I[PI]3S0." postag_regexp="yes" inflected="yes">fer</token>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="LOC_ADV"/>
    </disambig>
  </rule>
</rulegroup>

<!-- <rulegroup id="fa_x_temps" name="fa tres anys, fa molt de temps"> <rule> <pattern> <token><exception postag="PI0CS000|NP..SP.*|&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception></token> <marker> <token postag="V.I[PI]3S0.?" 
postag_regexp="yes" inflected="yes" skip="12">fer<exception postag=".*LOC_ADV.*" postag_regexp="yes"/><exception scope="next" regexp="yes">que|en</exception><exception scope="next" postag="_PUNCT.*" postag_regexp="yes">,</exception><exception postag="V.*" postag_regexp="yes" scope="next"/></token> </marker> <token regexp="yes">segons?|minuts?|hor(a|es)|di(a|es)|setman(a|es)|mes|mesos|(tri|quadri|se)mestres?|anys?|lustres?|dècad(a|es)|segles?|mil·lennis?|moments?|instants?|temps|estona</token> </pattern> <disambig action="add"><wd pos="LOC_ADV"></wd></disambig> </rule> <rule> <pattern> <token><exception postag="PI0CS000|NP..SP.*|&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception></token> <token postag="V.I[PI]3S0.?" postag_regexp="yes" inflected="yes" skip="12">fer<exception scope="next" regexp="yes">que|en</exception><exception scope="next" postag="_PUNCT.*" postag_regexp="yes">,</exception><exception postag="V.*" postag_regexp="yes" scope="next"/></token> <marker> <token regexp="yes">segons?|minuts?|hor(a|es)|di(a|es)|setman(a|es)|mes|mesos|(tri|quadri|se)mestres?|anys?|lustres?|dècad(a|es)|segles?|mil·lennis?|moments?|instants?|temps|estona</token> </marker> </pattern> <disambig action="add"><wd pos="LOC_ADV"></wd></disambig> </rule> <rule> <pattern> <token><exception postag="NP..SP.*|&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception></token> <marker> <token postag="V.I[PI]3S0.?" postag_regexp="yes" inflected="yes" skip="1">fer<exception postag=".*LOC_ADV.*" postag_regexp="yes"/><exception scope="next" regexp="yes">,|que|en</exception><exception postag="V.*" postag_regexp="yes" scope="next"/></token> </marker> <token regexp="yes">molt|poc</token> </pattern> <disambig action="add"><wd pos="LOC_ADV"></wd></disambig> </rule> <rule> <pattern> <token><exception postag="NP..SP.*|&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception></token> <token postag="V.I[PI]3S0.?" 
postag_regexp="yes" inflected="yes" skip="1">fer<exception scope="next" regexp="yes">,|que|en</exception><exception postag="V.*" postag_regexp="yes" scope="next"/></token> <marker> <token regexp="yes">molt|poc</token> </marker> </pattern> <disambig action="add"><wd pos="LOC_ADV"></wd></disambig> </rule> </rulegroup> -->

<!-- Definite article + mot/paraula/terme/... + a token that has both a V.[IMS].* reading
     (not "pren") and an NC.* reading, followed by a verb or pronoun outside the exception
     list: the marked token is filtered to NC.* -->
<rulegroup id="la_paraula_x" name="la paraula x + verb">
  <rule>
    <pattern>
      <token postag="DA.*" postag_regexp="yes"/>
      <token inflected="yes" regexp="yes">mot|paraula|terme|expressió|vocable|nom|tipus|denominació</token>
      <marker>
        <and>
          <token postag="V.[IMS].*" postag_regexp="yes"><exception>pren</exception></token>
          <token postag="NC.*" postag_regexp="yes"/>
        </and>
      </marker>
      <token postag="V.[IMS].*|P0.*|PP.*" postag_regexp="yes"><exception regexp="yes">si|['-].+|jo|mi|tu|ella?|nosaltres|vosaltres|elle?s|vostès?|vós</exception></token>
    </pattern>
    <disambig action="filter" postag="NC.*"/>
  </rule>
</rulegroup>

<!-- "un penques" / "uns penques": "penques" is retagged as a masculine noun,
     NCMS000 after "un" and NCMP000 after "uns". -->
<rulegroup id="un_penques" name="un penques">
  <rule>
    <pattern>
      <token>un</token>
      <marker>
        <token>penques</token>
      </marker>
    </pattern>
    <disambig action="replace">
      <wd lemma="penques" pos="NCMS000"/>
    </disambig>
  </rule>
  <rule>
    <pattern>
      <token>uns</token>
      <marker>
        <token>penques</token>
      </marker>
    </pattern>
    <disambig action="replace">
      <wd lemma="penques" pos="NCMP000"/>
    </disambig>
  </rule>
</rulegroup>

<!-- "am" / "pm" after a clock time is retagged Y. -->
<rulegroup id="am_pm" name="am pm">
  <!-- hh : mm am|pm (time split into three tokens) -->
  <rule>
    <pattern>
      <token regexp="yes">[012]?\d</token>
      <token>:</token>
      <token regexp="yes">[0-5]?\d</token>
      <marker>
        <token regexp="yes">am|pm</token>
      </marker>
    </pattern>
    <disambig action="replace">
      <wd lemma="ampm" pos="Y"/>
    </disambig>
  </rule>
  <!-- hh am|pm -->
  <rule>
    <pattern>
      <token regexp="yes">[012]?\d</token>
      <marker>
        <token regexp="yes">am|pm</token>
      </marker>
    </pattern>
    <disambig action="replace">
      <wd lemma="ampm" pos="Y"/>
    </disambig>
  </rule>
  <!-- hh.mm as a single token, followed by am|pm|AM|PM (case-sensitive).
       NOTE(review): this rule's replacement lemma is "am_pm" while the two rules above
       use "ampm"; confirm which spelling is intended. -->
  <rule>
    <pattern>
      <token regexp="yes">[012]?\d\.[0-5]?\d</token>
      <marker>
        <token regexp="yes" case_sensitive="yes">am|pm|AM|PM</token>
      </marker>
    </pattern>
    <disambig action="replace"> 
<wd lemma="am_pm" pos="Y"/>
    </disambig>
  </rule>
</rulegroup>

<!-- Abbreviated units of measure after a number, "/" or "per": filter the unit to Y. -->
<rulegroup id="unitats" name="unitats de mesura abreviades">
  <rule>
    <pattern>
      <token regexp="yes">[1234567890., ]+|/|per<exception postag="_PUNCT.*" postag_regexp="yes"/></token>
      <marker>
        <token>ha</token>
      </marker>
      <token><exception postag="V.P.*(M|SF)." postag_regexp="yes"/></token>
      <!-- Exception: "2012 ha sigut" -->
    </pattern>
    <disambig action="filter" postag="Y"/>
  </rule>
  <rule>
    <pattern>
      <token regexp="yes">[h1234567890., ]+|/|per<exception postag="_PUNCT.*" postag_regexp="yes"/></token>
      <marker>
        <token>min</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="Y"/>
  </rule>
</rulegroup>

<!-- "entre" with a verb reading followed by en / a: keep only the verb readings.
     Two antipatterns block the rule: "en" + capitalised token (skip up to 20) + "i",
     and "en" + "a" + "i". -->
<rule id="ENTRE" name="entre (verb)">
  <antipattern>
    <token>en</token>
    <!-- personal name -->
    <token regexp="yes" skip="20">\p{Lu}.*</token>
    <token>i</token>
  </antipattern>
  <antipattern>
    <token>en</token>
    <token>a</token>
    <token>i</token>
  </antipattern>
  <pattern>
    <marker>
      <token postag="V.*" postag_regexp="yes">entre</token>
    </marker>
    <token regexp="yes">en|a</token>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>

<!-- Weak pronoun form (em, et, el, ...) + "casa" with a verb reading: keep only the verb readings. -->
<rule id="ES_CASA" name="es casa">
  <pattern>
    <token regexp="yes">em|et|el|ens|us|vos|els|es</token>
    <marker>
      <token postag="V.*" postag_regexp="yes">casa</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>

<!-- Noun or adjective + "/" + "es" with no spaces ("persona/es"): "es" is retagged NCCP000. -->
<rule id="barra_es" name="persona/es">
  <pattern>
    <token postag="[NA].*" postag_regexp="yes"/>
    <token spacebefore="no">/</token>
    <marker>
      <token spacebefore="no">es</token>
    </marker>
  </pattern>
  <disambig action="replace" postag="NCCP000"/>
</rule>

<!-- Common noun followed by a proper name ("el mont Or"). Three group-level antipatterns:
     el/els/les + "marca"; "es" + "cursa"; verb (V.M.*) + attached weak pronoun. -->
<rulegroup id="nom_seguitde_nompropi" name="nom seguit de nom propi: el mont Or">
  <antipattern>
    <token regexp="yes">el|els|les</token>
    <token>marca</token>
  </antipattern>
  <antipattern>
    <token>es</token>
    <token>cursa</token>
  </antipattern>
  <antipattern>
    <token postag="V.M.*" postag_regexp="yes"/>
    <token postag="&pronom_feble;" postag_regexp="yes" spacebefore="no"/>
  </antipattern>
  <rule>
    <pattern>
      <token inflected="yes" 
regexp="yes">&nom_seguitde_nompropi;</token>
      <marker>
        <and>
          <token postag="V.*" postag_regexp="yes" regexp="yes">\p{Lu}.+</token>
          <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
    <example type="untouched">Amb qui es <marker>casa</marker> Lídia?</example>
  </rule>

  <!-- The listed noun itself, when followed by a token matching \p{Lu}.+, is filtered to N.* -->
  <rule>
    <pattern>
      <marker>
        <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">&nom_seguitde_nompropi;</token>
      </marker>
      <token regexp="yes">\p{Lu}.+</token>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>

  <!-- same as the two rules above, but with an opening quotation mark in between -->
  <rule>
    <pattern>
      <token inflected="yes" regexp="yes">&nom_seguitde_nompropi;</token>
      <token regexp="yes">['"‘“«]</token>
      <marker>
        <and>
          <token postag="V.*" postag_regexp="yes" regexp="yes">\p{Lu}.+</token>
          <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <rule>
    <pattern>
      <marker>
        <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">&nom_seguitde_nompropi;</token>
      </marker>
      <token regexp="yes">['"‘“«]</token>
      <token regexp="yes">\p{Lu}.+</token>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
</rulegroup>

<!-- "figura" followed by noun/adjective + separator + noun/adjective with no spaces around
     the separator: the verb readings of "figura" are removed.
     The separator regexp is - / > <; the angle brackets are written as character references
     because a raw "less than" sign is not allowed in XML element text. -->
<rule id="figura" name="figura (nom)">
  <pattern>
    <marker>
      <token>figura</token>
    </marker>
    <token postag="N.*|A.*" postag_regexp="yes"/>
    <token spacebefore="no" regexp="yes">-|/|&gt;|&lt;</token>
    <token postag="N.*|A.*" postag_regexp="yes" spacebefore="no"/>
  </pattern>
  <disambig action="remove" postag="V.*"/>
</rule>

<!-- Words that are also proper names: after a plural determiner the NPCSG0V reading is removed. -->
<rulegroup id="excepcions_nomspropis" name="excepcions a noms propis">
  <rule>
    <pattern>
      <token postag="D...P." postag_regexp="yes"/>
      <marker>
        <token postag="NPCSG0V">Dolors</token>
      </marker>
    </pattern>
    <disambig action="remove">
      <wd pos="NPCSG0V"/>
    </disambig>
  </rule>
  <rule>
    <pattern>
      <token postag="D..FP." 
postag_regexp="yes"/> <marker> <token postag="NPCSG0V">Barraques</token> </marker> </pattern> <disambig action="remove"> <wd pos="NPCSG0V"/> </disambig> </rule> <rule> <pattern> <token postag="D..FP." postag_regexp="yes"/> <marker> <token postag="NPCSG0V">Figueres</token> </marker> </pattern> <disambig action="remove"> <wd pos="NPCSG0V"/> </disambig> </rule> <rule> <!-- adjectiu a principi de frase --> <pattern> <token postag="SENT_START"/> <marker> <token postag="A.*" postag_regexp="yes" inflected="yes">antic</token> </marker> </pattern> <disambig action="filterall"/> </rule> </rulegroup> <rule id="TOPONIMS_BALEARS_SON" name="topònims amb Son"> <pattern case_sensitive="yes"> <token>Son</token> <token regexp="yes" >Anglada|Armadans|Baco|Bacs|Bages|Balaguer|Baleu|Ballarí|Ballester|Bandoler|Banya|Banús|Baptista|Barba|Barbassa|Barbot|Barbut|Barca|Barceló|Bardissa|Barní|Barrabàs|Barraca|Barral|Barranco|Barraquer|Barrera|Barret|Barrigo|Barrina|Barriol|Bartomeu|Baró|Basca|Bascós|Basqueja|Bassa|Batle|Batlet|Batlum|Bauló|Bauçanet|Bauçà|Beco|Bejueta|Belard|Bell-lloc|Beltran|Bendinat|Benet|Bennàsser|Berenguer|Berga|Bergues|Bernadinet|Bernadàs|Bernadí|Bernadó|Bernat|Bessó|Bet|Betlem|Bibiloni|Biel|Bielí|Bieló|Binimelis|Binissalom|Bisbal|Bitzoc|Bià|Blai|Blanc|Blanco|Blanes|Blanquet|Blauet|Boga|Boi|Boiet|Boio|Boira|Boivàs|Bollaix|Bonafè|Bonany|Bonaventura|Bonavista|Bonet|Bono|Bontemps|Bordils|Bordoll|Boronat|Borràs|Borrós|Bosc|Boscana|Boscanet|Boscà|Bosquer|Boter|Bou|Bouet|Brau|Braó|Brindis|Brondo|Brotat|Bruc|Brull|Brun|Budella|Bufarell|Bugadelles|Buit|Bujosa|Bunyola|Burball|Burguera|Burgues|Burguet|Burixó|Buscall|Busqueret|Busquet|Ca|Cabaspre|Cabellut|Cabila|Cabot|Cabrer|Cabrisses|Cadell|Cagalls|Caimari|Caios|Calafat|Calafató|Calbet|Calco|Calders|Calderó|Calent|Caliu|Calletes|Calma|Calquet|Calussa|Calvó|Calàpet|Camaró|Caminal|Campanario|Campaner|Campanet|Campins|Campmar|Camps|Campà|Canals|Candeler|Canet|Canta|Cantagall|Cantó|Canyelles|Caparrot|Capellet|Capellot|Capellà|Capó|Cara
bassa|Caragol|Carbonell|Carbó|Card|Cardaix|Cardell|Cardona|Caret|Carles|Carreró|Carretó|Carrió|Carro|Cartet|Carulles|Carut|Casesnoves|Castanyer|Castell|Castelló|Català|Catalí|Catany|Catiu|Catiuet|Catlar|Catlaret|Catxo|Caulelles|Caules|Cavaller|Ceba|Cebrià|Cega|Celiano|Cella|Cellard|Cerdà|Cero|Cerol|Cervera|Cigala|Cilis|Cintes|Ciriet|Claret|Cledera|Cloques|Cloquis|Coador|Coc|Cocó|Codony|Coix|Colam|Coletes|Coll|Collell|Collet|Colom|Colomar|Colombars|Colomí|Comelles|Comes|Company|Comparet|Comte|Conill|Corb|Corcó|Corem|Corona|Coronell|Corpetí|Corró|Corso|Cortell|Cosina|Cosme|Cosmet|Cosmè|Costa|Costes|Cota|Cotoner|Cotoneret|Cotxer|Cotà|Coure|Coves|Credo|Creixell|Cremat|Crespí|Cresta|Creuades|Creuer|Creus|Cruu|Cuca|Cucullada|Cucuí|Cucó|Cudem|Cuines|Culdeporc|Culenrere|Cullera|Cuquellada|Curt|Cusseta|Cànaves|Còdol|Cós|Dagueta|Dalabau|Dalmau|Dameto|Danusset|Danús|Dardò|Daurat|Daviu|Deixobte|Deiò|Demés|Dico|Dimoni|Divertit|Doblons|Doctor|Dolç|Domingo|Domènec|Dotze|Drago|Draguet|Dragó|Duc|Dulei|Duran|Dureta|Durí|Fabiol|Fadrinet|Fadrí|Falconer|Falcó|Fam|Famioler|Fanals|Fang|Fango|Fangos|Farratge|Fava|Favar|Fe|Febrer|Fedelic|Feina|Felip|Feliu|Femella|Femenia|Ferragut|Ferrandell|Ferrando|Ferrer|Ferreret|Ferretjans|Ferriol|Ferrà|Fideu|Figuera|Figuerola|Fillol|Fillolet|Filmorat|Flor|Floriana|Fluixà|Fogueró|Fogó|Fondo|Fonoll|Fonollar|Font|Fony|Foradat|Forat|Forcall|Fornari|Fornaris|Forners|Fort|Fortuny|Fosquet|Fotja|Francesc|Francí|Françoi|Frare|Frau|Fred|Frigoleta|Frit|Frontera|Frígola|Fullana|Fullaneta|Fullaní|Fullós|Fum|Fuster|Fusteret|Gabellí|Gabriel|Gabriela|Gaieta|Gaià|Galceran|Galera|Galerí|Galiana|Galianeta|Galileu|Galiot|Gall|Gallard|Gallardí|Gallardó|Gallet|Gallina|Galta|Gamet|Ganxo|Ganxó|Ganyada|Garbeta|Garbí|Garcia|Garcies|Garcietes|Gardana|Garivai|Garreta|Garriga|Garrit|Garrot|Garrova|Garrover|Garí|Gassó|Gat|Geant|Gelabert|Gelat|Gener|Genet|Genovoi|Genovès|Genís|Gibert|Gil|Gilet|Gili|Ginard|Ginyol|Godall|Godí|Gofis|Gorgut|Gornals|Gorreu|Gorries|Gorrió|Gotlet|Gradolí|Gr
an|Granada|Grandia|Granot|Gras|Grec|Gregori|Gri|Grimalt|Groc|Grua|Gual|Gualet|Gualí|Guardiola|Guaret|Guarners|Guarnesset|Guedet|Guerau|Guerauet|Gueraueta|Guerrer|Gueu|Gueuxo|Guida|Guillem|Guillemet|Guillemó|Guillot|Guineu|Guiscafrè|Guitard|Guixa|Gustí|Güells|Jan|Jardí|Jaume|Jaumell|Jaumet|Jeroni|Joan|Jofre|Joi|Jonquet|Jorbo|Jordi|Jordà|Josep|Jover|Jovera|Juaneda|Juevert|Julià|Juny|Lau|Llabià|Llagosta|Llampaies|Llaneres|Llarg|Llaura|Llaüt|Llebre|Llebrers|Lledonet|Lledó|Lleganya|Lleig|Llendera|Llençolot|Lleu|Lleó|Llinars|Lliteres|Llobera|Llobet|Llodranet|Llodrà|Llompard|Llompardet|Llompartet|Llorenç|Llorençó|Lloret|Lloriguera|Lloringo|Llorongo|Llova|Llubinet|Llubí|Lluc|Llucià|Lluent|Llull|Llunes|Lluny|Lluquet|Lluís|Llàtzer|Loco|Làdico|Mac|Macip|Macià|Maga|Maganet|Magdalè|Magina|Magraner|Magre|Magí|Maians|Maig|Maimó|Maina|Maixella|Major|Malcuit|Malferit|Mallol|Mallolí|Manenta|Mannà|Manrè|Manuel|Manyes|Manyo|Mar-i-sol|Marc|Marge|Marget|Marill|Marimon|Marinet|Marionet|Marió|Marquet|Marquès|Marranet|Marrano|Marroig|Marron|Martorell|Martorellet|Martí|Marçal|Marí|Mas|Mascaró|Mascord|Maset|Masnou|Massaguany|Massot|Matamoros|Matet|Mateu|Mateuet|Maties|Maçanet|Maó|Mel|Melero|Mengol|Menut|Mercadal|Mercer|Merlet|Mesquida|Mesquidassa|Mesquideta|Messeguer|Metge|Mevet|Mico|Micola|Mieres|Milana|Millora|Miquel|Miquelet|Mir|Miralles|Miramar|Miret|Miró|Misericòrdia|Misser|Misseret|Misseró|Mitjanada|Moio|Moix|Moixeta|Moià|Moja|Molines|Moll|Moló|Monar|Monedero|Moner|Monget|Monjo|Montserrat|Moraduix|Moragues|Moranta|Morei|Moreions|Morell|Morlanet|Morlà|Moro|Morral|Morro|Moscard|Mosquer|Mosson|Mossènyer|Muda|Mulet|Muletó|Munar|Munaret|Muntaner|Murta|Murtó|Mut|Mutet|Màtger|Móra|Nadal|Nadaler|Nasi|Nasvermell|Navata|Naveta|Nebot|Negre|Nero|Neula|Nicolau|Nicolauet|Niell|Ninetes|Nis|Niu|Nivorra|Nofret|Noguera|Noguereta|Nosa|Not|Nou|Noviet|Nét|Paborde|Pacs|Palanca|Paler|Palmera|Palou|Palouet|Pancuit|Panerer|Panxeta|Paparra|Paparreta|Papeleta|Paquet|Parc|Parfunci|Parragó|Parric|Parrol|Pascol|Past
era|Pastereta|Pastor|Patró|Patxeco|Pau|Paulo|Pebre|Peixet|Peladí|Pelai|Pelat|Pelea|Pellisser|Pelut|Penaflor|Penjoll|Pentinador|Pentinat|Penya|Perdiu|Perdiuet|Perdut|Pere|Perellonet|Perelló|Peretó|Pericasses|Pericassó|Pericàs|Perllonga|Peroi|Perot|Perotí|Perpinyà|Perro|Perroquet|Perxa|Pesca|Petit|Peu|Pi|Picard|Picornell|Picó|Pieres|Pijolí|Pillo|Pinet|Pinta|Pinya|Piol|Piris|Pisanet|Pistola|Pisà|Piulo|Pixedis|Plaent|Planes|Plata|Poca-sang|Pocapalla|Pocos|Poder|Poi|Pol|Pollencí|Poma|Pomar|Poncet|Pont-i-Vic|Pont|Pontet|Pontiró|Ponç|Poquet|Porc|Porcell|Porquer|Porrassa|Porret|Porro|Porroner|Portell|Pou|Pouet|Poufondo|Prestfet|Prim|Primer|Primet|Proenç|Pruna|Príam|Puig|Puigcerver|Puigdorfila|Pujau|Pujol|Pujolet|Pujolí|Pulla|Punta|Punyal|Puput|Pur|Putxet|Puça|Pèl|Quart|Quartana|Quartera|Quartinel·lo|Quel|Quelet|Quelles|Queló|Quet|Quetoi|Quillo|Quint|Rabassa|Rafalasso|Rafel|Rafelet|Rafeló|Ramell|Ramions|Ramis|Ramon|Ramona|Ramonell|Ramonet|Rapinya|Ras|Rasca|Rata|Ratet|Ratolí|Ravenet|Real|Reboll|Rebostet|Redó|Regaladet|Regalat|Rei|Reig|Reiners|Reixac|Reixart|Remei|Renego|Rengo|Renou|Reus|Revell|Reviscolat|Reviu|Rialles|Ribes|Ribot|Ribotet|Ric|Riera|Rigo|Ripoll|Riutort|Robat|Roc|Roca|Roger|Roig|Romaní|Romeguer|Romeguera|Roquer|Roqueta|Ros|Rosa|Roses|Roseta|Rossell|Rosselló|Rossinyol|Rubí|Rumbo|Rutlan|Sabater|Sadoll|Sagí|Sala|Salamisses|Salamó|Salat|Sales|Saleta|Saletes|Salom|Salort|Salvanet|Salvat|Salí|Samar|Samarra|Samates|Sang|Santandreu|Santet|Santjoan|Santmartí|Santos|Santpol|Santpolí|Sanutges|Sanxo|Sanç-i-Serra|Sanç|Sard|Sardina|Sastre|Saura|Sauret|Sebel·lí|Sec|Segon|Seguerut|Seguinot|Seguí|Seldat|Sempenta|Senyor|Serení|Seriol|Serra|Serralta|Serrano|Serret|Servera|Serveret|Servereta|Setrill|Sifre|Simonet|Simó|Sineu|Singala|Sitges|Siurana|Sivineta|Socarrell|Socies|Soldat|Soler|Sospirat|Suau|Sunyer|Sureda|Suredeta|Sèmola|Sèu|Sóller|Taixaquet|Talent|Taltavull|Tambor|Tano|Tarascó|Tarí|Tell|Tellet|Tema|Temet|Tenasso|Terrassa|Terrola|Tetè|Teuler|Tica|Tiranet|Tirano|Tió|Todorí|To
ells|Tomaset|Tomeu|Tomàs|Tomàtiga|Toni|Toniet|Tord|Torners|Torra|Torradet|Torranet|Torrat|Torrella|Torrelleta|Torrents|Torres|Totsol|Tou|Touet|Tous|Tovell|Traginer|Tranquil|Trencaferros|Trenta-dos|Tretze|Treufoc|Triall|Trilles|Tril·lo|Trit|Trobat|Trompa|Tronxo|Truc|Truitada|Trémol|Tugores|Turturell|Tut|Tàpera|Térmens|Vador|Valentí|Valenç|Vallespir|Vallets|Vallfogó|Vallori|Valls|Vaquer|Vaumeta|Vecete|Vela|Vell|Vencís|Venrell|Vent|Ventura|Veny|Verd|Verdera|Verdereta|Verdo|Verger|Verinet|Vermell|Verro|Verí|Vespa|Vetla|Vic|Vicent|Vida|Vidal|Vigili|Viguet|Vila|Vilar|Vilardell|Viles|Vinater|Viola|Violí|Viquet|Virgo|Viroto|Viscos|Vispó|Vistós|Vitamina|Vives|Vivets|Vivot|Vivó|Xalingo|Xantre|Xapellí|Xapeta|Xema|Xemena|Xeremia|Xerubinet|Xerubí|Xeta|Xeverí|Xic|Xigala|Ximelis|Xina|Xona|Xorc|Xoric|Xoriguer|Xormes|Xoro|Xot|Xota|Xotano</token> </pattern> <disambig action="add"> <wd pos="NPMSG00"/> <wd pos="NPMSG00"/> </disambig> </rule> <rule id="han_donat" name="Han donat (verb)"> <pattern> <marker> <token postag="VAIP3P00">han</token> </marker> <token postag="V.P..SM." postag_regexp="yes"/> </pattern> <disambig action="filter" postag="VAIP3P00"/> </rule> <rulegroup id="Nom_propi" name="noms propis"> <antipattern> <token postag="V.M.*" postag_regexp="yes"/> <token postag="&pronom_feble;" postag_regexp="yes" spacebefore="no"/> </antipattern> <rule> <!-- exception: Podem dir --> <pattern> <marker> <token postag="VMIP1P00">podem</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="VMIP1P00"/> </rule> <rule> <!-- a Barcelona: no és l'equip de futbol --> <pattern> <token postag="SPS00|LOC_PREP" postag_regexp="yes"/> <marker> <and> <token postag="NP..G.." postag_regexp="yes"/> <token postag="NP..O.." 
postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="NP..O.."/> </rule> <rule> <pattern> <token postag="SENT_START"/> <token min="0" max="3" regexp="yes">[¿?¡!"'‘“«»—–:\-]</token> <marker> <token regexp="yes">Useu|Mata</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <!-- improbable NP --> <pattern> <token postag="SENT_START"/> <token min="0" max="3" regexp="yes">[¿?¡!"'‘“«»—–:\-]</token> <marker> <and> <token postag="NP.*" postag_regexp="yes"/> <token postag="A.*|NC.*|V.[IM].*" postag_regexp="yes"><exception postag="VMIP1S0B"/><exception regexp="yes">Poe|Vogue|Arnau</exception></token> </and> </marker> <token>,</token> </pattern> <disambig action="remove" postag="NP.*"/> </rule> <rule> <!-- improbable NP --> <pattern> <token postag="SENT_START"/> <token min="0" max="3" regexp="yes">[¿?¡!"'‘“«»—–:\-]</token> <marker> <and> <token postag="NP.*" postag_regexp="yes"/> <token postag="A.*|NC.*|V.[IM].*" postag_regexp="yes"><exception postag="VMIP1S0B"/><exception regexp="yes">Poe|Gaudí</exception></token> </and> </marker> <token postag="A.*|V.P.*" postag_regexp="yes"><exception regexp="yes">\p{Lu}.*</exception><exception postag="VA.*" postag_regexp="yes"/></token> </pattern> <disambig action="remove" postag="NP.*"/> </rule> <rule> <pattern> <token><exception postag="SENT_START"/><exception regexp="yes">[¿?¡!"'‘“«»—–:\-]</exception></token> <marker> <token postag="NP.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="NP.*"/> </rule> <rule> <!-- Lluís Nadal persegueix --> <pattern> <token postag="SENT_START"/> <marker> <token postag="NP.*" postag_regexp="yes" skip="3"><exception postag="RG|CC|DD.*" postag_regexp="yes"/><exception scope="next" postag="V.P.*|SPS00|D[AI].*|C.*" postag_regexp="yes"/><exception scope="next" postag="P.*" postag_regexp="yes" regexp="yes">['-].+</exception></token> </marker> <token postag="V.[MSI].3.*" postag_regexp="yes"/> </pattern> <disambig 
action="filter" postag="NP.*"/> </rule> <rule> <!-- Lluís Nadal exigeix --> <pattern> <token regexp="yes">[¿?¡!"'‘“«»—–:\-]</token> <marker> <token postag="NP.*" postag_regexp="yes" skip="3"><exception postag="A.*" postag_regexp="yes"/><exception scope="next" postag="V.P.*" postag_regexp="yes"/><exception scope="next" postag="P.*" postag_regexp="yes" regexp="yes">['-].+</exception></token> </marker> <token postag="V.[MSI].3.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="NP.*"/> </rule> <rule id="senyor_senyora" name="senyor -a"> <pattern> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">duc|senyor|doctor|director|rector|amic</token> </marker> <token regexp="yes">\p{Lu}.*</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule id="sant" name="sant"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="AQ.*" postag_regexp="yes" inflected="yes">sant</token> <token postag="NP..SP.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="unify"/> </rule> <rule id="el_nompropi" name="el + nom propi"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="DA.*" postag_regexp="yes" inflected="yes">el</token> <token postag="NP..SP.*" postag_regexp="yes"><exception postag="NP..G.*" postag_regexp="yes"/></token> </unify> </pattern> <disambig action="unify"/> </rule> <rule id="nompropi_ordinal" name="nom propi + ordinal: Pere III"> <pattern> <marker> <token postag="NP.S.*" postag_regexp="yes"/> </marker> <token postag="AO.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="NP.S.*"/> </rule> </rulegroup> <rulegroup id="esser" name="ésser: nom no verb"> <rule> <pattern> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes">ésser|esser|ser</token> </marker> <token postag_regexp="yes" postag="&pronom_feble;" spacebefore="no"/> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <antipattern> <token inflected="yes" 
regexp="yes">deixar|haver</token> <token>d'</token> <token>ésser</token> </antipattern> <antipattern> <token inflected="yes" regexp="yes">voler|deure</token> <token>ésser</token> </antipattern> <pattern> <marker> <token postag="N.*" postag_regexp="yes" regexp="yes">ésser|esser</token> </marker> <token regexp="yes" inflected="yes">humà|viu|vivent|suprem</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <!-- incloent-hi errors de concordança --> <pattern> <marker> <token postag="D[^N].*" postag_regexp="yes"><exception>en</exception></token> <token postag="NCMS000" regexp="yes">ésser|esser</token> </marker> </pattern> <disambig action="filterall"/> </rule> </rulegroup> <rule id="tret" name="tret: no preposició"> <pattern> <token postag="D[AID].MS." postag_regexp="yes"/> <marker> <token postag="N.*" postag_regexp="yes">tret</token> </marker> </pattern> <disambig action="filter" postag="N.*|V.P.*"/> </rule> <rulegroup id="interjeccions" name="interjeccions"> <rule> <pattern> <marker> <token postag="V.*" postag_regexp="yes">ha</token> </marker> <token inflected="yes">de</token> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <antipattern> <token>hi</token> <token>ha</token> </antipattern> <pattern> <marker> <token regexp="yes">h[ea]</token> </marker> <token>,</token> <token><match no="0"/></token> </pattern> <disambig action="replace" postag="I"/> </rule> <rule> <antipattern> <token>hi</token> <token>ha</token> </antipattern> <pattern> <token regexp="yes">h[ea]</token> <token>,</token> <marker> <token><match no="0"/></token> </marker> </pattern> <disambig action="replace" postag="I"/> </rule> <rule> <pattern> <token><exception>hi</exception></token> <marker> <token regexp="yes">h[ea]</token> </marker> <token>!</token> </pattern> <disambig action="replace" postag="I"/> </rule> <rule> <antipattern> <token>hi</token> <token>ha</token> <token>,</token> <marker> <token>ha</token> </marker> </antipattern> <pattern> <token>ha</token> 
<token>,</token> <marker> <token>ha</token> </marker> </pattern> <disambig action="replace" postag="I"/> </rule> <rule> <pattern> <marker> <token>la</token> </marker> <token regexp="yes">que|què|qui|qual</token> </pattern> <disambig action="filter" postag="DA.*"/> </rule> <rule> <pattern> <marker> <token skip="3">rai</token> </marker> <token>!</token> </pattern> <disambig action="filter" postag="I"/> </rule> <rule> <pattern> <token>som</token> <token>-hi</token> </pattern> <disambig action="replace"> <wd pos="I"/> <wd pos="I"/> </disambig> </rule> <rule> <pattern> <token>tant</token> <token regexp="yes">me|te|li</token> <token regexp="yes">fa|feia</token> </pattern> <disambig action="replace"> <wd pos="I"/> <wd pos="I"/> <wd pos="I"/> </disambig> </rule> <rule> <pattern> <token>tant</token> <token>se</token> <token>val</token> </pattern> <disambig action="replace"> <wd pos="I"/> <wd pos="I"/> <wd pos="I"/> </disambig> </rule> <rule> <pattern> <token>valga</token> <token spacebefore="no">'m</token> </pattern> <disambig action="replace"> <wd pos="I"/> <wd pos="I"/> </disambig> </rule> <rule> <pattern> <marker> <token>maleït</token> <token>siga</token> </marker> <token>!</token> </pattern> <disambig action="replace"> <wd pos="I"/> <wd pos="I"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START|_PUNCT.*|C.*" postag_regexp="yes"/> <marker> <token>tant</token> <token>de</token> <token>bo</token> </marker> </pattern> <disambig action="replace"> <wd lemma="tant_de_bo" pos="I"/> <wd lemma="tant_de_bo" pos="I"/> <wd lemma="tant_de_bo" pos="I"/> </disambig> </rule> <rule> <pattern> <marker> <token min="3">ha</token> </marker> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern> <marker> <token min="3">hi</token> </marker> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern> <marker> <token min="3">he</token> </marker> </pattern> <disambig action="immunize"/> </rule> </rulegroup> <rulegroup id="vet_aci" name="vet/veus ací"> <rule> 
<pattern> <marker> <token regexp="yes">vet|heus</token> </marker> <token regexp="yes">ací|aquí</token> </pattern> <disambig action="add"> <wd lemma="vet" pos="VMM02S00"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">vet|heus</token> </marker> <token postag="P.*" postag_regexp="yes" regexp="yes">-(ho|lo|la|los|les|ne|me)</token> <token regexp="yes">ací|aquí</token> </pattern> <disambig action="add"> <wd lemma="vet" pos="VMM02S00"/> </disambig> </rule> <rule> <pattern> <marker> <token>ve</token> </marker> <token postag="P.*" postag_regexp="yes">-t</token> <token postag="P.*" postag_regexp="yes">'ho</token> <token regexp="yes">ací|aquí</token> </pattern> <disambig action="add"> <wd lemma="vet" pos="VMM02S00"/> </disambig> </rule> <!-- Altres combinacions són col·loquials: ve-li aquí --> </rulegroup> <rulegroup id="no_se_quin" name="no sé quin"> <rule> <pattern> <!--<token postag="SPS00|LOC_PREP" postag_regexp="yes"/>--> <token>no</token> <token min="0" regexp="yes">se|es</token> <marker> <token inflected="yes">saber</token> </marker> <token postag="RG|LOC_ADV|SPS00" postag_regexp="yes" min="0" max="4"/> <token regexp="yes" inflected="yes">què|qui|quin|quan|quant|on|com</token> </pattern> <disambig action="add"> <wd pos="_loc_nosequi"/> </disambig> </rule> <rule> <pattern> <token>no</token> <marker> <token skip="1">sé</token> </marker> <token regexp="yes">qui|quin|quins|quina|quines|on|com|què|quan|quant|quanta|quants|quantes</token> </pattern> <disambig action="add"> <wd pos="_loc_nosequi"/> </disambig> </rule> <rule> <pattern> <token>no</token> <marker> <token>sé</token> </marker> <token regexp="yes" min="0" max="4">gaire|molt|bé|ben|el</token> <token regexp="yes">qui|quin|quins|quina|quines|on|com|què|quan|quant|quanta|quants|quantes</token> </pattern> <disambig action="add"> <wd pos="_loc_nosequi"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">ves|vés|aneu</token> </marker> <token>a</token> <token>saber</token> <token 
regexp="yes">qui|quin|quins|quina|quines|on|com|què|quan|quant|quants|quanta|quantes</token> </pattern> <disambig action="add"> <wd pos="_loc_nosequi"/> </disambig> </rule> </rulegroup> <rule id="diguem_ne" name="diguem-ne"> <pattern> <marker> <token>diguem</token> </marker> <token>-ne</token> </pattern> <disambig action="add"> <wd pos="_loc_nosequi"/> </disambig> </rule> <rulegroup id="nDet" name="no Determinant"> <!-- paraules comunes que no solen ser determinants gairebé mai --> <rule> <pattern> <token regexp="yes" inflected="yes">tan|tant|força|molt|el</token> <marker> <token regexp="yes">diversos|diverses|diferents</token> </marker> </pattern> <disambig action="remove" postag="D.*"/> </rule> <rule> <pattern> <marker> <token regexp="yes">diversos|diverses|diferents</token> </marker> <token><exception postag="NC.*|AQ.*" postag_regexp="yes"/></token> </pattern> <disambig action="remove" postag="D.*"/> </rule> <rule> <antipattern> <token regexp="yes">a|de|d'|amb|per|en|devers|envers</token> <token regexp="yes">es|s'</token> </antipattern> <antipattern> <token regexp="yes">sobre|dins|dintre<exception scope="previous">a</exception></token> <token regexp="yes">es|s'</token> </antipattern> <pattern> <marker> <token regexp="yes">es|s'</token> </marker> </pattern> <disambig> <match no="1" postag_regexp="yes" postag="[^D].*"/> </disambig> </rule> <rule> <!-- però: amb so ganivet --> <pattern> <marker> <token>so</token> </marker> </pattern> <disambig> <match no="1" postag_regexp="yes" postag="[^D].*"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">platja|cala|carrer|avinguda|carretera</token> <marker> <token>sa</token> </marker> <token regexp="yes">\p{Lu}.*</token> </pattern> <disambig action="filter" postag="DA0FS0"/> </rule> <rule> <pattern> <marker> <token>sa</token> </marker> </pattern> <disambig action="remove"> <wd pos="DA0FS0"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">en</token> </marker> <token><exception 
regexp="yes">\p{Lu}\p{Ll}*</exception></token> </pattern> <disambig> <match no="1" postag_regexp="yes" postag="[^D].*"/> </disambig> </rule> <rule> <!-- no usem la interpretació de determinant --> <pattern> <token regexp="yes">[nv]ostres?</token> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> <rule> <pattern> <marker> <token>eixos</token> </marker> <token>cartesians</token> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> <rule> <pattern> <marker> <token>eixos</token> </marker> <token><exception postag="N.MP.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> </rulegroup> <rule id="excepcions_preposicions" name="entre a; entre en"> <pattern> <marker> <token>entre</token> </marker> <token regexp="yes">a|en</token> <token postag="D.*|V.N.*|A.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.*"/> <example type="untouched"><marker>Entre</marker> en Pep i en Joan.</example> </rule> <rulegroup id="preposicions" name="preposicions: sobre, contra, en"> <rule> <pattern> <token regexp="yes" inflected="yes">.*caure|convertir</token> <marker> <token postag="SPS00">en</token> </marker> </pattern> <disambig action="filter" postag="SPS00"/> </rule> <rule> <pattern> <token><exception regexp="yes">em|et|li|ens|us|vos|els|el|a|de|per|que</exception></token> <marker> <token postag="SPS00">sobre</token> </marker> <token postag="D.*|NP.*|NC.[PN].*" postag_regexp="yes"><exception>s'</exception></token> </pattern> <disambig action="filter" postag="SPS00"/> <example type="untouched">Que no li <marker>sobre</marker> res.</example> </rule> <rule> <pattern> <token postag="N.*|_GV_|V.*|_GN.*" postag_regexp="yes"/> <marker> <token postag="[VN].*" postag_regexp="yes" regexp="yes">sobre|entre</token> </marker> </pattern> <disambig action="filter" postag="[^VN].*"/> </rule> <rule> <pattern> <token>un</token> <marker> <token postag="SPS00">sobre</token> </marker> <token postag="[NDP].*" 
postag_regexp="yes"/> </pattern> <disambig action="filter" postag="SPS00"/> </rule> <rule> <pattern> <marker> <token>contra</token> </marker> <token postag="D.*|NC.*|_GN.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="SPS00|.*LOC_ADV.*"/> </rule> <rule> <pattern> <token><exception postag="D..MS." postag_regexp="yes"/></token> <marker> <token>dalt</token> </marker> <token regexp="yes">de|d'</token> </pattern> <disambig action="remove" postag="NCMS000"/> </rule> </rulegroup> <rule id="ara_no_conjuncio" name="ara (adverbi no conjunció)"> <!-- ¿És necessari en algun cas? --> <pattern> <marker> <token postag="RG">ara<exception postag=".*_GN_.*" postag_regexp="yes"/></token> </marker> <token><exception regexp="yes">bé|,</exception></token> </pattern> <disambig action="remove" postag="CC"/> </rule> <rule id="vol_noverb" name="vol no verb"> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">vols?</token> <token postag="V.*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">xàrter|charter|comercials?|transoceànics?|privats?|freqüents?</token> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule id="te_substantiu" name="te/té (amb error) + substantiu"> <antipattern> <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">['-].*</exception></token> <token>te</token> </antipattern> <antipattern> <token>te</token> <token inflected="yes" regexp="yes">voler|deure|poder|preferir|desitjar</token> <token postag="V.N.*" postag_regexp="yes"/> </antipattern> <pattern> <token>te</token> <marker> <token postag="NC.*" postag_regexp="yes"><exception regexp="yes">dius?|tornes|fan|don</exception></token> </marker> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule id="tant" name="tant (no nom)"> <pattern> <token><exception regexp="yes">el|un</exception></token> <marker> <token>tant</token> </marker> </pattern> <disambig action="remove" postag="NCMS000"/> </rule> <rule id="vol" name="vol 
no nom"> <pattern> <token><exception postag="D.*|A.*|V.P.*|SENT_START|SPS00|.*LOC_.*|PX.*" postag_regexp="yes"/><exception regexp="yes" inflected="yes">haver|tenir</exception></token> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">vols?</token> <token postag="V.*" postag_regexp="yes"/> </and> </marker> <token><exception regexp="yes">de|d'</exception></token> </pattern> <disambig action="remove" postag="N.*"/> <example type="untouched"><marker>Vols</marker> transoceànics</example> <example type="untouched">de <marker>vols</marker> transoceànics</example> <example type="untouched">Encara hi ha <marker>vols</marker> avui?</example> </rule> <rule id="anada" name="anada (nom)"> <pattern> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes">anada</token> </marker> <token postag="CC"/> <token regexp="yes" inflected="yes">tornada|vinguda</token> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="carboni" name="carboni / mescla (no verb)"> <rule> <pattern> <token inflected="yes">carboni</token> <token spacebefore="no">-</token> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule> <pattern> <token>-</token> <token inflected="yes" spacebefore="no">carboni</token> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule> <pattern> <marker> <token inflected="yes" regexp="yes">mescla|barreja</token> </marker> <token/> <token spacebefore="no">-</token> <token spacebefore="no"/> </pattern> <disambig action="remove" postag="V.*"/> </rule> </rulegroup> <rule id="es_la" name="prevenció en error: es/és la"> <pattern> <token>es</token> <marker> <token postag="DA.*" postag_regexp="yes"/> </marker> <token postag="[NA].*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="P.*"/> </rule> <rule id="donat_cas" name="cas (masc sg)"> <pattern> <token postag="V.P..SM." 
postag_regexp="yes"/> <marker> <token postag="NCMS000">cas</token> </marker> </pattern> <disambig action="filterall"/> </rule> <rule id="el_doble" name="el doble (no verb)"> <pattern> <token postag="RG"/> <token>el</token> <marker> <token postag="V.*" postag_regexp="yes">doble</token> </marker> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rulegroup id="notes_musicals" name="notes musicals (nom)"> <rule> <pattern> <marker> <token regexp="yes">do|re|mi|fa|sol|si</token> </marker> <token regexp="yes">menor|major|sostingut|bemoll|diesi|becaire</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <marker> <token>la</token> </marker> <token regexp="yes">sostingut|bemoll|diesi|becaire</token> </pattern> <disambig action="filter" postag="N.*"/> <example type="untouched">És <marker>la</marker> major concentració mundial de cotxes.</example> </rule> </rulegroup> <rulegroup id="molt_noparticipi" name="molt no participi"> <rule> <pattern> <token>hi</token> <token min="0" max="3" inflected="yes" regexp="yes">poder|anar|a|de|voler|deure</token> <token min="1" max="2" inflected="yes">haver</token> <marker> <token inflected="yes">molt</token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <pattern> <token>hi</token> <token inflected="yes">haver</token> <token min="0" max="3" inflected="yes" regexp="yes">poder|anar|a|de|voler|deure</token> <token min="1" max="2" inflected="yes">haver</token> <marker> <token inflected="yes">molt</token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <pattern> <token inflected="yes">ser</token> <marker> <token inflected="yes">molt</token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <pattern> <marker> <token inflected="yes">molt</token> </marker> <token>ben</token> <token postag="V.P.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <pattern> <unify> <feature 
id="genere"/> <feature id="nombre"/> <marker> <token inflected="yes">molt</token> </marker> <token postag="[NA].*" postag_regexp="yes"/> </unify> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <!-- TODO: cafè molt, etc. --> <rule> <pattern> <token regexp="yes">l'|els|les|n'</token> <token inflected="yes">haver</token> <marker> <token postag="V.P.*" postag_regexp="yes" regexp="yes">molt|molts|molta|moltes</token> </marker> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <token inflected="yes">haver</token> <marker> <token postag="V.P.*" postag_regexp="yes">molt</token> </marker> <token postag="D.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <token postag="[DPR].*" postag_regexp="yes" regexp="yes">molt|molts|molta|moltes</token> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> </rulegroup> <rule id="molt_adverbi" name="molt (adverbi)"> <pattern> <marker> <token postag="RG.*" postag_regexp="yes">molt</token> </marker> <token postag="A.*|RG|LOC_ADV" postag_regexp="yes"><exception postag="A.*|RG|LOC_ADV|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/></token> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule id="fer_nVerbConjug" name="no sol ser verb conjugat: fer"> <!-- paraules comunes que no solen ser verb gairebé mai --> <pattern> <marker> <token regexp="yes">fer|refer</token> </marker> </pattern> <disambig action="filter" postag="V.N.*|AQ.*"/> </rule> <rulegroup id="PrimPersPresSing" name="verb primera persona present singular "> <rule> <antipattern> <token postag="D..MS." postag_regexp="yes"/> <token>jo</token> </antipattern> <antipattern> <token postag="V...1S.." postag_regexp="yes"/> <token>jo</token> </antipattern> <pattern> <token>jo</token> <marker> <token postag="VM[IS]P1S0.?" postag_regexp="yes"><exception regexp="yes">fem|inquiet|sol|com|despert|intern|igual|millor|cap|gran</exception><exception postag="V..I1S0.?" 
postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="V.[IS]P1S0.?"/> </rule> <rule id="improbable_verb_balear" name="verb balear improbable"> <pattern> <marker> <token postag="V.*B" postag_regexp="yes" regexp="yes">subsol|pis|xiv|plaç|estàs|après|test|remei|estiu|feren|fem|cens|som|guaret|sent</token> </marker> </pattern> <disambig action="filter" postag=".*[^B]"/> </rule> <rule id="improbable_verb_balear2" name="verb balear improbable"> <pattern> <token regexp="yes">es|és</token> <marker> <and> <token postag="VMIP1S0B"/> <token postag="[NA].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="VMIP1S0B"/> </disambig> </rule> <!-- <rule> <pattern> <token>jo</token> <token postag="PP.*|P0.*" postag_regexp="yes" /> <marker> <token postag="VM[IS]P1S0" postag_regexp="yes" /> </marker> </pattern> <disambig action="filter" postag="V.[IS]P1S0" /> </rule> <rule> <pattern> <token>jo</token> <token postag="PP.*|P0.*" postag_regexp="yes" /> <token postag="PP.*|P0.*" postag_regexp="yes" /> <marker> <token postag="VM[IS]P1S0" postag_regexp="yes" /> </marker> </pattern> <disambig action="filter" postag="V.[IS]P1S0" /> </rule> --> <rule> <!-- un cop, aquestes tres; trasbalsat estic--> <pattern> <token postag="D[DI].*|AQ.*|V.*" postag_regexp="yes"/> <marker> <and> <token postag="VMIP1S0B"><exception regexp="yes">estic|dic</exception></token> <token postag="VMIP1S0B|SENT_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="VMIP1S0B"/> </disambig> </rule> <rule> <!-- estic segura --> <pattern> <token><exception postag="D.*|SPS00|LOC_PREP" postag_regexp="yes"/></token> <marker> <token>estic</token> </marker> </pattern> <disambig action="filter" postag="VMIP1S00"/> </rule> <rule> <pattern> <marker> <token>entre</token> </marker> <token>d'</token> <token>altres</token> </pattern> <disambig action="filter" postag="SPS00"/> </rule> <rule> <pattern> <marker> <token 
postag="SPS00">entre</token> </marker> <token/> <token regexp="yes">i|o</token> </pattern>
      <disambig action="filter" postag="SPS00"/>
    </rule>
    <rule>
      <!-- "respecte a" / "respecte de": when "respecte" has a noun reading (N.*)
           and the next token matches a|de (inflected="yes"), keep only the
           readings whose tag is <LOC_PREP>. In the postag attribute the angle
           brackets are written as character references, because a literal "<"
           is not allowed inside an XML attribute value. -->
      <pattern> <marker> <token postag="N.*" postag_regexp="yes">respecte</token> </marker> <token regexp="yes" inflected="yes">a|de</token> </pattern>
      <disambig action="filter" postag="&lt;LOC_PREP&gt;"/>
    </rule>
    <rule>
      <!-- "respecte" with both a noun (N.*) and a verb (V.*) reading keeps only
           the noun readings, unless the preceding token is one of the listed
           exceptions. The exception list needs to be kept under review. -->
      <pattern> <token><exception regexp="yes">que|em|et|es|la|ens|us|els|les|en|ho|li|vos|'[ntml]|'ls|hi|'ns</exception></token> <!-- should "el" be added as well? --> <marker> <and> <token postag="N.*" postag_regexp="yes">respecte</token> <token postag="V.*" postag_regexp="yes"/> </and> </marker> </pattern>
      <disambig action="filter" postag="N.*"/>
    </rule>
    <rule>
      <!-- After a token tagged V.[IS].*, a word that is both VMIP1S0.? and V.N.*
           keeps only its V.N.* readings. -->
      <pattern> <token postag="V.[IS].*" postag_regexp="yes"/> <marker> <and> <token postag="VMIP1S0.?" postag_regexp="yes"/> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> </pattern>
      <disambig action="filter" postag="V.N.*"/>
    </rule>
  </rulegroup>
  <rulegroup id="SegPersPresSing" name="verb segona persona present singular ">
    <!-- Three variants of the same idea: "tu" followed by zero, one or two tokens
         tagged PP.*|P0.* and then a word with a V.[IS].2S0.? reading. The token
         before "tu" must not be tagged SPS00 or LOC_PREP. -->
    <rule>
      <!-- "tu" + verb.
           NOTE(review): this filter also admits mood M (V.[MIS].2S0.?), unlike the
           two sibling rules, which filter on V.[IS].2S0.? only; confirm intended. -->
      <pattern> <token><exception postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/></token> <token>tu</token> <marker> <token postag="V.[IS].2S0.?" postag_regexp="yes"/> </marker> </pattern>
      <disambig action="filter" postag="V.[MIS].2S0.?"/>
    </rule>
    <rule>
      <!-- "tu" + one PP.*|P0.* token + verb. -->
      <pattern> <token><exception postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/></token> <token>tu</token> <token postag="PP.*|P0.*" postag_regexp="yes"/> <marker> <token postag="V.[IS].2S0.?" postag_regexp="yes"/> </marker> </pattern>
      <disambig action="filter" postag="V.[IS].2S0.?"/>
    </rule>
    <rule>
      <!-- "tu" + two PP.*|P0.* tokens + verb. -->
      <pattern> <token><exception postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/></token> <token>tu</token> <token postag="PP.*|P0.*" postag_regexp="yes"/> <token postag="PP.*|P0.*" postag_regexp="yes"/> <marker> <token postag="V.[IS].2S0.?" 
postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="V.[IS].2S0.?"/> </rule> </rulegroup> <rule id="peu_calces" name="peu calces"> <pattern> <token postag="NC.*" postag_regexp="yes">peu</token> <token postag="V.*" postag_regexp="yes" inflected="yes">calçar</token> </pattern> <disambig action="filterall"/> </rule> <rule id="la_torna" name="la torna"> <pattern> <token inflected="yes">ser</token> <marker> <token postag="DA0FS0">la</token> <token postag="NCFS000">torna</token> </marker> </pattern> <disambig action="filterall"/> </rule> <rule id="tornar_a" name="tornar a/sobre"> <pattern> <token><exception postag="SPS00"/></token> <marker> <token inflected="yes">tornar<exception>torn</exception></token> </marker> <token regexp="yes">a|sobre|de|enrere|arrere|endarrere</token> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="vares" name="vares + infinitiu"> <pattern> <token postag="VA.*" postag_regexp="yes" inflected="yes">anar</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="SegPersSing" name="verb segona persona singular"> <rule> <antipattern> <token postag="N.*|A.*|V.P.*" postag_regexp="yes"/> <token>?</token> </antipattern> <pattern> <!-- cal revisar amb cura |UNKNOWN --> <token postag="(DD|PD).*|V.*|P[P0].*|NP.*|NC.*" postag_regexp="yes"><exception postag="C.*|R.*|DA.*|V.N.*|PT.*" postag_regexp="yes"/><exception regexp="yes">tu|e[mts]|[mts]e|ens|us|[mtsln]'|'[mtsln]|'ls|'ns|li|els?|la|les|en|hi|ho|any|dia|hem</exception></token> <marker> <and> <token postag="V.[IS].2S0." 
postag_regexp="yes"><exception regexp="yes">&verbs_2ps;</exception></token> <token postag="N.*|A.*|V.P.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[IS].2S0."/> <!-- sample phrase (Catalan): "les ha vistes estenent la roba" --> <example type="untouched">Quan tingues gana te'ls menges.</example> <example type="untouched">Digues quines diferències creus que existeixen.</example> <example type="untouched">Digues quines diferències creus tu que existeixen.</example> </rule> <rule> <!-- e.g. "no extremes": context token + "no" (+ optional "pas") + a word that is both V.[IS].2S0. and N.*|A.*|V.P.*; the V.[IS].2S0. readings are removed. The antipattern skips a N.*|A.*|V.P.* token directly followed by "?". --> <antipattern> <token postag="N.*|A.*|V.P.*" postag_regexp="yes"/> <token>?</token> </antipattern> <pattern> <!-- needs careful review: |UNKNOWN --> <token postag="(DD|PD).*|V.*|P[P0].*|NP.*|NC.*" postag_regexp="yes"><exception postag="C.*|R.*|DA.*|V.N.*|PT.*" postag_regexp="yes"/><exception regexp="yes">tu|e[mts]|[mts]e|ens|us|[mtsln]'|'[mtsln]|'ls|'ns|li|els?|la|les|en|hi|ho|any|dia</exception></token> <token>no</token> <token min="0">pas</token> <marker> <and> <token postag="V.[IS].2S0." postag_regexp="yes"><exception regexp="yes">&verbs_2ps;</exception></token> <token postag="N.*|A.*|V.P.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[IS].2S0."/> <!-- sample phrase (Catalan): "les ha vistes estenent la roba" --> <example type="untouched">Quan tingues gana te'ls menges.</example> <example type="untouched">Digues quines diferències creus que existeixen.</example> <example type="untouched">Digues quines diferències creus tu que existeixen.</example> </rule> <rule> <!-- e.g. "ben paleses": after molt|ben|tan, a word that is both V.[IS].2S0.? and A.* keeps only its A.* readings --> <pattern> <token regexp="yes">molt|ben|tan</token> <marker> <and> <token postag="V.[IS].2S0.?" postag_regexp="yes"/> <token postag="A.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="A.*"/> </rule> <rule> <!-- "avantatges" (with fewer restrictions) --> <pattern> <token><exception regexp="yes">tu|ens|m'</exception></token> <marker> <and> <token postag="V.[IS].2S0." 
postag_regexp="yes">avantatges</token> <token postag="N.*|A.*|V.P.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[IS].2S0."/> <!-- Catalan sample phrase carried over from the original note: "les ha vistes estenent la roba" --> <!-- Uses the real word form "avantatges"; the preceding "Ens" falls under the first token's exception (tu|ens|m'), so the sentence must stay untouched. NOTE(review): assumes token matching ignores case by default; confirm. --> <example type="untouched">Ens avantatges en tot.</example> </rule> </rulegroup>
<rule id="creus" name="creus (verb)"> <!-- "creus" right after the sentence start (optional punctuation in between) with a "?" further on: filter on V.* --> <pattern> <token postag="SENT_START"/> <token min="0" max="3" regexp="yes">\p{P}</token> <marker> <token skip="-1">creus</token> </marker> <token>?</token> </pattern> <disambig action="filter" postag="V.*"/> </rule>
<rulegroup id="en_veu" name="en veu baixa">
  <rule> <!-- "en veu" directly followed by an adjective: filter "veu" on N.* --> <pattern> <token>en</token> <marker> <token>veu</token> </marker> <token postag="AQ.[FC][SN]." postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*"/> </rule>
  <rule> <!-- same as above with an RG_anteposat token between "veu" and the adjective --> <pattern> <token>en</token> <marker> <token>veu</token> </marker> <token postag="RG_anteposat"/> <token postag="AQ.[FC][SN]." postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*"/> </rule>
</rulegroup>
<rule id="en_sec" name="en sec"> <!-- Exception to next rule --> <pattern> <token>en</token> <marker> <token>sec</token> </marker> </pattern> <disambig action="filter" postag="A.*"/> </rule>
<rule id="en_persona" name="en persona"> <!-- Exception to next rule --> <pattern> <token>en</token> <marker> <token regexp="yes">persona|vers</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule>
<rulegroup id="TerPersPresSing" name="verb tercera persona present singular "> <!-- TODO (translated from the original note): also any common noun or noun+adjective? -->
  <rule> <pattern> <token><exception postag="SPS00"/></token> <token regexp="yes">ella?</token> <marker> <token postag="V.[IS]P3S0.?" postag_regexp="yes"><exception regexp="yes">sola?|entre|encara</exception><exception postag="V...2.."
postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="V.[IS]P3S0.?"/> </rule> <rule> <!-- exception: davant d'ell el seu triomf --> <antipattern> <token>el</token> <token>tema</token> </antipattern> <pattern> <token><exception postag="SPS00"/></token> <token regexp="yes">ella?</token> <token postag="PP.*|P0.*" postag_regexp="yes"/> <marker> <token postag="V.[IS]P3S0.?" postag_regexp="yes"><exception regexp="yes">seu|.+e</exception><exception postag="V...2.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="V.[IS]P3S0.?"/> </rule> <rule> <pattern> <token><exception postag="SPS00"/></token> <token regexp="yes">ella?</token> <token postag="PP.*|P0.*" postag_regexp="yes"/> <token postag="PP.*|P0.*" postag_regexp="yes"/> <marker> <token postag="V.[IS]P3S0.?" postag_regexp="yes"><exception>seu</exception><exception postag="V...2.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="V.[IS]P3S0.?"/> </rule> </rulegroup> <rulegroup id="ORDRE" name="ordre (m/f)"> <rule> <pattern> <marker> <token>ordre</token> </marker> <token>de</token> <token>l</token> <token>dia</token> </pattern> <disambig postag="NCMS000"/> </rule> </rulegroup> <rule id="ADRECA" name="adreça"> <pattern> <marker> <token postag="NC.*" postag_regexp="yes" inflected="yes">adreça</token> </marker> <token inflected="yes">electrònic</token> </pattern> <disambig action="filterall"/> </rule> <rule id="TRET_PARTICIPI" name="tret, salvat (participi, no preposició)"> <antipattern> <token regexp="yes">de|una|lletra|la</token> <token>e</token> </antipattern> <antipattern> <token>e</token> <token regexp="yes">oberta|tancada|llarga|breu|després</token> </antipattern> <antipattern> <token regexp="yes">com|per|fins|de|olor</token> <token>a</token> </antipattern> <antipattern> <token inflected="yes" 
regexp="yes">atribuir|convertir|canviar|degradar|sentenciar|accés|accedir|exposar|desafiar|arribar|pertànyer|correspondre|condemnar|jugar|tocar|condemnació|sonar|destinar|tendir|candidat|subjecte|aspirar|passar|corresponent|elevar|candidat|candidatura|sorprendre</token> <token postag="&pronom_feble;|AQ.*|V.P.*" postag_regexp="yes" min="0"/> <token>a</token> </antipattern> <antipattern> <token>a</token> <token>tret</token> <token>de</token> <token regexp="yes">fona|pistola|escopeta|arc|ballesta|pedra</token> </antipattern> <antipattern> <token>costat</token> <token>i</token> <token>costat</token> </antipattern> <antipattern> <token><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes"/></token> <token>a</token> <token>mort</token> </antipattern> <antipattern> <token>em<exception scope="previous" regexp="yes">t'|l'|li|ens|us|vos|els|les</exception></token> <token postag="V.[SI].*" postag_regexp="yes"/> </antipattern> <antipattern> <token>a</token> <token regexp="yes">puntada|puntades|proposta|propostes|mes|demés|tos</token> </antipattern> <antipattern> <token>fet</token> <token>i</token> <token min="0">a</token> <token>amagar</token> </antipattern> <antipattern> <token inflected="yes">jugar</token> <token>a</token> <token>fet</token> </antipattern> <antipattern> <token>a</token> <token>partit</token> <token regexp="yes">únic|doble</token> </antipattern> <antipattern> <token postag_regexp="yes" postag="V.*"/> <token postag="&pronom_feble;|R.*" postag_regexp="yes" min="0" max="2"/> <token>a</token> <token regexp="yes">mort|cobert</token> </antipattern> <antipattern> <token postag_regexp="yes" postag="V.*" inflected="yes">posar</token> <token postag="&pronom_feble;|R.*" postag_regexp="yes" min="0" max="2"/> <token>a</token> <token regexp="yes">tret</token> </antipattern> <antipattern> <token inflected="yes" regexp="yes">adjudicar|adjudicació|assignar|assignació|nomenament|nomenar|escollir|seleccionar|triar|elegir</token> <token>a</token> <token>dit</token> 
</antipattern> <antipattern> <token>estat</token> <token regexp="yes">líquid|sòlid|gasós</token> </antipattern> <antipattern> <token>de</token> <token postag="NC.S.*" postag_regexp="yes"/> <token>a</token> <token postag="NC.S.*" postag_regexp="yes"/> </antipattern> <pattern> <token regexp="yes">&formes_HAVER_sense_hac;</token> <token min="0" regexp="yes">&particula_entre_auxiliar_participi;</token> <marker> <token postag="V.P.*" postag_regexp="yes"><exception regexp="yes">mes|dificultats</exception></token> </marker> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rulegroup id="mort" name="mort"> <rule> <pattern> <token postag="[AN].*" postag_regexp="yes" regexp="yes">mort|morta|morts|mortes<exception scope="previous" inflected="yes">haver</exception></token> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <pattern> <token postag="D..M.." postag_regexp="yes"/> <marker> <token regexp="yes">mort|morts<exception scope="previous" inflected="yes">haver</exception></token> </marker> </pattern> <disambig action="remove" postag="NCF.*"/> </rule> </rulegroup> <rulegroup id="possibilitat" name="possibilitat"> <rule> <pattern> <token regexp="yes">més|menys</token> <marker> <token regexp="yes">possibilitats?<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <pattern> <marker> <token regexp="yes">possibilitats?<exception scope="previous" inflected="yes">haver</exception><exception scope="next" regexp="yes">per|pe</exception></token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> </rulegroup> <rule id="la_culpa" name="culpa (nom)"> <pattern> <!-- error en: te -> té --> <token>te</token> <token regexp="yes">la|l'</token> <marker> <!-- generalitzar? 
--> <token postag="NC.S000" postag_regexp="yes" regexp="yes">culpa|pell|avantatge</token> </marker> </pattern> <disambig action="filter" postag="NC.S000"/> </rule> <rule id="espes" name="espès (no participi)"> <pattern> <token postag="A.*|N.*" postag_regexp="yes" regexp="yes">espès|espés|costats?<exception scope="previous" inflected="yes">haver</exception></token> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rulegroup id="telegraphic_writing" name="escriptura telegràfica"> <rule> <pattern> <token regexp="yes">obert|tancat</token> <token regexp="yes" inflected="yes">matí|tarda|vesprada|vespre|nit|vespra|víspera|festiu|&dies_setmana;</token> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes" inflected="yes">sol·licitud</token> <token postag="N.*" postag_regexp="yes" inflected="yes">certificat</token> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">total|import|preu|remesa</token> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">factura|entrada|proveïdor|client</token> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">total|import|preu</token> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">factura|entrada|albarà</token> </pattern> <disambig action="immunize"/> </rule> </rulegroup> <rule id="el_be" name="el bé"> <antipattern> <token>lo</token> <token>bé</token> </antipattern> <pattern> <token postag="DA0MS0"/> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">bé|darrere|davant</token> </marker> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <rule id="mitjo_de_mitja" name="mitjó de mitja"> <pattern> <token inflected="yes" regexp="yes">mitjó|calcetí</token> <token>de</token> <marker> <token>mitja</token> </marker> </pattern> <disambig action="replace"> <wd 
lemma="mitja" pos="NCFS000"/> </disambig> </rule> <rule id="punta" name="punta (nom, no adjectiu) "> <pattern> <token><exception postag="NC.*" postag_regexp="yes"/></token> <marker> <token postag="NCFS000">punta</token> </marker> </pattern> <disambig action="remove" postag="AQ0CN0"/> </rule> <rule id="annual" name="desastre d'Annual"> <pattern> <token regexp="yes" inflected="yes">desastre|batalla|ocupació|victòria|desfeta|derrota</token> <token regexp="yes">d'|de|a|en</token> <marker> <token case_sensitive="yes">Annual</token> </marker> </pattern> <disambig action="add" postag="NPCSG00"/> </rule> <rulegroup id="noms_aposicio" name="noms en aposició"> <rule> <pattern> <token regexp="yes" inflected="yes">nom|paraula|mot|verb|substantiu|expressió|frase|adjectiu|apel·latiu</token> <marker> <token regexp="yes">comodí|crossa|falca</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">certificat|passi|passaport</token> <marker> <token>covid</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">dimensió|mesura|mida</token> <marker> <token regexp="yes">micro|macro</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">compte|llibre|pel·lícula|programa|espectacle|entrevista|notícia|reportatge</token> <marker> <token>paròdia</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">quadre|taula|redacció|escrit</token> <marker> <token>resum</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">estètica|personatge|còmic|llibre|pel·lícula|dibuixant|publicació</token> <marker> <token>manga</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> 
<token regexp="yes" inflected="yes">cotxe|vehicle|moto|furgoneta|furgona</token> <marker> <token>espiell</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">tomata|tomaca|tomàquet|tomàtec|tomàtic|tomàtiga|tomacó</token> <marker> <token>cherry</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">salsa|espagueti|macarró|pasta</token> <marker> <token>carbonara</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">pantalla|televisió|televisor|bombeta</token> <marker> <token>led</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">furgoneta|furgó|furgona|vehicle|cotxe</token> <marker> <token>càmper</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes">mètode|sistema</token> <marker> <token>cangur</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes">peix</token> <marker> <token regexp="yes">manta|globus</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">població|públic|usuari|comprador</token> <marker> <token regexp="yes">diana|objectiu</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes">compte</token> <marker> <token regexp="yes">negoci|expansió</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes">cel·la</token> <marker> <token>unitat</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes">papallona</token> <marker> <token 
regexp="yes">mussol|bufaforats|safranera|zebra</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- singular "dona" before an occupation noun: add a _GN_FS reading --> <pattern> <marker> <token postag="NCFS000">dona</token> </marker> <token regexp="yes">pilot|pastor|compositora|bombera</token> </pattern> <disambig action="add"> <wd lemma="dona" pos="_GN_FS"/> </disambig> </rule>
<rule> <!-- plural "dones" before an occupation noun: add a _GN_FP reading --> <pattern> <marker> <token postag="NCFP000">dones</token> </marker> <token regexp="yes">pilots?|pastors?|compositores|bomberes</token> </pattern> <disambig action="add"> <wd lemma="dona" pos="_GN_FP"/> </disambig> </rule>
<rule> <!-- "compte" + "expansió"/"negocis": filter the head noun on N.* --> <pattern> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes">compte</token> </marker> <token regexp="yes">expansió|negocis</token> </pattern> <disambig action="filter" postag="N.*"/> </rule>
<rule> <!-- "compte" + "expansió"/"negocis": the second word is retagged AQ0CN0 --> <pattern> <token postag="N.*" postag_regexp="yes" inflected="yes">compte</token> <marker> <token regexp="yes">expansió|negocis</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "marc"; the list spells "conferència" correctly so that "conferència marc" is matched --> <pattern> <token inflected="yes" regexp="yes">projecte|pla|acció|conferència|trobada|reunió|encontre</token> <marker> <token>marc</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "llampec" --> <pattern> <token inflected="yes" regexp="yes">compareixença|acció|guerra|manifestació|intervenció|batalla|invasió|viatge|visita</token> <marker> <token>llampec</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "soldat" --> <pattern> <token inflected="yes" regexp="yes">dona|noi|nen|infant|xiquet|xic</token> <marker> <token>soldat</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "grizzly" --> <pattern> <token inflected="yes" regexp="yes">ós|óssos|óssa|ósses|os|ossos|ossa|osses</token> <marker> <token>grizzly</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <pattern> <token regexp="yes"
inflected="yes">conseller|ministre|president|vicepresident|director|viceministre</token> <marker> <token>portaveu</token> </marker> </pattern> <disambig action="replace"> <wd lemma="portaveu" pos="AQ0CN0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">transmissor|emissor|ràdio|estació</token> <marker> <token regexp="yes" case_sensitive="yes">AM|FM</token> </marker> </pattern> <disambig action="replace"> <wd pos="AQ0CN0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">astre|esport|instrument</token> <marker> <token>rei</token> </marker> </pattern> <disambig action="replace"> <wd lemma="rei" pos="AQ0CN0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">etapa|prova|competició</token> <marker> <token>reina</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">grup|classe|viatge|vol</token> <marker> <token>bombolla</token> </marker> </pattern> <disambig action="replace"> <wd lemma="bombolla" pos="AQ0CN0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">pregunta|argument|argumentació</token> <marker> <token>trampa</token> </marker> </pattern> <disambig action="replace"> <wd lemma="trampa" pos="AQ0CN0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">país|estat|llengua|cultura</token> <marker> <token>pària</token> </marker> </pattern> <disambig action="replace"> <wd lemma="paria" pos="AQ0CS0"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">països|estats|llengües|cultures</token> <marker> <token>pàries</token> </marker> </pattern> <disambig action="replace"> <wd lemma="paria" pos="AQ0CP0"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">empresa|negoci|companyia</token> <marker> <token>unicorn</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" 
regexp="yes">menjar|televisió|contracte|feina|faena|treball|acció|llibre|hipoteca|bo|notícia</token> <marker> <token regexp="yes">escombraria|escombraries|porqueria|fem|brossa</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token>estat<exception scope="previous" inflected="yes" postag="V...3S.." postag_regexp="yes">haver</exception></token> <marker> <token regexp="yes">membre|nació</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token>hi</token> <token min="0" inflected="yes" regexp="yes">anar|haver</token> <token inflected="yes">haver</token> <token>estat</token> <marker> <token regexp="yes">membre|nació</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes"/> <marker> <token>braille</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">camió|tren|avió|autobomba|contenidor|remolc|vagó|vaixell</token> <marker> <token>cisterna</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">llengua|idioma</token> <marker> <token>meta</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">casella|client|clientela|públic</token> <marker> <token>objectiu</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">vaixell|nau</token> <marker> <token regexp="yes">escola|factoria|almirall|insígnia|fantasma</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">plat|llibre|batalló|actor|actriu</token> <marker> <token>insígnia</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> 
<rule> <!-- head noun + "pilot" --> <pattern> <token inflected="yes" regexp="yes">línia|esdeveniment|escola|planta|centre|projecte|proposta|pis|apartament|casa|prova|capítol|habitatge|vivenda|fase|programa</token> <marker> <token>pilot</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- "formatge" + cheese name; "parmesà" and "parmesana" are two separate alternatives (a blank between them would make both unmatchable, since the alternative would then contain a space) --> <pattern> <token inflected="yes">formatge</token> <marker> <token regexp="yes">brie|cabrales|camembert|cantal|edam|emmental|feta|fontal|fontina|gorgonzola|gouda|gruyère|havarti|idiazabal|limburguès|manxec|maó|mascarpone|mimolette|montsec|mozzarella|parmesà|parmesana|pirineus|ragusà|rocafort|roncal|tronxon|cheddar</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "llindar" --> <pattern> <token inflected="yes" regexp="yes">freqüència|energia|potència|valor|quantitat|xifra|import|volum|pes|durada|quantia|mesura|suma</token> <marker> <token>llindar</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "revelació" --> <pattern> <token inflected="yes" regexp="yes">pel·lícula|film|obra|director|llibre|actor|actriu|autor|escriptor|equip|jugador|entrenador|davanter|golejador</token> <marker> <token>revelació</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "arrel" --> <pattern> <token inflected="yes" regexp="yes">carpeta|directori|certificat</token> <marker> <token>arrel</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- head noun + "panda" --> <pattern> <token inflected="yes" regexp="yes">ós|óssa</token> <marker> <token>panda</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule>
<rule> <!-- "matriu" + "identitat" --> <pattern> <token inflected="yes">matriu</token> <marker> <token>identitat</token> </marker> </pattern> <disambig action="replace" postag="AQ0FN0"/> </rule>
<rule> <!-- "escola" + "bressol" --> <pattern> <token inflected="yes">escola</token> <marker> <token>bressol</token> </marker> </pattern> <disambig action="replace" postag="AQ0FN0"/> </rule>
<rule> <pattern> <token inflected="yes">memòria</token> <marker>
<token>cau</token> </marker> </pattern> <disambig action="replace" postag="AQ0FN0"/> </rule> <rule> <pattern> <token>paper</token> <marker> <token>moneda</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token>lletra</token> <marker> <token postag="NCFS.*" postag_regexp="yes" regexp="yes">.{1,6}</token> </marker> </pattern> <disambig action="replace" postag="AQ0FS0"/> </rule> <rule> <pattern> <token regexp="yes">efecte|tipus</token> <marker> <token postag="NC.*" postag_regexp="yes"><exception postag="NC.*" postag_regexp="yes" negate_pos="yes"/></token> </marker> <token><exception postag="AQ.*" postag_regexp="yes"/></token> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token regexp="yes">efecte|tipus</token> <marker> <token postag="NCFS000">cascada</token> </marker> <token><exception postag="AQ.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="NCFS000"/> </rule> <rule> <pattern> <token>anys</token> <marker> <token>llum</token> </marker> </pattern> <disambig action="replace" postag="AQ0MP0"/> </rule> <rule> <pattern> <token>any</token> <marker> <token>llum</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token>déu</token> <marker> <token regexp="yes">pare|fill|esperit</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token>pare</token> <marker> <token regexp="yes">confessor|administrador|director|prior|prefecte|rector</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token>el</token> <marker> <token>pare</token> </marker> <token postag="NCMS000"/> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <rule> <pattern> <token regexp="yes">retrats?|fotos?</token> <marker> <token>robot</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> 
<token>pantalons</token> <marker> <token>bombatxos</token> </marker> </pattern> <disambig action="replace" postag="AQ0MP0"/> </rule> <rule> <pattern> <token regexp="yes">arcs?</token> <marker> <token>iris</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes">correus?|missatges?|comentaris?|e-?mails?|continguts?</token> <marker> <token regexp="yes">brossa|escombraries|porqueria</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">menjar|televisió|contracte|feina|faena|acció|llibre|hipoteca|bo</token> <marker> <token regexp="yes">brossa|escombraries|porqueria</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">factor|efecte|convidat|convidada|invitat|invitada|festa|celebració|atac|membre|regal|element|retorn|tornada|regrés|viatge|examen|ingredient</token> <marker> <token>sorpresa</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">mot|paraula|tema|qüestió|problema|persona</token> <marker> <token>tabú</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <token>decrets</token> <marker> <token>llei</token> </marker> </pattern> <disambig action="replace" postag="AQ0MP0"/> </rule> <rule> <pattern> <token>decret</token> <marker> <token>llei</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <marker> <token inflected="yes">metge</token> </marker> <token inflected="yes" regexp="yes">.+òleg|.+iatre|.+ista|cirurgià|psiquiatre</token> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <rule> <!-- hauria d'anar a Multiwords: --> <pattern> <marker> <token inflected="yes">torre</token> </marker> <token inflected="yes" regexp="yes">campanar|talaia</token> </pattern> 
<disambig action="filter" postag="NC.*"/> </rule> <rule> <pattern> <token inflected="yes">torre</token> <marker> <token inflected="yes" regexp="yes">campanar|talaia</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <!-- hauria d'anar a Multiwords: --> <pattern> <marker> <token inflected="yes" regexp="yes">poble|barri</token> </marker> <token inflected="yes" regexp="yes">fantasma|dormitori|castell|camí</token> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">poble|ciutat|barri</token> <marker> <token inflected="yes" regexp="yes">fantasma|dormitori|castell|camí</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <!-- hauria d'anar a Multiwords: --> <pattern> <marker> <token inflected="yes">ministre</token> </marker> <token>secretari</token> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <rule> <pattern> <token>sal</token> <marker> <token regexp="yes">sosa|gemma</token> </marker> </pattern> <disambig action="replace"> <wd pos="AQ0FS0"/> </disambig> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="[NA].*|_GN_.*|VMIP1S0B|V.G.*" postag_regexp="yes" negate_pos="yes"/><exception regexp="yes">gran|possible|major|petit|propi|pròpia</exception></token> <marker> <token regexp="yes" postag="NC.*" postag_regexp="yes">consort|mare|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|estrela|model|hoste|base|pont|sulfat|fosfat|calci|gas|satèl·lit|gel</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="D.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception postag="A.*|V.N.*|PX.*|V.P.*|VMIP1S0B" postag_regexp="yes"/><exception regexp="yes">son|sa|petit</exception></token> </unify> <marker> <token 
regexp="yes">consort|mare|pare|fill|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|estrela|model|hoste|base|pont|sulfat|fosfat|calci|gas|satèl·lit|gel</token> </marker> </pattern> <disambig action="replace" postag="AQ0CN0"/> <example type="untouched">El meu pare era de l'associació.</example> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="[NA].*|_GN_.*" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token regexp="yes">obra|propietat|objecte</token> </marker> <token regexp="yes">de|d'</token> </pattern> <disambig action="replace" postag="AQ0CN0"/> </rule> <rule> <pattern> <!--<token postag="D..MS." postag_regexp="yes"/>--> <marker> <token regexp="yes">objectes?</token> </marker> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule> <pattern> <token postag="N..S.*" postag_regexp="yes"><exception postag="N.*|AQ.*" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token regexp="yes">víctima|màrtir|terratinent|mascle|femella|especialista</token> </marker> </pattern> <disambig action="replace" postag="AQ0CS0"/> </rule> <rule> <pattern> <token postag="N..P.*" postag_regexp="yes"><exception postag="N.*|AQ.*" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token regexp="yes">víctimes|màrtirs|terratinents|mascles|femelles|membres|claus|especialistes|estàndards</token> </marker> </pattern> <disambig action="replace" postag="AQ0CP0"/> </rule> <rule> <pattern> <token postag="N.MS.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token regexp="yes">candidat|hereu|propietari</token> </marker> </pattern> <disambig action="replace" postag="AQ0MS0"/> </rule> <rule> <pattern> <token postag="N.MP.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token regexp="yes">candidats|hereus|propietaris</token> 
</marker> </pattern> <disambig action="replace" postag="AQ0MP0"/> </rule> <rule> <pattern> <token postag="N.FS.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token regexp="yes">candidata|hereua|hereva|propietària</token> </marker> </pattern> <disambig action="replace" postag="AQ0FS0"/> </rule> <rule> <pattern> <token postag="N.FP.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token regexp="yes">candidates|hereues|hereves|propietàries</token> </marker> </pattern> <disambig action="replace" postag="AQ0FP0"/> </rule> <rule> <pattern> <token regexp="yes">cotxes?|paquets?</token> <marker> <token>bomba</token> </marker> </pattern> <disambig action="replace" postag="AQ0MN0"/> </rule> <rule> <pattern> <marker> <token inflected="yes">tren</token> </marker> <token regexp="yes">cremallera|tramvia|correu</token> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <rule> <pattern> <token inflected="yes">tren</token> <marker> <token regexp="yes">cremallera|tramvia|correu</token> </marker> </pattern> <disambig action="replace" postag="AQ0MN0"/> </rule> <rule> <pattern> <token inflected="yes">nota</token> <marker> <token regexp="yes">do|re|mi|sol|si</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token inflected="yes">nota</token> <marker> <token regexp="yes">la|fa</token> </marker> <token><exception>que</exception><exception postag="V.[MSI].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token>carta</token> <marker> <token regexp="yes">pobla|bomba</token> </marker> </pattern> <disambig action="replace" postag="AQ0FS0"/> </rule> <rule> <pattern> <token>dona</token> <marker> <token regexp="yes">pilot|alcaldessa|(.*)presidenta|policia|astronauta|cosmonauta|bombera</token> </marker> </pattern> <disambig action="replace" postag="AQ0FS0"/> </rule> <rule> 
<pattern> <token>zona</token> <marker> <token regexp="yes">centre|pícnic|fumadors</token> </marker> </pattern> <disambig action="replace" postag="AQ0FS0"/> </rule> <rule> <pattern> <token>cartes</token> <marker> <token regexp="yes">pobla|bomba</token> </marker> </pattern> <disambig action="replace" postag="AQ0FP0"/> </rule> </rulegroup> <rule id="CAP" name="cap"> <pattern> <marker> <token postag="NCCS000">cap</token> </marker> <token>d'</token> <token>estudis</token> </pattern> <disambig action="filter" postag="NCCS000"/> </rule> <rule id="els_CAP" name="els CAP"> <pattern> <token postag="D..M.*" postag_regexp="yes"/> <marker> <token case_sensitive="yes">CAP</token> </marker> </pattern> <disambig action="replace" postag="NCMN000"/> </rule> <!-- verb imperatiu, infinitiu o gerundi seguit de pronom--> <rule id="VERB_PP" name="verb seguit de pronom"> <pattern> <marker> <token postag="V.[MNG].*" postag_regexp="yes"/> </marker> <token postag="&pronom_feble;" postag_regexp="yes" regexp="yes" spacebefore="no">['-].+</token> </pattern> <disambig action="filter" postag="V.[MNG].*|_GV_|_loc_nosequi|_perfet|_obligacio|_reflexiu"/> </rule> <rule id="nAdverbi" name="no adverbi"> <!-- paraules comunes que no solen ser adverbi gairebé mai --> <pattern> <marker> <token>poder</token> </marker> </pattern> <disambig action="filter" postag="[^R].*"/> </rule> <rulegroup id="infinitiu_complement" name="Verb en infinitiu com a complement"> <!-- Les coses a observar, les coses de menjar, els efectes immediats de vomitar --> <rule> <pattern> <token postag="N.*|A.*" postag_regexp="yes"/> <token postag="SPS00"/> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag=".*LOC_PREP.*" postag_regexp="yes"/> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token 
postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/> <token>no</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="N.*|A.*" postag_regexp="yes"/> <token postag="SPS00"/> <token postag="SPS00"/> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">en|,|a</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START|_PUNCT.*|D[ADI].MS.*" postag_regexp="yes"><exception>tant</exception></token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">poder|voler|deixar</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">acabat|després</token> <token>de</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="complement"/> <token regexp="yes">i|o|ni|però|sinó|,</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> </rulegroup> <rulegroup id="dur_adjectiu" name="dur (adjectiu)"> <rule> <pattern> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">ser|estar|semblar|parèixer</token> <token min="0" max="3" postag="RG|LOC_ADV" postag_regexp="yes"/> <marker> <token postag="AQ0MS0">dur</token> </marker> <token><exception postag="[DP].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="AQ0MS0"/> 
</rule> <rule> <pattern> <marker> <token postag="RG|LOC_ADV" postag_regexp="yes"/> <token postag="AQ0MS0">dur</token> </marker> <token><exception postag="[DP].*" postag_regexp="yes"/></token> </pattern> <disambig action="filterall"/> </rule> </rulegroup> <rule id="Verb_infinitiu" name="Verb infinitiu darrere de preposició i de verb"> <!-- "a ser valenta", "vull ser valenta": ser és infinitiu --> <pattern> <token postag="SP.*|V.[IS].*" postag_regexp="yes"><exception postag="PX.*|AQ.*|NC.*" postag_regexp="yes"/></token> <!-- el seu poder --> <marker> <and> <token postag="N.*|A.*" postag_regexp="yes"/> <token postag="V.N.*" postag_regexp="yes"><exception regexp="yes">deure|poder|saber|menjar|sopar|despertar</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="V.N.*|complement"/> </rule> <rulegroup id="fer_infinitiu" name="fer/ser infinitiu"> <rule> <pattern> <token postag="V.*" postag_regexp="yes"/> <marker> <token>fer</token> </marker> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <pattern> <token postag="C.*" postag_regexp="yes"/> <marker> <token>fer</token> </marker> <token min="0" max="3" postag="RG|LOC_ADV" postag_regexp="yes"/> <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <pattern> <token>a</token> <token>l</token> <marker> <token>fer</token> </marker> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <pattern> <token>tant</token> <marker> <token>fer</token> </marker> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <pattern> <token><exception postag="D[^R].MS." 
postag_regexp="yes"/></token> <marker> <token>ser</token> </marker> <token min="0" max="3" postag="RG|LOC_ADV" postag_regexp="yes"/> <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <pattern> <marker> <token inflected="yes">fer</token> </marker> <token>acopi</token> </pattern> <disambig action="filter" postag="V.*"/> </rule> </rulegroup> <rule id="fer_miques" name="fer miques"> <pattern> <marker> <token postag="V.*" postag_regexp="yes" inflected="yes">fer</token> </marker> <token min="0">a</token> <token regexp="yes">estelles|miques|xixines|trossos|peces|pols</token> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="articular" name="articular (infinitiu o adj)"> <pattern> <token postag="V.*" postag_regexp="yes"/> <marker> <token postag="V.*" postag_regexp="yes">articular</token> </marker> </pattern> <disambig action="remove" postag="A.*"/> </rule> <rule id="feu_nom" name="feu (nom)"> <pattern> <token>antic</token> <marker> <token postag="N.*" postag_regexp="yes">feu</token> </marker> </pattern> <disambig action="filter" postag="N.*|.*_GN_.*"/> </rule> <rule id="perquè_conjuncio" name="perquè (conjunció)"> <pattern> <token><exception postag="D..MS." 
postag_regexp="yes"/></token> <marker> <token postag="CS">perquè</token> </marker> </pattern> <disambig action="filterall"/> <example type="untouched">Sense saber el perquè.</example> </rule> <rule id="feu_verb" name="feu (verb)"> <pattern> <marker> <token postag="V.*" postag_regexp="yes">feu</token> <token postag="N.*" postag_regexp="yes" regexp="yes">clic|bondat</token> </marker> </pattern> <disambig action="filterall"/> </rule> <rule id="fera_nom" name="fera (nom)"> <pattern> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes">fera</token> </marker> <token inflected="yes" regexp="yes">salvatge|feroç|ferotge</token> </pattern> <disambig action="filter" postag="N.*|.*_GN_.*"/> </rule> <rule id="fe" name="fe (verb balear)"> <antipattern> <token>fe</token> <token postag="V.N.*" postag_regexp="yes"/> </antipattern> <antipattern> <token>fe</token> <token>que</token> </antipattern> <pattern> <token><exception regexp="yes">em|et|li|us|vos|ens|els|es</exception></token> <marker> <token>fe</token> </marker> </pattern> <disambig action="remove" postag="VMIS3S0B"/> </rule> <rulegroup id="fer_nom" name="fer + nom/adj: elimina el participi"> <antipattern> <token>un</token> <token>fan</token> </antipattern> <rule> <!-- de fes --> <pattern> <token postag="SPS00|LOC_PREP" postag_regexp="yes"><exception>en</exception></token> <marker> <and> <token inflected="yes">fer</token> <token postag="NC.*|A.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[^PN].*"/> </rule> <rule> <!-- fer amistat, costat, aliat, etc. --> <pattern> <token inflected="yes" regexp="yes">fer|donar<exception regexp="yes">dona|dones</exception></token> <marker> <and> <token postag="V.P.*" postag_regexp="yes"/> <token postag="NC.*|A.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="NC.*|A.*"/> </rule> <rule> <antipattern> <token postag="D..FS." 
postag_regexp="yes"/>
        <token>fera</token>
      </antipattern>
      <pattern>
        <marker>
          <token postag="V.*" postag_regexp="yes" inflected="yes">fer<exception regexp="yes">fets?|feres|feu|fe</exception><exception postag=".*LOC_ADV.*" postag_regexp="yes"/></token>
        </marker>
        <token postag="NC.*|V.G.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="V.*"/>
    </rule>
    <rule>
      <!-- Example: "fer mestral". After a verb form of "fer" (surface forms fet/fets/feres/feu excluded),
           a word that has both an NC and an AQ reading, and is not followed by a noun, keeps only its NC readings. -->
      <pattern>
        <token postag="V.*" postag_regexp="yes" inflected="yes">fer<exception regexp="yes">fets?|feres|feu</exception></token>
        <marker>
          <and>
            <token postag="NC.*" postag_regexp="yes"/>
            <token postag="AQ.*" postag_regexp="yes"><exception postag="_GN_.*|V.G.*|SPS00|V.[IS].*" postag_regexp="yes"/></token>
          </and>
        </marker>
        <token><exception postag="NC.*" postag_regexp="yes"/></token>
      </pattern>
      <disambig action="filter" postag="NC.*"/>
    </rule>
  </rulegroup>
  <!-- "posar en marxa / contacte / dubte / directe": a verb form of "posar", the preposition "en" (SPS00)
       and one of the listed words with a noun reading. filterall narrows every matched token to the
       readings selected by its own postag in the pattern (see the LanguageTool disambiguator docs). -->
  <rule id="posar_en_marxa" name="posar en marxa">
    <pattern>
      <token postag="V.*" postag_regexp="yes" inflected="yes">posar</token>
      <token postag="SPS00">en</token>
      <token postag="N.*" postag_regexp="yes" regexp="yes">marxa|contacte|dubte|directe</token>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- "tractat militar" / "agregat militar": the first word is kept as a masculine singular noun (NCMS000)
       and "militar" as an adjective (AQ0CS0). -->
  <rule id="tractat_militar" name="tractat militar">
    <pattern>
      <token postag="NCMS000" regexp="yes">tractat|agregat</token>
      <token postag="AQ0CS0">militar</token>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- A form of poder/voler/saber that is ambiguous between verb and noun and is followed by an infinitive
       (V.N.*) without an adjective reading keeps only its verb readings. -->
  <rule id="poder_infinitiu" name="poder/saber/voler + infinitiu">
    <pattern>
      <marker>
        <and>
          <token postag="V.*" postag_regexp="yes" regexp="yes" inflected="yes">poder|voler|saber</token>
          <token postag="N.*" postag_regexp="yes"/>
        </and>
      </marker>
      <token postag="V.N.*" postag_regexp="yes"><exception postag="AQ.*" postag_regexp="yes"/></token>
      <!-- exc. 
el poder militar --> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="poder_substantiu" name="el poder/saber/voler + no infinitiu"> <pattern> <token postag="DA0MS0"/> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">poder|voler</token> <!-- saber?: tractament especial --> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> <token><exception regexp="yes">això|açò|allò</exception><exception postag="V.N.*" postag_regexp="yes"/><exception postag="P.*" postag_regexp="yes" regexp="yes">-.+</exception></token> </pattern> <disambig action="remove" postag="V.N.*"/> </rule> <rule id="poder_podar" name="poder/podar + infinitiu"> <pattern> <marker> <and> <token inflected="yes">poder</token> <token inflected="yes">podar</token> </and> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="remove"> <wd lemma="podar"/> </disambig> </rule> <rule id="oldre_oliar" name="olorar_oliar"> <pattern> <marker> <and> <token inflected="yes">oldre</token> <token inflected="yes">oliar</token> </and> </marker> </pattern> <disambig action="remove"> <wd lemma="oliar"/> </disambig> </rule> <rule id="poder_podrir" name="poder/podrir + infinitiu"> <pattern> <marker> <and> <token inflected="yes">poder</token> <token inflected="yes">podrir</token> </and> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="remove"> <wd lemma="podrir"/> </disambig> </rule> <rule id="voler_volar" name="voler/volar + infinitiu"> <pattern> <marker> <and> <token inflected="yes">voler</token> <token inflected="yes">volar</token> </and> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="remove"> <wd lemma="volar"/> </disambig> </rule> <rule id="deure_dar" name="deure/dar + infinitiu"> <pattern> <marker> <and> <token inflected="yes">deure</token> <token inflected="yes">dar</token> </and> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="remove"> <wd 
lemma="dar"/> </disambig> </rule> <rule id="menjar_substantiu" name="menjar substantiu"> <pattern> <token postag="D[^R].[CM]S.*" postag_regexp="yes"><exception>tant</exception></token> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">collar|parlar|avenir|menjar|berenar|sopar|esmorzar|dinar|beure|somriure|riure|solar|titular|pesar|lleure|despertar</token> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> <token><exception postag="P[0P].*" postag_regexp="yes" regexp="yes">-.+</exception></token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule id="caldrevoler_nomparticipi" name="caldre/voler + nom/participi"> <!-- cal/vol amistat --> <pattern> <token inflected="yes" regexp="yes">caldre|voler</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*" postag_regexp="yes"><exception>invertit</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="calent" name="calent (adj)"> <pattern> <marker> <token postag="AQ.*" postag_regexp="yes" inflected="yes">calent</token> </marker> <token>de</token> <token regexp="yes">cap|ment</token> </pattern> <disambig action="filter" postag="AQ.*"/> </rule> <rulegroup id="Poder_substantiu_infinitiu" name="Poder com a substantiu o infinitiu"> <rule> <pattern> <token inflected="yes">haver</token> <token>de</token> <marker> <and> <token postag="N.*" postag_regexp="yes">poder</token> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="N.*"/> </rule> <!-- adquirir/guanyar/perdre poder--> <rule> <pattern> <token inflected="yes" regexp="yes" skip="3">relació|expansió|expandir|distribuir|distribució|tornar|accedir|accés|arribar|oferir|heretar|guanyar|perdre|adquirir|obtenir|assolir|abastar|exercir|exercici|conservar|mantenir|ocupar|recuperar</token> <marker> <and> <token postag="N.*" postag_regexp="yes">poder</token> <token postag="V.N.*" postag_regexp="yes"/> </and> 
</marker> <token><exception postag="P.*" postag_regexp="yes" regexp="yes">-.+</exception></token> </pattern> <disambig action="remove" postag="V.N.*"/> </rule> <rule> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes">poder</token> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">seu|de|d'</token> </pattern> <disambig action="remove" postag="V.N.*"/> </rule> <rule> <pattern> <token>com</token> <token>a</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.N.*"/> </rule> <rule> <pattern> <token regexp="yes">per|a</token> <marker> <and> <token postag="N.*" postag_regexp="yes">poder</token> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="N.*"/> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/> <token postag="D[^R].MS." postag_regexp="yes"/> <marker> <and> <token postag="N.*" postag_regexp="yes">poder</token> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.N.*"/> </rule> <rule id="poder_substantiu2" name="poder (substantiu) + de"> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes">poder</token> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">de|d'|a</token> </pattern> <disambig action="remove" postag="V.N.*"/> </rule> <rule id="deure_substantiu" name="el deure (substantiu) + de"> <pattern> <token postag="D..MS." 
postag_regexp="yes"/> <marker> <and> <token postag="N.*" postag_regexp="yes">deure</token> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">de|d'</token> </pattern> <disambig action="remove" postag="V.N.*"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes" skip="2">tenir|haver</token> <token>prou</token> <token regexp="yes">amb|de</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <!-- qualsevol verb/substantiu --> <token postag="V.N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="N.*"/> </rule> </rulegroup> <rule id="ON_relatiu" name="on, pronom relatiu"> <pattern> <token postag="N.*|AQ.*" postag_regexp="yes"/> <marker> <token>on</token> </marker> </pattern> <disambig action="filter" postag="PR.*"/> </rule> <rulegroup id="X_per_X" name="casa per casa, porta per porta, etc "> <rule> <pattern> <marker> <token postag="N.*" postag_regexp="yes"/> </marker> <token>per</token> <token><match no="0"/></token> </pattern> <disambig action="filter" postag="N.*"/> </rule> </rulegroup> <rule id="plana_si_plana_no" name="plana sí plana no"> <pattern> <token postag="NC.*" postag_regexp="yes"/> <token>sí</token> <token postag="NC.*" postag_regexp="yes"/> <token regexp="yes">no|també</token> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="te_infusio_lletra" name="te (nom d'infusió, lletra te)"> <rule> <pattern> <marker> <token postag="P.*" postag_regexp="yes">te</token> <token postag="&pronom_feble;" postag_regexp="yes" regexp="yes">la|les|li|'l|'ls|'m|'n|'ns</token> </marker> <token postag="V.[SI].*" postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <marker> <token postag="P.*" postag_regexp="yes">te</token> <token postag="&pronom_feble;" postag_regexp="yes" spacebefore="no"/> </marker> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">&verbs_TE_INFUSIO;</token> <token min="0" 
postag="D.*|RG|&pronom_feble;" postag_regexp="yes"/> <marker> <token>te</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/> <marker> <token>te</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/> <token postag="D[^R].*" postag_regexp="yes"/> <marker> <token>te</token> </marker> <token><exception postag="P.*|V.[SI].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token><exception regexp="yes">ella?|vost[èé]</exception><exception postag="N.*|_GN.*" postag_regexp="yes"/></token> <token>el</token> <marker> <token>te</token> </marker> </pattern> <disambig action="filter" postag="NCMS.*"/> </rule> <rule> <pattern> <token><exception regexp="yes">la|lletra|aquesta|esta|eixa|aqueixa|aquella|una</exception></token> <marker> <token postag="NCFS000">te</token> </marker> </pattern> <disambig action="remove"> <wd pos="NCFS000"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">&exceptions_TE;</token> <token regexp="yes">,|i|o|ni</token> <marker> <token>te</token> </marker> </pattern> <disambig action="filter" postag="NCMS.*"/> </rule> <rule> <pattern> <marker> <token>te</token> </marker> <token regexp="yes">,|i|o|ni</token> <token inflected="yes" regexp="yes">&exceptions_TE;</token> </pattern> <disambig action="filter" postag="NCMS.*"/> </rule> </rulegroup> <rule id="la_volta" name="la Volta"> <pattern> <token>la</token> <marker> <token>Volta</token> </marker> </pattern> <disambig action="remove" postag="NPMS.*"/> </rule> <rule id="IMPOST" name="impost (impondre)"> <pattern> <token><exception inflected="yes">haver</exception></token> <marker> <token postag="NCM[SP]000" postag_regexp="yes" regexp="yes">(pressupost|impost)(s|os)?</token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> 
</rule> <rule id="TEMPLE" name="temple (templar)"> <pattern> <token><exception postag="P0.{6}|PP3CN000|PP3NN000|PP3(MP|F.)A00|PP3CP000|PP3CSD00" postag_regexp="yes"/></token> <marker> <token postag="NCMS000">temple</token> </marker> </pattern> <disambig action="remove"> <wd lemma="templar"/> </disambig> </rule> <rule id="TEMPLES" name="temples (templar)"> <pattern> <token><exception postag="P0.{6}|PP3CN000|PP3NN000|PP3(MS|F.)A00|PP3CP000|PP3CSD00" postag_regexp="yes"/></token> <marker> <token postag="NCMP000">temples</token> </marker> </pattern> <disambig action="remove"> <wd lemma="templar"/> </disambig> </rule> <rule id="CAPRITXOS" name="capritxos"> <pattern> <token>capritxos</token> </pattern> <disambig action="remove"> <wd lemma="capritxo"/> </disambig> </rule> <rule id="COIXOS" name="coixos"> <pattern> <token>coixos</token> </pattern> <disambig action="remove"> <wd lemma="coixo"/> </disambig> </rule> <rule id="ROSSAR" name="rossar/rossejar"> <pattern> <and> <token postag="V.*" postag_regexp="yes" inflected="yes">rossar</token> <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule id="EXPONENT" name="exponent (expondre)"> <pattern> <token><exception inflected="yes" regexp="yes">estar|anar</exception></token> <marker> <token postag="NCMS000">exponent</token> </marker> </pattern> <disambig action="remove" postag="V.G.*"/> </rule> <rule id="DISPOST" name="dispost (dispondre)"> <pattern> <token><exception inflected="yes">haver</exception></token> <marker> <token postag="AQ0..0" postag_regexp="yes" regexp="yes">(in)?dispost(a|es|s|os)?</token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule id="PROPOSTA" name="proposta (propondre)"> <pattern> <marker> <token postag="NCF[SP]000" postag_regexp="yes" regexp="yes">propost(a|es)</token> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule id="CONTENT" name="contenta 
(contentar)"> <pattern> <marker> <token postag="AQ.*" postag_regexp="yes" inflected="yes">content</token> </marker> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule id="TRAVAR_TRAVESSAR" name="travar/travessar"> <pattern> <marker> <and> <token inflected="yes">travessar</token> <token inflected="yes">travar</token> </and> </marker> </pattern> <disambig action="remove"> <wd lemma="travar"/> </disambig> </rule> <rule id="HUMIT" name="humit"> <pattern> <marker> <and> <token regexp="yes">humit|humida|humits|humides</token> <token inflected="yes">humir</token> </and> </marker> </pattern> <disambig action="remove"> <wd lemma="humir"/> </disambig> </rule> <rulegroup id="AIGUA" name="aigua (aiguar?)"> <rule> <pattern> <token regexp="yes">m'|t'|s'|ens|us|vos|li|els|les|hi|n'</token> <marker> <token postag="V.*" postag_regexp="yes">aigua</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <marker> <token postag="N.*" postag_regexp="yes">aigua</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token regexp="yes">m'|t'|s'|ens|us|vos|li|els|l'|hi|n'</token> <marker> <token postag="V.*" postag_regexp="yes">aigües</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <marker> <token postag="N.*" postag_regexp="yes">aigües</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> </rulegroup> <rule id="tornes" name="tornés: verb o adjectiu"> <pattern> <!-- exceptions? 
--> <marker> <token>tornés</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="nit" name="nit: normalment nom femení"> <pattern> <marker> <token postag="NCF.*" postag_regexp="yes" regexp="yes">nits?</token> </marker> </pattern> <disambig action="remove" postag="NCM.*"/> </rule> <rule id="presta" name="presta: verb o adjectiu"> <pattern> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes">presta|prestes|preste</token> </marker> <token postag="NC.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="tesi" name="tesi: nom"> <pattern> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">tesis?</token> </marker> <token postag="A.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule id="premi" name="premi: nom"> <pattern> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">premis?</token> </marker> <token>a</token> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule id="duc" name="duc verb o nom"> <pattern> <token inflected="yes">ser</token> <marker> <token postag="N.*" postag_regexp="yes" regexp="yes">ducs?</token> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="la_seu" name="la seu, la ment: no verb"> <pattern> <token>la</token> <marker> <token regexp="yes">seu|ment</token> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rulegroup id="seu_episcopal" name="seu: nom"> <rule> <pattern> <token postag="N.*" postag_regexp="yes" regexp="yes">seus?</token> <token postag="AQ.[CF].*" postag_regexp="yes" regexp="yes" inflected="yes">episcopal|territorial|arquebisbal|catòlic|electrònic</token> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token postag="N.*" postag_regexp="yes" regexp="yes">seus?</token> <token postag="AQ.[CF].*" postag_regexp="yes" regexp="yes" 
inflected="yes">episcopal|territorial|arquebisbal|catòlic|electrònic</token> <token postag="AQ.[CF].*" postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> </rulegroup> <rule id="de_manera_adj" name="de manera expressa"> <pattern> <token>de</token> <token>manera</token> <marker> <and> <token postag="AQ.[CF][SN]." postag_regexp="yes"/> <token postag="[^A].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="A.*"/> </rule> <rulegroup id="mig_adverbi" name="mig_adverbi"> <rule> <pattern> <token postag="VA.*" postag_regexp="yes"/> <marker> <token>mig</token> </marker> <token postag="V.[NP].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule> <pattern> <marker> <token postag="&pronom_feble;" postag_regexp="yes"><exception>en</exception></token> <token postag="RG">mig</token> </marker> <token postag="V.[SI].*" postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> </rulegroup> <rule id="masses" name="masses (incorrecte)"> <pattern> <token regexp="yes">masses|un|uns</token> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">mentida|dificultat|pecat|dada</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <!-- ser + participi--> <rulegroup id="ser_participi" name="ser + participi"> <rule> <pattern> <token postag="V.[NISM].*" postag_regexp="yes" inflected="yes">ser</token> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">mentida|dificultat|pecat|dada</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token postag="V.P.*" postag_regexp="yes" inflected="yes">ser</token> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">mentida|pecat</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <token postag="V.[NISM].*" postag_regexp="yes" 
inflected="yes" regexp="yes">ser|estar|venir</token> <marker> <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token> </marker> </unify> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <token><exception postag="DA0[MC]S.*|SPS00" postag_regexp="yes"/></token> <unify> <feature id="nombre"/> <marker> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">ser|estar|venir</token> </marker> <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token> </unify> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <token postag="DA0[MC]S.*" postag_regexp="yes"/> <unify> <feature id="nombre"/> <marker> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">ser|estar|venir</token> </marker> <token postag="V.P00P..?|V.P00.F.?" postag_regexp="yes"/> </unify> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <marker> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">ser|estar|venir<exception postag="V.P.*" postag_regexp="yes"/></token> <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token> </marker> </unify> </pattern> <disambig action="add"> <wd pos="_GV_"/> <wd pos="_GV_"/> </disambig> </rule> <rule> <!--fora possible--> <pattern> <marker> <token inflected="yes">ser</token> </marker> <token>possible</token> </pattern> <disambig action="filter" postag="VS.*"/> </rule> </rulegroup> <rule id="paperina" name="fer el paperina"> <pattern> <token inflected="yes" skip="4">fer</token> <token>el</token> <marker> <token>paperina</token> </marker> </pattern> <disambig action="replace" postag="NCMS000"/> </rule> <rulegroup id="SENTAR" name="sentar/sentir"> <rule> <pattern> <token regexp="yes">se|es</token> <marker> <token>senta</token> </marker> <token postag="RG.*|LOC_ADV" postag_regexp="yes" min="0" max="3"/> <token postag="V.P.*|A.*" postag_regexp="yes"/> 
</pattern>
      <disambig action="remove">
        <wd lemma="sentar"/>
      </disambig>
    </rule>
    <rule>
      <!-- "senta (+ up to three adverbs) que": drop the readings whose lemma is "sentar". -->
      <pattern>
        <marker>
          <token>senta</token>
        </marker>
        <token postag="RG.*|LOC_ADV" postag_regexp="yes" min="0" max="3"/>
        <token>que</token>
      </pattern>
      <disambig action="remove">
        <wd lemma="sentar"/>
      </disambig>
    </rule>
  </rulegroup>
  <rulegroup id="dur_a_terme" name="dur a terme">
    <!-- Fixed verbal expressions. Original author note: plantar cara, posar/tenir/estar/mantenir al corrent -->
    <rule>
      <!-- dur/portar/cridar + a + terme/consulta: add a _GV_ reading to the noun. -->
      <pattern>
        <token regexp="yes" inflected="yes">dur|portar|cridar</token>
        <token>a</token>
        <marker>
          <token inflected="yes" regexp="yes">terme|consulta</token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
      </disambig>
    </rule>
    <rule>
      <!-- estar/posar + d' + acord: add a _GV_ reading to "acord". -->
      <pattern>
        <token regexp="yes" inflected="yes">estar|posar</token>
        <token>d'</token>
        <marker>
          <token>acord</token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
      </disambig>
    </rule>
    <rule>
      <!-- fer + falta: "falta" keeps only its non-verb readings. -->
      <pattern>
        <token inflected="yes">fer</token>
        <marker>
          <token>falta</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="[^V].*"/>
    </rule>
    <rule>
      <!-- fer + falta: add a _GV_ reading to both tokens (one wd per marked token). -->
      <pattern>
        <marker>
          <token inflected="yes">fer</token>
          <token>falta</token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
        <wd pos="_GV_"/>
      </disambig>
    </rule>
    <rule>
      <!-- donar + origen/dret: add a _GV_ reading to both tokens. -->
      <pattern>
        <marker>
          <token inflected="yes">donar</token>
          <token regexp="yes">origen|dret</token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
        <wd pos="_GV_"/>
      </disambig>
    </rule>
    <rule>
      <!-- donar + veu: "veu" keeps only its noun readings. -->
      <pattern>
        <token inflected="yes">donar</token>
        <marker>
          <token>veu</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="N.*"/>
    </rule>
    <rule>
      <!-- donar + de + baixa: "baixa" keeps only its noun readings. -->
      <pattern>
        <token inflected="yes">donar</token>
        <token>de</token>
        <marker>
          <token>baixa</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="N.*"/>
    </rule>
    <!-- No separate "donar de baixa" add rule here: the _GV_ reading for "baixa" is added by the
         "donar + de|d' + alta|baixa" rule further down in this rulegroup, which matches the same input. -->
    <rule>
      <pattern>
        <token inflected="yes" regexp="yes">posar|ficar</token> 
<token>en</token> <marker> <token regexp="yes">dubte|qüestió|pràctica|valor|marxa|escena|servei|servici|contacte|camí|funcionament</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">deixar|posar</token> <token regexp="yes">a|de</token> <marker> <token regexp="yes">part|banda</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <rule> <pattern> <token inflected="yes">estar</token> <token>a</token> <token spacebefore="no">l</token> <marker> <token inflected="yes">corrent</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <rule> <pattern> <token inflected="yes">donar</token> <token regexp="yes">de|d'</token> <marker> <token regexp="yes">alta|baixa</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <rule> <pattern> <token inflected="yes">matar</token> <token>de</token> <marker> <token regexp="yes">fam|gana|set|son</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> </rulegroup> <rule id="PORTAR_PRESSA" name="portar pressa"> <pattern> <marker> <token inflected="yes" postag="V.*" postag_regexp="yes" regexp="yes">donar|portar</token> <token postag="NCFS000">pressa</token> </marker> </pattern> <disambig action="filterall"/> </rule> <rule id="DONAR" name="donar"> <pattern> <marker> <token inflected="yes" postag="V.*" postag_regexp="yes">donar</token> </marker> <token regexp="yes">part|sentit|importància</token> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="seguit_nom" name="seguit: nom no participi"> <pattern> <token postag="D..MS.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes">seguit</token> </pattern> <disambig action="filterall"/> </rule> <rule id="deure_infinitiu" name="deure + infinitiu"> <pattern> <token postag="V.*" postag_regexp="yes" inflected="yes">deure</token> <token postag="V.N.*" 
postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> <rule id="mesos" name="mesos no participi del verb metre"> <pattern> <token>mesos</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <!-- haver + participi. mogut per "han després/desprès"--> <rulegroup id="haver_participi" name="haver + participi"> <antipattern> <token postag="NC[MC][SN]000" postag_regexp="yes"><exception postag="RG|V.P.*|P.*" postag_regexp="yes"/><exception inflected="yes">haver</exception></token> <token postag="V.P..SM." postag_regexp="yes"/> </antipattern> <antipattern> <token postag="D..[MC][SN]." postag_regexp="yes"><exception inflected="yes">haver</exception></token> <token postag="V.P..SM." postag_regexp="yes"/> </antipattern> <antipattern> <token postag="NC[FC][SN]000|D..[FC][SN]." postag_regexp="yes"><exception postag="RG|V.P.*" postag_regexp="yes"/><exception inflected="yes">haver</exception></token> <token postag="V.P..SF." postag_regexp="yes"/> </antipattern> <antipattern> <token postag="NC[MC][PN]000|D..[MC][PN]." postag_regexp="yes"><exception postag="RG|V.P.*" postag_regexp="yes"/><exception inflected="yes">haver</exception></token> <token postag="V.P..PM." postag_regexp="yes"/> </antipattern> <antipattern> <token postag="NC[FC][PN]000|D..[FC][PN]." postag_regexp="yes"><exception postag="RG|V.P.*" postag_regexp="yes"/><exception inflected="yes">haver</exception></token> <token postag="V.P..PF." postag_regexp="yes"/> </antipattern> <rule> <pattern> <token inflected="yes">haver</token> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes" regexp="yes">sortida|eixida|entrada</token> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <!-- elimina 'hajar' --> <rule> <pattern> <and> <token inflected="yes">hajar</token> <token inflected="yes">haver</token> </and> </pattern> <disambig action="remove"> <wd lemma="hajar"/> </disambig> </rule> <rule> <!-- excepcions: hi ha necessitat. 
There may be ambiguities, e.g. "s'hi havia calat foc" --> <pattern> <token><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception><exception regexp="yes">ella?</exception><exception postag="NP.*|_GN_.*" postag_regexp="yes"/></token> <token>hi</token> <token postag="VA..3S.." postag_regexp="yes" inflected="yes">haver</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*" postag_regexp="yes"/> </and> </marker> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="N.*"/> </rule> <rule> <!-- "hi" + 3rd person singular of haver + a word that is both noun and participle (and is not in the exception list): remove the participle reading --> <pattern> <token><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception><exception regexp="yes">ella?</exception><exception postag="NP.*|_GN_.*" postag_regexp="yes"/></token> <token>hi</token> <token postag="VA..3S.." postag_regexp="yes" inflected="yes">haver</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*" postag_regexp="yes"><exception regexp="yes">pres|dits?|ratllats?|escrits?|fets?|acabats?|col·locats?|duta|portada|dutes|portades|deixats?|deixad(a|es)|estat|posat|trobat|afegit</exception></token> </and> </marker> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <!-- exceptions, e.g. "no hi va haver necessitat": after "haver -hi", keep only the non-verb readings --> <pattern> <token>haver</token> <token>-hi</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*" postag_regexp="yes"><exception regexp="yes">pres|dits?|ratllats?|escrits?|fets?|acabats?|col·locats?|duta|portada|dutes|portades|deixats?|deixad(a|es)|estat|posat|trobat</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule> <!-- exceptions, e.g. "no hi va haver necessitat" --> <pattern> <token>hi</token> <token regexp="yes">van?|varen</token> <token>haver</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*" postag_regexp="yes"><exception
regexp="yes">pres|dits?|ratllats?|escrits?|fets?|acabats?|col·locats?|duta|portada|dutes|portades|deixats?|deixad(a|es)|estat|posat</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule> <!-- permet comprovar errors amb 'heure': hagueu fet --> <pattern> <token inflected="yes">heure<exception inflected="yes">haver</exception></token> <marker> <token postag="V.P.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <marker> <token inflected="yes" skip="6" postag="V.*" postag_regexp="yes">haver<exception scope="next" postag="V.[GN].*" postag_regexp="yes"/></token> </marker> <token postag="V.P.*" postag_regexp="yes"><exception scope="previous" postag="SPS00"/></token> </pattern> <disambig action="filter" postag="VA.*"/> <example type="untouched">Han de dit que sí.</example> </rule> <rule> <!-- no filtra les etiquetes de V.P. quan el participi està separat per a evitar falses alarmes --> <pattern> <token><exception>hi</exception></token> <token><exception>hi</exception></token> <token inflected="yes" postag="V.*" postag_regexp="yes">haver</token> <marker> <token postag="V.P.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <token postag="SENT_START"/> <token inflected="yes" postag="V.*" postag_regexp="yes">haver</token> <marker> <token postag="V.P.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <!--<token skip="1">hi</token>--> <token inflected="yes" postag="V.*" postag_regexp="yes">haver</token> <marker> <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token> </marker> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <marker> <!--<exception scope="next" postag="_GV_|_PUNCT_CONT|P.*|R.*|.*LOC_ADV.*|V.*|SENT_END|[CNDAS].*|complement" postag_regexp="yes" negate_pos="yes"/> --> 
<token inflected="yes" skip="6" postag="V.*" postag_regexp="yes">haver<exception scope="next" postag="V.[GN].*|VA[^P].*" postag_regexp="yes"/><exception scope="next" inflected="yes">molt</exception></token>
        </marker>
        <!-- The participle is rejected when the preceding token is a form of
             ser, estar, continuar, seguir, mantenir or romandre, or is tagged SPS00. -->
        <token postag="V.P.*" postag_regexp="yes"><exception scope="previous" inflected="yes" regexp="yes">ser|estar|continuar|seguir|mantenir|romandre</exception><exception scope="previous" postag="SPS00"/></token>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_" lemma="haver"/>
      </disambig>
      <example type="untouched">Han de dit que sí.</example>
    </rule>
    <rule>
      <!-- Third-person form of haver + "més que" + participle:
           add a _perfet reading (lemma haver) to the marked participle. -->
      <pattern>
        <token inflected="yes" postag="V...3...." postag_regexp="yes">haver</token>
        <token>més</token>
        <token>que</token>
        <marker>
          <token postag="V.P.*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_perfet" lemma="haver"/>
      </disambig>
    </rule>
    <rule>
      <!-- haver followed, within up to 6 skipped tokens, by a participle: add a _perfet
           reading to haver. Skipped tokens may not be tagged V.G.* or VA[^P].* nor be a
           form of "molt"; the participle may not directly follow a form of ser, estar,
           continuar, seguir, mantenir or romandre, nor a token tagged SPS00. -->
      <pattern>
        <marker>
          <token inflected="yes" skip="6" postag="V.*" postag_regexp="yes">haver<exception scope="next" postag="V.G.*|VA[^P].*" postag_regexp="yes"/><exception scope="next" inflected="yes">molt</exception></token>
        </marker>
        <token postag="V.P.*" postag_regexp="yes"><!--<exception inflected="yes">haver</exception>--><exception scope="previous" inflected="yes" regexp="yes">ser|estar|continuar|seguir|mantenir|romandre</exception><exception scope="previous" postag="SPS00"/></token>
      </pattern>
      <disambig action="add">
        <wd pos="_perfet" lemma="haver"/>
      </disambig>
      <example type="untouched">Han de dit que sí.</example>
    </rule>
    <rule>
      <!-- Same construction, but here the participle is the marked token and receives
           _GV_. Skipped tokens may not be tagged V.G.*, be "de"/"d'" or a form of "molt";
           the participle may not directly follow a form of ser, estar, continuar,
           seguir, mantenir or romandre. -->
      <pattern>
        <token inflected="yes" skip="6" postag="V.*" postag_regexp="yes">haver<exception scope="next" postag="V.G.*" postag_regexp="yes"/><exception scope="next" regexp="yes">de|d'</exception><exception scope="next" inflected="yes">molt</exception></token>
        <marker>
          <token postag="V.P.*" postag_regexp="yes"><exception scope="previous" inflected="yes" regexp="yes">ser|estar|continuar|seguir|mantenir|romandre</exception></token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
</disambig> </rule> <!-- <rule> <pattern> <token postag="VA.*" postag_regexp="yes" inflected="yes" skip="5">anar<exception scope="next" postag="_GV_|_PUNCT_CONT|R.*|.*LOC_ADV.*|V.N.*|SENT_END|[NA].*|complement" postag_regexp="yes" negate_pos="yes"/></token> <marker> <token postag="V.N.*" postag_regexp="yes"></token> </marker> </pattern> <disambig action="add"><wd pos="_GV_"></wd> </disambig> </rule> --> <rule id="degut_participi" name="degut (participi)"> <pattern> <token inflected="yes" skip="5" regexp="yes">ser|semblar|parèixer<exception scope="next" postag="V.[GN].*|A.*" postag_regexp="yes"/></token> <marker> <token postag="V.P.*" postag_regexp="yes">degut</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <!-- encadena amb conjunció --> <rule id="haver_participi_i_participi" name="haver + participi + i/o/ni + participi"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <and> <token postag="V.P.*" postag_regexp="yes"/> <token postag="_GV_"/> </and> <token regexp="yes">i|o|ni</token> <marker> <token postag="V.P.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <!-- haver + estat + participi --> <rule> <pattern> <token inflected="yes">haver</token> <token postag="V.P.*" postag_regexp="yes" inflected="yes">ser</token> <marker> <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token> </marker> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <token inflected="yes">haver</token> <token postag="V.P.*" postag_regexp="yes" inflected="yes">ser</token> <marker> <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> </rulegroup> <rule id="la_resta" name="la resta"> <!-- Excepció a la regla següent --> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token regexp="yes" 
inflected="yes">el|un</token>
        <marker>
          <token inflected="yes">resta</token>
        </marker>
        <token postag="V.P.*" postag_regexp="yes"/>
      </unify>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <rule id="venir_gerundi" name="venir gerundi (construcció incorrecta)">
    <!-- venir/portar/dur + gerund: keep only the readings that match the pattern on both
         tokens. Not applied inside "preposition + optional determiner + noun". -->
    <antipattern>
      <token postag="SPS00"/>
      <token min="0" postag="D.*" postag_regexp="yes"/>
      <token postag="N.*" postag_regexp="yes"/>
    </antipattern>
    <pattern>
      <marker>
        <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">venir|portar|dur</token>
        <token postag="V.G.*" postag_regexp="yes"><exception postag="SPS00"/></token>
      </marker>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- restar + participle -->
  <rulegroup id="restar_participi" name="restar + participi">
    <rule>
      <!-- A special case is still missing for: haver quedat + participle.
           Non-participle form of quedar/restar + participle agreeing in number:
           keep only the matching readings. "després" is excluded from the participle slot. -->
      <pattern>
        <unify>
          <feature id="nombre"/>
          <marker>
            <token postag="V.[^P].*" postag_regexp="yes" inflected="yes" regexp="yes">quedar|restar</token>
            <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token>
          </marker>
        </unify>
      </pattern>
      <disambig action="filterall"/>
    </rule>
    <rule>
      <!-- Same pattern: tag both tokens as _GV_. "després" is excluded here as well, so
           that "queda després" does not receive _GV_ (the DESPRES rule skips tokens
           already carrying _GV_). -->
      <pattern>
        <unify>
          <feature id="nombre"/>
          <marker>
            <token postag="V.[^P].*" postag_regexp="yes" inflected="yes" regexp="yes">quedar|restar</token>
            <token postag="V.P.*" postag_regexp="yes"><exception>després</exception></token>
          </marker>
        </unify>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
        <wd pos="_GV_"/>
      </disambig>
    </rule>
  </rulegroup>
  <rule id="tornar_a_inf" name="tornar a + infinitiu">
    <!-- tornar + "a" + infinitive, not preceded by a token tagged SPS00:
         keep only the verb readings of tornar. -->
    <pattern>
      <token><exception postag="SPS00"/></token>
      <marker>
        <token inflected="yes">tornar</token>
      </marker>
      <token>a</token>
      <token postag="V.N.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="V.*"/>
  </rule>
  <rule id="ull_mig_aclucat" name="ull mig (adv) aclucat">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token postag="N.*" postag_regexp="yes"><exception regexp="yes">troba|queda|era</exception></token>
        <token postag="RG.*" postag_regexp="yes">mig</token>
<token postag="V.P.*|AQ.[^C][^N].*" postag_regexp="yes"/> </unify> </pattern> <disambig action="unify"/> </rule> <rule id="FOS" name="Fos (verb ser)"> <!-- És molt comú com a verb. Cal buscar excepcions específiques: metall fos, etc. --> <pattern> <token><exception regexp="yes">metall|alumini|nucli|ferro|zinc|sílex|quars|material|coure|bronze|llum</exception></token> <marker> <token postag="VS.*" postag_regexp="yes">fos<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="VS.*|_GV_|.*LOC.*"/> </rule> <rule id="fes_no_fendre" name="fes no participi del verb fendre"> <pattern> <marker> <token postag="V.*" postag_regexp="yes">fes<exception postag="_GV_"/></token> </marker> </pattern> <disambig action="filter" postag="V.[^P].*"/> </rule> <rule id="marxa" name="marxa (nom)"> <pattern> <token inflected="yes">anar</token> <marker> <token>marxa</token> </marker> <token regexp="yes">enrere|arrere|endarrere</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rulegroup id="nVerb0" name="no verb"> <rule> <pattern> <marker> <and> <token postag="V.*" postag_regexp="yes" regexp="yes">punta|puntes|davall|només|noms?<exception postag="_GV_"/></token> <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule> <antipattern> <token postag_regexp="yes" postag="&pronom_feble;"><exception>el</exception></token> <token postag="V.[IS].*" postag_regexp="yes"/> </antipattern> <pattern> <marker> <and> <token postag="V.*" postag_regexp="yes" regexp="yes">projecte|nou|nous<exception postag="_GV_"/></token> <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.*"/> </rule> </rulegroup> <rule id="PAS_RN" name="pas (adverbi)"> <pattern> <token>no</token> <token postag="&pronom_feble;" postag_regexp="yes" min="0" max="3"/> <token 
postag_regexp="yes" postag="V.[IS].*"/> <marker> <token postag="RN">pas</token> </marker> </pattern> <disambig action="filter" postag="RN"/> </rule> <rulegroup id="haver_de_infinitiu" name="haver de + infinitiu"> <rule> <pattern> <token inflected="yes">haver</token> <token regexp="yes">de|d'</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <pattern> <marker> <token inflected="yes" skip="6">haver<exception scope="next" postag="V.N.*|VA.*|V.[IS].*" postag_regexp="yes"/><exception postag="_perfet"/></token> <!--<exception scope="next" postag="_GV_|_PUNCT_CONT|P.*|R.*|.*LOC_ADV.*|V.*|SENT_END|[NAS].*|CC|complement" postag_regexp="yes" negate_pos="yes"/> --> </marker> <token regexp="yes">de|d'<exception scope="previous" postag="N.*|_GN_.*" postag_regexp="yes"/></token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_obligacio" lemma="haver"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">haver</token> </marker> <token skip="3">hagut<exception scope="next" postag="V.N.*|VA.*|V.[IS].*" postag_regexp="yes"/></token> <token regexp="yes">de|d'<exception scope="previous" postag="N.*|_GN_.*" postag_regexp="yes"/></token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_obligacio" lemma="haver"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes" skip="1">haver<exception scope="next" postag="V.N.*" postag_regexp="yes"/></token> </marker> <token postag="LOC_ADV" skip="5" regexp="yes">de|d'</token> <token inflected="yes">de</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_obligacio" lemma="haver"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">haver<exception postag="_obligacio"/></token> </marker> <token skip="3" regexp="yes">de|d'</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> 
<disambig action="add"> <wd pos="_obligacio" lemma="haver"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="_obligacio" inflected="yes">haver</token> </marker> </pattern> <disambig action="filter" postag="VA.*|_obligacio|_GV_"/> </rule> </rulegroup> <rulegroup id="NUCLIS_VERBALS" name="nuclis verbals amb noms"> <rule> <pattern> <token inflected="yes" skip="1">posar</token> <token regexp="yes">de|en</token> <marker> <token>relleu</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="1">tenir</token> <token>en</token> <marker> <token>compte</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <token inflected="yes" skip="1">tenir</token> <token>en</token> <marker> <token>compte</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="1">estar</token> <token>d'</token> <marker> <token>acord</token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> </rulegroup> <rulegroup id="NO_PAS" name="no pas"> <rule> <pattern> <token skip="6">no</token> <token postag="V.*|PP.*" postag_regexp="yes"/> <marker> <token>pas</token> </marker> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule> <pattern> <token skip="5">no</token> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <marker> <token>pas</token> </marker> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule> <pattern> <token skip="4">no</token> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <marker> <token>pas</token> </marker> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule> <pattern> <token skip="3">no</token> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" 
postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <marker> <token>pas</token> </marker> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule> <pattern> <token skip="2">no</token> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <token postag="V.*|PP.*" postag_regexp="yes"/> <marker> <token>pas</token> </marker> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule> <pattern> <token>no</token> <marker> <token>pas</token> </marker> </pattern> <disambig action="filter" postag="R.*"/> </rule> </rulegroup> <rulegroup id="haver_hi_auxiliar" name="haver-hi auxiliar"> <rule> <pattern> <token>hi</token> <marker> <token inflected="yes">haver</token> </marker> </pattern> <disambig action="filter" postag="VA.*|_GV_|_perfet|_obligacio"/> </rule> <rule> <pattern> <marker> <token inflected="yes">haver</token> </marker> <token>-hi</token> </pattern> <disambig action="filter" postag="VA.*|_GV_|_perfet|_obligacio"/> </rule> </rulegroup> <rule id="DESPRES" name="després no participi"> <!-- cal una regla per a després/desprès --> <pattern> <marker> <token postag="RG">després<exception postag="_GV_"/></token> </marker> </pattern> <disambig action="filter" postag="RG"/> </rule> <rule id="DESPRES_QUE" name="que (conjunció)"> <pattern> <token regexp="yes">després|abans</token> <marker> <token postag="CS">que</token> </marker> </pattern> <disambig action="filter" postag="CS"/> </rule> <rule id="nous" name="nous + nom plural"> <pattern> <marker> <token>nous</token> </marker> <token postag="N.MP.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="les_nou" name="les nou i"> <pattern> <token>les</token> <marker> <token postag="NCCN000"/> </marker> <token>i</token> </pattern> <disambig action="filter" postag="NCCN000"/> 
</rule> <rule id="nou0" name="nou + nom singular"> <pattern> <marker> <token postag="A.*" postag_regexp="yes">nou</token> </marker> <token postag="N.M[SN].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="A.*"/> </rule> <rule id="el_fa" name="el fa (verb)"> <pattern> <marker> <token postag="PP3MSA00">el</token> <token postag="VMIP3S00">fa</token> </marker> <token postag="RG|LOC_ADV" min="0" max="3" postag_regexp="yes"/> <token postag="A.*|V.*" postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="que_els_deus" name="què els deus (verb)"> <rule> <pattern> <token>què</token> <marker> <token postag="PP3CP000">els</token> <token postag="VMIP2S00">deus</token> </marker> <token regexp="yes">\p{P}</token> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token>què</token> <marker> <token postag="PP3CP000">els</token> <token postag="VMIP2S00">dius</token> </marker> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token>què</token> <marker> <token postag="VMIP2S00">tens</token> </marker> </pattern> <disambig action="filterall"/> </rule> </rulegroup> <rulegroup id="el_pais" name="el país, el domini, l'equilibri (nom)"> <antipattern> <token postag="&pronom_feble;" postag_regexp="yes"/> <token postag="&pronom_feble;" postag_regexp="yes"/> <token postag="V.[SI].*" postag_regexp="yes"/> </antipattern> <antipattern> <token>s</token> <token postag="&pronom_feble;" postag_regexp="yes"/> <token postag="V.[SI].*" postag_regexp="yes"/> </antipattern> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="DA.*" postag_regexp="yes"><exception scope="previous" postag="&pronom_feble;" postag_regexp="yes"/><exception regexp="yes">s'|es</exception></token> <marker> <!--<token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&nom_o_verb;</token>--> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="V.[SI].*" postag_regexp="yes"/> </and> </marker> 
</unify> <token min="0" postag="RN|RG" postag_regexp="yes"/> <token postag="V.[SIP].*|AQ.*|&pronom_feble;" postag_regexp="yes"><exception>objecte</exception></token> </pattern> <disambig action="remove" postag="V.[SIM].*|RG|DI.*|SPS00|PI.*"/> <example type="untouched">Se la veu tranquil·la.</example> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="DA.*" postag_regexp="yes"><exception regexp="yes">s'|es</exception></token> <marker> <!--<token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&nom_o_verb;</token>--> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="V.[SI].*" postag_regexp="yes"/> </and> </marker> </unify> <token regexp="yes">de|d'</token> <token><exception>manera</exception></token> </pattern> <disambig action="remove" postag="V.[SIM].*|RG|DI.*|SPS00|PI.*"/> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="DA.*" postag_regexp="yes"><exception>s'</exception></token> <marker> <!--<token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">&nom_o_verb;</token>--> <and> <token postag="NC.*" postag_regexp="yes"><exception regexp="yes">troba|trobes</exception></token> <token postag="V.[SI].*" postag_regexp="yes"/> </and> </marker> </unify> <token postag="SPS00"/> <token>què</token> </pattern> <disambig action="remove" postag="V.[SIM].*|RG|DI.*|SPS00|PI.*"/> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="D.*" postag_regexp="yes"/> <marker> <token postag="NC.*" postag_regexp="yes" inflected="yes" regexp="yes">queixa|termini|papa1</token> </marker> </unify> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <rule> <!-- en escriptura--> <pattern> <token>en</token> <marker> <token postag="NC.*" postag_regexp="yes" regexp="yes">[aeiou].*</token> </marker> </pattern> <disambig action="remove" postag="V.[MIS].*"/> </rule> </rulegroup> <rule id="PLAURE_PLAGAR" name="plaure/plagar"> 
<pattern> <token postag="&pronom_feble;" postag_regexp="yes"/> <marker> <and> <token inflected="yes">plaure</token> <token inflected="yes">plagar</token> </and> </marker> </pattern> <disambig action="remove"> <wd lemma="plagar"/> </disambig> </rule> <rule id="CREURE_CREAR" name="creure/crear"> <pattern> <marker> <and> <token inflected="yes">creure</token> <token inflected="yes">crear</token> </and> </marker> <token>que</token> </pattern> <disambig action="remove"> <wd lemma="crear"/> </disambig> </rule> <rulegroup id="MONA" name="mona (nom o adjectiu)"> <rule> <pattern> <token postag="RG_anteposat"/> <marker> <and> <token inflected="yes">mona</token> <token inflected="yes">mono2</token> </and> </marker> </pattern> <disambig action="remove"> <wd lemma="mona"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="NC.*" postag_regexp="yes"/> <marker> <and> <token inflected="yes">mona</token> <token inflected="yes">mono2</token> </and> </marker> </unify> </pattern> <disambig action="remove"> <wd lemma="mona"/> </disambig> </rule> </rulegroup> <rule id="SENS" name="sens + nom"> <pattern> <token>sens</token> </pattern> <disambig action="filter" postag="SPS00"/> </rule> <rule id="formar_part" name="formar part, fer fallida"> <pattern> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes" inflected="yes">prendre|formar|fer</token> </marker> <token regexp="yes">part|fallida|malbé|costat</token> </pattern> <disambig action="filter" postag="V.*|_GV_"/> </rule> <rule id="formar_part2" name="formar part"> <pattern> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">formar|fer|ser</token> <marker> <token>part</token> </marker> </pattern> <disambig action="filter" postag="NCFS.*"/> </rule> <rule id="fer_fallida" name="fer fallida"> <pattern> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">declarar|fer</token> <marker> <token>fallida</token> </marker> </pattern> <disambig 
action="filter" postag="NCFS.*"/> </rule> <rulegroup id="VISTA" name="vista"> <!-- tracta la variant valenciana: jo vist| tu vistes, ell vista --> <rule> <pattern> <marker> <token>vist</token> </marker> <token min="0">-</token> <token>i</token> <token min="0">-</token> <token>plau</token> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <rule> <pattern> <token regexp="yes">es|em|el|la|els|les|ens|us|se|me|vos|jo|ell</token> <marker> <token postag="V.*V" postag_regexp="yes">vist</token> </marker> </pattern> <disambig action="filter" postag="V.*V|_GV_"/> </rule> <rule> <pattern> <token regexp="yes">es|em|el|els|les|ens|us|se|me|vos|jo|ell</token> <marker> <token postag="V.*V" postag_regexp="yes">vista</token> </marker> </pattern> <disambig action="filter" postag="V.*V|_GV_"/> </rule> <rule> <pattern> <token regexp="yes">et|te|tu</token> <marker> <token postag="V.*V" postag_regexp="yes">vistes</token> </marker> </pattern> <disambig action="filter" postag="V.*V|_GV_"/> </rule> <rule> <pattern> <marker> <token postag="V.P.*|N.*" postag_regexp="yes" regexp="yes">vist|vista|vistes</token> </marker> </pattern> <disambig action="filter" postag="V.P.*|N.*|_GV_"/> </rule> </rulegroup> <rulegroup id="VIU" name="viu (verb, adj, nom)"> <rule> <pattern> <token>no</token> <token>en</token> <marker> <token postag="VMI.*" postag_regexp="yes">viu</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <token regexp="yes">.*%</token> <marker> <token postag="VMI.*" postag_regexp="yes">viu</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <token><exception>no</exception></token> <token>en</token> <marker> <token postag="N.*" postag_regexp="yes">viu</token> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_"/> </rule> <rule> <pattern> <token postag="V.[^P].*|_GV_" postag_regexp="yes"/> <token regexp="yes">algú|ningú</token> <marker> <token postag="A.*" 
postag_regexp="yes">viu</token> </marker> </pattern> <disambig action="filter" postag="A.*|_GN_"/> <example type="untouched">¿Algú viu a Polònia?</example> </rule> </rulegroup> <rule id="FER" name="verb + fer"> <pattern> <token postag="V.N.*" postag_regexp="yes"/> <marker> <token>fer</token> </marker> </pattern> <disambig action="filter" postag="V.N.*|complement"/> </rule> <rule id="FER2" name="fer + pronom"> <pattern> <marker> <token>fer</token> </marker> <token postag="PP.*|P0.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.N.*|complement"/> </rule> <rule id="FER3" name="fer + infinitiu"> <pattern> <marker> <token postag="V.*" postag_regexp="yes" inflected="yes">fer</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rulegroup id="DIU" name="diu (verb dir)"> <rule> <pattern> <token><exception regexp="yes">el|un|aquest</exception></token> <marker> <token postag="V.[SIG].*" postag_regexp="yes" regexp="yes">diu|deixant</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <token><exception regexp="yes">els|uns|aquests</exception></token> <marker> <token postag="V.[SI].*" postag_regexp="yes">dius</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> </rulegroup> <rule id="dir" name="dir (infinitiu)"> <pattern> <token inflected="yes" regexp="yes" skip="20">escoltar|sentir</token> <marker> <token>dir</token> </marker> </pattern> <disambig action="remove" postag="NCMS000"/> </rule> <rule id="fins_nom" name="fins nom"> <pattern> <token postag="D..MP.|V.P..PM." postag_regexp="yes"/> <token min="0" postag="A..[CM]P." 
postag_regexp="yes"/> <marker> <token>fins</token> </marker> <token>a</token> <token>què</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rulegroup id="fins_preposicio" name="fins preposició"> <rule> <pattern> <marker> <token>fins</token> </marker> <token regexp="yes">a|que|al|als|llavors|aleshores|avui|.*demà|.*ahir|dilluns|dimarts|dimecres|dijous|divendres|dissabte|diumenge|\d+</token> </pattern> <disambig action="filter" postag="SP.*"/> </rule> <rule> <pattern> <marker> <token>fins</token> </marker> <token postag="DN.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="SP.*"/> </rule> </rulegroup> <rule id="sobre_preposicio" name="sobre preposició"> <antipattern> <token>que</token> <token min="0">no</token> <token>sobre</token> </antipattern> <pattern> <marker> <token postag="SPS00">sobre<exception scope="previous" postag="&pronom_feble;" postag_regexp="yes"/></token> </marker> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="SPS00"/> </rule> <rule id="fer_respecte" name="fer/tenir respecte"> <pattern> <token regexp="yes" inflected="yes">mostrar|fer|tenir</token> <marker> <token>respecte</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule id="fer_respecte2" name="fer/tenir respecte"> <pattern> <marker> <token regexp="yes" inflected="yes">mostrar|fer|tenir</token> </marker> <token>respecte</token> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rulegroup id="no_sols" name="no sols"> <rule> <pattern> <token inflected="yes">caldre</token> <token>no</token> <marker> <token>sols</token> </marker> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule> <pattern> <token>no</token> <token inflected="yes">ser</token> <marker> <token>sols</token> </marker> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule> <pattern> <token skip="4">no<exception scope="next" postag_regexp="yes" postag="V...2S.."/></token> <token skip="20" 
postag="V.N.*" postag_regexp="yes"/> <token>sinó</token> <marker> <token>sols</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="RG.*"/> </rule> </rulegroup> <rule id="SOBRE_VERB" name="sobre (verb)"> <pattern> <token>que</token> <marker> <token>sobre</token> </marker> <token postag="PI.*" postag_regexp="yes"/> <token postag="_PUNCT.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rulegroup id="POT" name="pot/pots/vol/vols + infinitiu"> <rule> <pattern> <token>no</token> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes">pot|vol|sol</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">el|[-'].+</exception></token> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes">pot|vol|sol</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">els|[-'].+</exception></token> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes">pots|vols|sols</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <antipattern> <token postag="V.*" postag_regexp="yes"/> <token>no</token> <token>sols</token> <token postag="V.N.*" postag_regexp="yes"/> </antipattern> <pattern> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes">pots?|vols?|sols?</token> </marker> <token postag="V.N.*" postag_regexp="yes"><exception>poder</exception></token> <!-- és un sol poder --> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">poder|voler|saber</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.N.*" postag_regexp="yes"><exception postag="AQ.*" postag_regexp="yes"/></token> <!-- exc. 
el poder militar --> </and> </marker> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <!-- pots llavors pensar, pot no funcionar --> <pattern> <marker> <and> <token regexp="yes">pots?|vols?|sols?</token> <token postag="V.*" postag_regexp="yes"/> </and> </marker> <token postag="RG|RN" postag_regexp="yes"/> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.*"/> </rule> </rulegroup> <rule id="verb_sol" name="verb + sol"> <pattern> <token postag="V.*" postag_regexp="yes"/> <marker> <and> <token postag="V.*" postag_regexp="yes" regexp="yes">sols?</token> <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rulegroup id="CAP1" name="cap: tractament especial (det, adj, nom, adv, verb...)"> <!-- TODO: ampliar cap cabre VMIP1S0 cap cabre VMIP3S0 cap cabre VMM02S0 cap cap DI0CS0 cap cap NCCS000 cap cap NCMS000 cap cap PI0CS000 cap cap SPS00 cap capar VMIP1S0--> <rule> <!-- hi cap --> <pattern> <token>hi</token> <marker> <token>cap</token> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule> <!-- cap home, cap dona, cap cosa --> <pattern> <token><exception postag="D[^R].*|PX.MS.*" postag_regexp="yes"/></token> <marker> <token>cap</token> </marker> <token postag="N..S.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="DI.*"/> </rule> <rule> <pattern> <token><exception postag="D[^R]0MS0|PX.MS.*|SPS00" postag_regexp="yes"/></token> <marker> <token>cap</token> </marker> <token postag="RG.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="S.*"/> </rule> <rule> <pattern> <token postag="SENT_START"/> <marker> <token>cap</token> </marker> <token>a</token> </pattern> <disambig action="filter" postag="S.*"/> </rule> <rule> <pattern> <marker> <token>cap</token> </marker> <token>a</token> <token postag="P[0P].*" postag_regexp="yes"><exception postag="DA.*" 
postag_regexp="yes"/></token>
      </pattern>
      <disambig action="filter" postag="S.*"/>
    </rule>
    <!-- "cap a" not preceded by a P[0P].* / DA.MS. token nor by "no": keep the S.* readings. -->
    <rule>
      <pattern>
        <token><exception postag="P[0P].*|DA.MS." postag_regexp="yes"/><exception>no</exception></token>
        <marker>
          <token>cap</token>
        </marker>
        <token>a</token>
      </pattern>
      <disambig action="filter" postag="S.*"/>
    </rule>
    <!-- "cap" + DD.* token, not preceded by a P[0P].* or RN token: keep the S.* readings. -->
    <rule>
      <pattern>
        <token><exception postag="P[0P].*|RN" postag_regexp="yes"/></token>
        <marker>
          <token>cap</token>
        </marker>
        <token postag="DD.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="S.*"/>
    </rule>
    <!-- "cop(s)/colp(s) de cap": keep the N.* readings. -->
    <rule>
      <pattern>
        <token regexp="yes">col?ps?</token>
        <token>de</token>
        <marker>
          <token>cap</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="N.*"/>
    </rule>
    <!-- "cap" with a PI.* reading before an optional pronoun/RN token and a V.[MSI].* token: keep PI.*. -->
    <rule>
      <pattern>
        <token><exception postag="D.*|PX.*" postag_regexp="yes"/><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].*</exception></token>
        <marker>
          <token postag="PI.*" postag_regexp="yes">cap</token>
        </marker>
        <token postag="P0.{6}|PP3CN000|PP3NN000|PP3CP000|PP3CSD00|RN" postag_regexp="yes" min="0"/>
        <token postag="V.[MSI].*" postag_regexp="yes"/>
        <!-- |PP3..A00 -->
      </pattern>
      <disambig action="filter" postag="PI.*"/>
    </rule>
    <!-- After an SPS00 or LOC_PREP token, "cap" with an N.* reading keeps its N.* / _GN_ readings. -->
    <rule>
      <pattern>
        <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/>
        <marker>
          <token postag="N.*" postag_regexp="yes">cap</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="N.*|_GN_.*"/>
    </rule>
    <rule>
      <!-- abbreviation of "capítols": "cap. 3 i 4" -->
      <pattern>
        <marker>
          <token>cap</token>
        </marker>
        <token spacebefore="no">.</token>
        <token regexp="yes">\d[\d\.,]*</token>
        <token regexp="yes">i|o|,</token>
        <token regexp="yes">\d[\d\.,]*</token>
      </pattern>
      <disambig action="replace">
        <wd lemma="capítol" pos="NCMP000"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- "llavors": keep the RG.* readings unless the neighbouring tokens match the exceptions. -->
  <rule id="llavors" name="llavors">
    <pattern>
      <token><exception postag="D[^R]0FP0" postag_regexp="yes"/></token>
      <marker>
        <token>llavors</token>
      </marker>
      <token><exception postag="AQ.[FC][NP]." 
postag_regexp="yes"/></token>
    </pattern>
    <disambig action="filter" postag="RG.*"/>
  </rule>
  <!-- "bon" + N.MS.* token: keep the A.* readings. -->
  <rule id="bon" name="bon (adj)">
    <pattern>
      <marker>
        <token>bon</token>
      </marker>
      <token postag="N.MS.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="A.*"/>
  </rule>
  <!-- "cop"/"cops" agreeing in gender and number with a preceding D.* or A.* token: keep the non-V readings. -->
  <rule id="COP" name="cop no verb balear">
    <pattern>
      <unify>
        <feature id="genere"/>
        <feature id="nombre"/>
        <token postag="D.*|A.*" postag_regexp="yes"/>
        <marker>
          <token regexp="yes">cops?</token>
        </marker>
      </unify>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <!-- Frequency expressions (e.g. "dues vegades més alt"): the marked tokens are retagged LOC_ADV. -->
  <rulegroup id="LOCUCIONS_FREQUENCIA" name="locucions adverbials de freqüència: dues vegades més alt">
    <!-- "un" + D[IN].* + vegada/volta/... + més|menys|manco + AQ.* or V.P.* token. -->
    <rule>
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <marker>
            <token inflected="yes">un</token>
            <token postag="D[IN].*" postag_regexp="yes"/>
            <token regexp="yes" inflected="yes">vegada|volta|cop|colp|pic|grau|octava|dia|any</token>
          </marker>
        </unify>
        <token regexp="yes">més|menys|manco</token>
        <token postag="AQ.*|V.P.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- DN.* + vegada/volta/... + més|menys|manco + AQ.* or V.P.* token. -->
    <rule>
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <marker>
            <token postag="DN.*" postag_regexp="yes"/>
            <token regexp="yes" inflected="yes">vegada|volta|cop|colp|pic|grau|octava|dia|any</token>
          </marker>
        </unify>
        <token regexp="yes">més|menys|manco</token>
        <token postag="AQ.*|V.P.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- Same with a number written in digits; no agreement check. -->
    <rule>
      <pattern>
        <marker>
          <token regexp="yes">[\d]+</token>
          <token regexp="yes" inflected="yes">vegada|volta|cop|colp|pic|grau|octava|dia|any</token>
        </marker>
        <token regexp="yes">més|menys|manco</token>
        <token postag="AQ.*|V.P.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- DN.* + vegada/volta/... + major/menor/superior/inferior. -->
    <rule>
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <marker>
            <token 
postag="DN.*" postag_regexp="yes"/>
            <token regexp="yes" inflected="yes">vegada|volta|cop|colp|pic|grau|octava|dia|any</token>
          </marker>
        </unify>
        <token regexp="yes">majors?|menors?|superiors?|inferiors?</token>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- un/algun/molt/poc/cada (DI.*) + vegada/volta/... + més|menys + optional RG_anteposat + AQ.* or V.P.* token. -->
    <rule>
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <marker>
            <token postag="DI.*" postag_regexp="yes" inflected="yes" regexp="yes">un|algun|molt|poc|cada</token>
            <token regexp="yes" inflected="yes">vegada|volta|cop|colp|pic|dia</token>
          </marker>
        </unify>
        <token regexp="yes">més|menys</token>
        <token postag="RG_anteposat" min="0"/>
        <token postag="AQ.*|V.P.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- "cada" + vegada/volta/... + "més i més". -->
    <rule>
      <pattern>
        <marker>
          <token>cada</token>
          <token regexp="yes" inflected="yes">vegada|volta|cop|colp|pic|dia</token>
        </marker>
        <token>més</token>
        <token>i</token>
        <token>més</token>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- un/algun/molt/poc/cada (DI.*) + vegada/volta/cop/colp/pic directly before an AQ.* or V.P.* token. -->
    <rule>
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <marker>
            <token postag="DI.*" postag_regexp="yes" inflected="yes" regexp="yes">un|algun|molt|poc|cada</token>
            <token regexp="yes" inflected="yes">vegada|volta|cop|colp|pic</token>
          </marker>
        </unify>
        <token postag="AQ.*|V.P.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- N.* token + un/algun/molt/poc/cada (DI.*) + dia/any + AQ.* or V.P.* token. -->
    <rule>
      <pattern>
        <token postag="N.*" postag_regexp="yes"/>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <marker>
            <token postag="DI.*" postag_regexp="yes" inflected="yes" regexp="yes">un|algun|molt|poc|cada</token>
            <token regexp="yes" inflected="yes">dia|any</token>
          </marker>
        </unify>
        <token postag="AQ.*|V.P.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
  </rulegroup>
  <rulegroup id="PUNTS_CARDINALS" 
name="punts cardinals, sigles">
    <!-- Case-sensitive N/S/E/W/NE/SE/NW/SW after a DA0MS0 token is retagged NCMS000. -->
    <rule>
      <pattern>
        <token postag="DA0MS0"/>
        <marker>
          <token regexp="yes">(?-i)N|S|E|W|NE|SE|NW|SW</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd pos="NCMS000"/>
      </disambig>
    </rule>
    <!-- Second of two such abbreviations separated by exactly one token is retagged NCMS000. -->
    <rule>
      <pattern>
        <token regexp="yes">(?-i)N|S|E|W|NE|SE|NW|SW</token>
        <token/>
        <marker>
          <token regexp="yes">(?-i)N|S|E|W|NE|SE|NW|SW</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd pos="NCMS000"/>
      </disambig>
    </rule>
    <!-- Upper-case "ET" is retagged NCMS000, unless it is followed by an all-caps V.[SIM].* token. -->
    <rule id="ET" name="ET (Estatut dels Treballadors)">
      <antipattern>
        <token>et</token>
        <token postag="V.[SIM].*" postag_regexp="yes" regexp="yes">\p{Lu}+</token>
      </antipattern>
      <pattern case_sensitive="yes">
        <token>ET</token>
      </pattern>
      <disambig action="replace" postag="NCMS000"/>
      <example type="untouched">ET DIC QUE SÍ.</example>
    </rule>
  </rulegroup>
  <!-- C_LLOC: place complements. -->
  <rulegroup id="C_LLOC" name="complements de lloc">
    <!-- dins/davant/sota/... + PX.MS.* token, not preceded by a DA.* token: both tokens become LOC_ADV. -->
    <rule id="dins_meu" name="dins meu">
      <pattern>
        <token><exception postag="DA.*" postag_regexp="yes"/></token>
        <marker>
          <token regexp="yes">dintre|dins|enmig|vora|davant|darrere|damunt|davall|sota|sobre|enfront</token>
          <token postag="PX.MS.*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADV"/>
        <wd pos="LOC_ADV"/>
      </disambig>
    </rule>
    <!-- "casa" + PX.FS.* token: both tokens are retagged _C_LLOC. -->
    <rule id="casa_meua" name="casa meua">
      <pattern>
        <token>casa</token>
        <token postag="PX.FS.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace">
        <wd pos="_C_LLOC"/>
        <wd pos="_C_LLOC"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- "de color" + colour name (+ adjective): every marked token is retagged LOC_ADJ. -->
  <rulegroup id="de_color_x" name="de color x: locució">
    <rule>
      <pattern>
        <marker>
          <token>de</token>
          <token>color</token>
          <token regexp="yes">vermell|verd|blau|taronja|groc|escarlata</token>
          <token postag="AQ.[MC][SN]." 
postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADJ"/>
        <wd pos="LOC_ADJ"/>
        <wd pos="LOC_ADJ"/>
        <wd pos="LOC_ADJ"/>
      </disambig>
    </rule>
    <!-- Three-token variant without the trailing adjective. -->
    <rule>
      <pattern>
        <marker>
          <token>de</token>
          <token>color</token>
          <token regexp="yes">vermell|verd|blau|taronja|groc|escarlata</token>
        </marker>
      </pattern>
      <disambig action="replace">
        <wd pos="LOC_ADJ"/>
        <wd pos="LOC_ADJ"/>
        <wd pos="LOC_ADJ"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- "color panotxa": keep the N.* readings of "panotxa". -->
  <rule id="color_x" name="color x">
    <pattern>
      <token>color</token>
      <marker>
        <token postag="NCFS000">panotxa</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
  <!-- Article + dia/planta/pis/porta + DN.[^F].* token not followed by an NC.P.* token: retag it AQ0CN0. -->
  <rule id="el_dia_deu" name="el dia deu">
    <pattern>
      <unify>
        <feature id="genere"/>
        <token postag="DA0.S0" postag_regexp="yes"/>
        <token regexp="yes">dia|planta|pis|porta</token>
      </unify>
      <marker>
        <token postag="DN.[^F].*" postag_regexp="yes"/>
      </marker>
      <token><exception postag="NC.P.*" postag_regexp="yes"/></token>
    </pattern>
    <disambig action="replace" postag="AQ0CN0"/>
    <example type="untouched">Té al dia <marker>3.245</marker> usuaris.</example>
  </rule>
  <!-- Pairs such as "causa-efecte": keep the non-V readings of the first member. -->
  <rulegroup id="causa_efecte" name="causa-efecte (nom no verb)">
    <rule>
      <pattern>
        <marker>
          <token>causa</token>
        </marker>
        <token regexp="yes">[/i-]</token>
        <token>efecte</token>
      </pattern>
      <disambig action="filter" postag="[^V].*"/>
    </rule>
    <!-- binomi/relació/connexió/... + N.* token + "/", "i" or "-" + N.* token. -->
    <rule>
      <pattern>
        <token inflected="yes" regexp="yes">binomi|relació|connexió|ràtio|associació|aliatge</token>
        <marker>
          <token postag="N.*" postag_regexp="yes"/>
        </marker>
        <token regexp="yes">[/i-]</token>
        <token postag="N.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="[^V].*"/>
    </rule>
  </rulegroup>
  <!-- After a D.* token, the listed words keep only their N.* / _GN_ readings. -->
  <rule id="deliris" name="no verb, nom / verb intransitiu">
    <!-- necessari per a detectar errors de concordança det + nom. N'hi ha altres casos? 
"eclipsi" és semblant, però és transitiu, per tant és possible "que l'eclipsis" -->
    <pattern>
      <token postag="D.*" postag_regexp="yes"/>
      <marker>
        <token regexp="yes">deliris?|objectes?|plaça|places|taula|taules|revista|revistes</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*|_GN_.*"/>
  </rule>
  <!-- Listed words that have a V.* reading plus another reading (and no _GV_ tag): drop the V.* readings. -->
  <rule id="nVerb" name="no verb">
    <pattern>
      <marker>
        <and>
          <token postag="V.*" postag_regexp="yes" regexp="yes">ous?|cables?|embalatges?|alcohol|cilindre|cilindres|missa|coma|comes|meta|metes|menta|humana|humanes|escàs|poeta|poetes|sostre|mida|mides|formatges?|exempta|exemptes|tasca|tasques|membres?|metges?|escasses|sola|soles|suau|descontent|carro|així|mes|pas|espasa|aroma|sorra|nom|sols?|via|vies|arbres?|tres|des|dos|com|res|tal|millor|pitjor|nombres?|entorn|davall|només|noms?<exception postag="_GV_"/></token>
          <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="remove" postag="V.*"/>
  </rule>
  <!-- "fem"/"sabeu" not preceded by a D.* or SPS00 token: drop the non-V readings. -->
  <rule id="Verb" name="verb">
    <pattern>
      <token><exception postag="D.*|SPS00" postag_regexp="yes"/></token>
      <marker>
        <and>
          <token postag="V.*" postag_regexp="yes" regexp="yes">fem|sabeu</token>
          <token postag="V.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="remove" postag="[^V].*"/>
    <example type="untouched">En una pila de <marker>fem</marker>.</example>
  </rule>
  <!-- "mitjana" with both V.* and non-V.* readings, before an SPS00 or punctuation token: keep the non-V readings. -->
  <rule id="mitjana_nVerb" name="mitjana no verb">
    <pattern>
      <marker>
        <and>
          <token postag="V.*" postag_regexp="yes">mitjana</token>
          <token postag="V.*" postag_regexp="yes" negate_pos="yes"/>
        </and>
      </marker>
      <token postag="SPS00|_PUNCT.*" postag_regexp="yes"/>
    </pattern>
    <disambig>
      <match no="1" postag_regexp="yes" postag="[^V].*"/>
    </disambig>
  </rule>
  <!-- "el sou" / "un sou": keep the non-V readings of "sou". -->
  <rule id="el_sou" name="el sou">
    <pattern>
      <token regexp="yes">el|un</token>
      <marker>
        <token>sou</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <!-- "son" after el/un/la/una: keep the readings whose tag does not start with D. -->
  <rule id="el_son" name="el son">
    <pattern>
      <token 
regexp="yes">el|un|la|una</token>
      <marker>
        <token>son</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^D].*"/>
  </rule>
  <!-- "bé" after a form of "fer": keep the RG reading. -->
  <rule id="fer_be" name="fer bé">
    <pattern>
      <token inflected="yes">fer</token>
      <marker>
        <token>bé</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="RG"/>
  </rule>
  <!-- "termini" after curt/llarg/mitjà/mig: keep the NC.* readings. -->
  <rule id="termini" name="curt/llarg/mitjà termini">
    <pattern>
      <token regexp="yes">curt|llarg|mitjà|mig</token>
      <marker>
        <token>termini</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="NC.*"/>
  </rule>
  <!-- "mitja" (A.*) + "dotzena" (N.*): keep only the readings matched by the pattern. -->
  <rule id="mitja_dotzena" name="mitja dotzena">
    <pattern>
      <marker>
        <token postag="A.*" postag_regexp="yes">mitja</token>
        <token postag="N.*" postag_regexp="yes">dotzena</token>
      </marker>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- estanc/semiconductor with an N.* reading, before an N.* token: drop the A.* readings. -->
  <rule id="adjectiu_inusual" name="inusual com a adjectiu davant de nom">
    <pattern>
      <marker>
        <token postag="N.*" postag_regexp="yes" regexp="yes" inflected="yes">estanc|semiconductor</token>
      </marker>
      <token postag="N.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="remove" postag="A.*"/>
  </rule>
  <rulegroup id="AdjInv" name="adjectius invariants només darrere de nom">
    <!-- relacionat amb Grups Nominals. Abans o després? 
La part nord i la sud-->
    <!-- A token with both AQ0CN0 and N.* readings keeps its non-A readings unless the previous token is N.*, DA.*, CC or RG.*. -->
    <rule>
      <pattern>
        <token><exception postag="N.*|DA.*|CC|RG.*" postag_regexp="yes"/></token>
        <!-- exception: la part nord -->
        <marker>
          <and>
            <token postag="AQ0CN0"/>
            <token postag="N.*" postag_regexp="yes"/>
          </and>
        </marker>
      </pattern>
      <disambig action="filter" postag="[^A].*"/>
    </rule>
    <!--
    <rule>
      <pattern>
        <token postag="N.*|DA.*" postag_regexp="yes"><exception postag="N.*|DA.*" postag_regexp="yes" negate_pos="yes"></exception></token>
        <marker>
          <and>
            <token postag="AQ0CN0"></token>
            <token postag="N.*" postag_regexp="yes"></token>
          </and>
        </marker>
      </pattern>
      <disambig action="filter" postag="[^N].*" />
    </rule>
    -->
  </rulegroup>
  <!-- "cal" + V.N.* token: drop the VMIP1S0B reading of "cal". -->
  <rule id="cal_infinitiu" name="cal + infinitiu">
    <pattern>
      <marker>
        <token>cal</token>
      </marker>
      <token postag="V.N.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="remove">
      <wd pos="VMIP1S0B"/>
    </disambig>
  </rule>
  <!-- "entrevista"/"entrevistes" as nouns: drop the V.P.* readings unless the previous token carries the same noun tag. -->
  <rulegroup id="entrevista_no_participi" name="entrevista (no participi)">
    <rule>
      <pattern>
        <token><exception postag="NCFS000"/></token>
        <marker>
          <token postag="NCFS000">entrevista</token>
        </marker>
      </pattern>
      <disambig action="remove" postag="V.P.*"/>
    </rule>
    <rule>
      <pattern>
        <token><exception postag="NCFP000"/></token>
        <marker>
          <token postag="NCFP000">entrevistes</token>
        </marker>
      </pattern>
      <disambig action="remove" postag="V.P.*"/>
    </rule>
  </rulegroup>
  <!-- accedir/accés/equivaler/... + "a" + delegat(s)/mort(s)/...: keep the non-V readings (unless tagged _GV_). -->
  <rule id="NoParticipi" name="no participi, és nom">
    <pattern>
      <token regexp="yes" inflected="yes">accedir|accés|equivaler|equivalent|duel|quant|lluita|lluitar</token>
      <token>a</token>
      <marker>
        <token regexp="yes">delegats?|morts?|llibertats?|capacitats?|continguts?<exception postag="_GV_"/></token>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <!-- VA: choose between the VAIP3S00 and VMIP3S00 readings of "va" before an RG token. -->
  <rulegroup id="VA" name=" va (verb/adj)">
    <!-- "va" + RG + V.N.* token: keep VAIP3S00. -->
    <rule>
      <pattern>
        <marker>
          <token postag="VAIP3S00">va</token>
        </marker>
        <token postag="RG"/>
        <token postag="V.N.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="VAIP3S00"/>
    </rule>
    <!-- "va" + RG otherwise: keep VMIP3S00. -->
    <rule>
      <pattern>
        <marker>
          <token 
postag="VMIP3S00">va</token>
        </marker>
        <token postag="RG"/>
      </pattern>
      <disambig action="filter" postag="VMIP3S00"/>
    </rule>
  </rulegroup>
  <!-- auxiliary verb followed by an infinitive: "va donar" -->
  <rulegroup id="VauxInf" name="Verb auxiliar seguit d'infinitiu">
    <rule>
      <!-- disambiguates "va encendre" and similar: the V.N.* token right after VA.* "anar" keeps its V.N.* readings -->
      <pattern>
        <token postag="VA.*" postag_regexp="yes" inflected="yes">anar</token>
        <token min="0" postag="_QM_OPEN"/>
        <marker>
          <token postag="V.N.*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="filter" postag="V.N.*|_obligacio|_perfet"/>
    </rule>
    <!-- VA.* "anar" with up to 5 skipped tokens (restricted by the scope="next" exception) before a V.N.* token: keep its VA.* readings. -->
    <rule>
      <pattern>
        <marker>
          <token postag="VA.*" postag_regexp="yes" inflected="yes" skip="5">anar<exception scope="next" postag="_QM_OPEN|_GV_|_PUNCT_CONT|R.*|.*LOC_ADV.*|V.N.*|SENT_END|[NA].*|complement|_obligacio|_perfet" postag_regexp="yes" negate_pos="yes"/></token>
        </marker>
        <token postag="V.N.*" postag_regexp="yes"/>
      </pattern>
      <disambig>
        <match no="1" postag_regexp="yes" postag="VA.*"/>
      </disambig>
    </rule>
    <!-- Same context: the V.N.* token keeps its V.N.* readings. -->
    <rule>
      <pattern>
        <token postag="VA.*" postag_regexp="yes" inflected="yes" skip="5">anar<exception scope="next" postag="_QM_OPEN|_GV_|_PUNCT_CONT|R.*|.*LOC_ADV.*|V.N.*|SENT_END|[NA].*|complement|_obligacio|_perfet" postag_regexp="yes" negate_pos="yes"/></token>
        <token min="0" postag="_QM_OPEN"/>
        <marker>
          <token postag="V.N.*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="filter" postag="V.N.*|_obligacio|_perfet"/>
    </rule>
    <!-- Same context: add the _GV_ tag to the "anar" token. -->
    <rule>
      <pattern>
        <marker>
          <token postag="VA.*" postag_regexp="yes" inflected="yes" skip="5">anar<exception scope="next" postag="_QM_OPEN|_GV_|_PUNCT_CONT|R.*|.*LOC_ADV.*|V.N.*|SENT_END|[NA].*|complement|_obligacio|_perfet" postag_regexp="yes" negate_pos="yes"/></token>
        </marker>
        <token min="0" postag="_QM_OPEN"/>
        <token postag="V.N.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
      </disambig>
    </rule>
    <!-- Same context: add the _GV_ tag to the V.N.* token. -->
    <rule>
      <pattern>
        <token postag="VA.*" postag_regexp="yes" inflected="yes" skip="5">anar<exception scope="next" 
postag="_QM_OPEN|_GV_|_PUNCT_CONT|R.*|.*LOC_ADV.*|V.N.*|SENT_END|[NA].*|complement|_obligacio|_perfet" postag_regexp="yes" negate_pos="yes"/></token>
        <token min="0" postag="_QM_OPEN"/>
        <marker>
          <token postag="V.N.*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- era_nom: contexts in which "era" keeps only its N.* / _GN_ readings. -->
  <rulegroup id="era_nom" name="era (nom)">
    <!-- Agreeing determiner/adjective/participle + "era" + NP.* or _possible_nompropi token. -->
    <rule>
      <pattern>
        <unify>
          <feature id="nombre"/>
          <feature id="genere"/>
          <token postag="D[^R].*|A.*|V.P.*" postag_regexp="yes"/>
          <marker>
            <token postag="N.*" postag_regexp="yes">era</token>
          </marker>
        </unify>
        <token postag="NP.*|_possible_nompropi" postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="N.*|_GN_.*"/>
    </rule>
    <!-- Agreeing determiner/adjective/participle + "era" + up to 3 weak-pronoun/RN tokens + a token whose only readings are V.[MSI].*. -->
    <rule>
      <pattern>
        <unify>
          <feature id="nombre"/>
          <feature id="genere"/>
          <token postag="D[^R].*|A.*|V.P.*" postag_regexp="yes"/>
          <marker>
            <token postag="N.*" postag_regexp="yes">era</token>
          </marker>
        </unify>
        <token min="0" max="3" postag="&pronom_feble;|RN" postag_regexp="yes"/>
        <token postag="V.[MSI].*" postag_regexp="yes"><exception negate_pos="yes" postag="V.[MSI].*" postag_regexp="yes"/></token>
      </pattern>
      <disambig action="filter" postag="N.*|_GN_.*"/>
    </rule>
    <!-- An unambiguous V.[MSI].* / _GV_ token earlier in the sentence, then (within the skip limits) feminine singular determiners/adjectives/participles + "era". -->
    <rule>
      <pattern>
        <token postag="SENT_START" skip="-1"><exception scope="next" regexp="yes">que|si</exception></token>
        <token postag="V.[MSI].*|_GV_" postag_regexp="yes" skip="6"><exception negate_pos="yes" postag="V.[MSI].*|_GV_" postag_regexp="yes"/><exception scope="next" regexp="yes">com|perquè|que|/</exception><exception postag="_PUNCT.*|C.*|PR.*|PT.*|DT.*|.*LOC_CONJ.*|_loc_unavegada" postag_regexp="yes" scope="next"/></token>
        <token max="4" postag="D[^R].FS.|A..[FC][SN].|V.P..SF." 
postag_regexp="yes"/>
        <marker>
          <token postag="N.*" postag_regexp="yes">era</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="N.*|_GN_.*"/>
    </rule>
    <!-- Variant with an additional D[^R].FS. token between the verb and the tokens that directly precede "era". -->
    <rule>
      <pattern>
        <token postag="SENT_START" skip="-1"><exception scope="next">que</exception></token>
        <token postag="V.[MSI].*|_GV_" postag_regexp="yes" skip="6"><exception negate_pos="yes" postag="V.[MSI].*|_GV_" postag_regexp="yes"/><exception scope="next" regexp="yes">com|perquè|que|/</exception><exception postag="_PUNCT.*|C.*|PR.*|PT.*|DT.*|.*LOC_CONJ.*|_loc_unavegada" postag_regexp="yes" scope="next"/></token>
        <token postag="D[^R].FS." postag_regexp="yes" skip="6"><exception scope="next" regexp="yes">com|perquè|que|/</exception><exception postag="_PUNCT.*|C.*|PR.*|PT.*|DT.*|.*LOC_CONJ.*|_loc_unavegada" postag_regexp="yes" scope="next"/></token>
        <token max="4" postag="D[^R].FS.|A..[FC][SN].|V.P..SF." postag_regexp="yes"/>
        <marker>
          <token postag="N.*" postag_regexp="yes">era</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="N.*|_GN_.*"/>
    </rule>
  </rulegroup>
  <rule id="JA_JA" name="ja: no conjunció. 
Excepcions?">
    <pattern>
      <marker>
        <token>ja</token>
      </marker>
      <token><exception>que</exception></token>
    </pattern>
    <disambig action="filter" postag="[^C].*"/>
  </rule>
  <!-- A token with both V.N.* and NCMS.* readings, followed by a P.* token starting with a hyphen or apostrophe: keep V.N.*. -->
  <rule id="infinitiu_o_nom0" name="infinitiu o nom (previ)">
    <pattern>
      <marker>
        <and>
          <token postag="V.N.*" postag_regexp="yes"/>
          <token postag="NCMS.*" postag_regexp="yes"/>
        </and>
      </marker>
      <token postag="P.*" postag_regexp="yes" regexp="yes">[-'].+</token>
    </pattern>
    <disambig action="filter" postag="V.N.*"/>
  </rule>
  <!-- A form of "propi" agreeing in gender and number with the following NC.* token: keep the AQ.* readings. -->
  <rule id="propi_adj" name="propi (anteposat) és adjectiu">
    <pattern>
      <unify>
        <feature id="genere"/>
        <feature id="nombre"/>
        <marker>
          <token inflected="yes">propi</token>
        </marker>
        <token postag="NC.*" postag_regexp="yes"/>
      </unify>
    </pattern>
    <disambig action="filter" postag="AQ.*"/>
  </rule>
  <!-- MIG_ADJ: contexts in which "mig" keeps only its RG reading. -->
  <rulegroup id="MIG_ADJ" name="mig (adv) + adjectiu: mig morta, mig nu / mig home mig dona">
    <rule>
      <!-- mig + feminine or masculine-plural adjective.
           Adjective tags elsewhere in this file have six characters (AQ0CN0, AQ0MS0, AQ.[MC][SN].),
           so the former seven-character alternatives AQ0FS00|AQ0FP00|AQ0MP00 could not match a whole tag. -->
      <pattern>
        <marker>
          <token postag="RG">mig</token>
        </marker>
        <token postag="AQ0FS0|AQ0FP0|AQ0MP0" postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="RG"/>
    </rule>
    <rule>
      <!-- mig + masculine adjective (explicit word list) -->
      <pattern>
        <marker>
          <token postag="RG">mig</token>
        </marker>
        <token regexp="yes">ple|buit|nu|despullat|vestit|mort|cru|despectiu|sec</token>
      </pattern>
      <disambig action="filter" postag="RG"/>
    </rule>
    <rule>
      <!-- e.g. "mig home mig dona": first "mig" -->
      <pattern>
        <marker>
          <token postag="RG">mig</token>
        </marker>
        <token skip="1"/>
        <token>mig</token>
      </pattern>
      <disambig action="filter" postag="RG"/>
    </rule>
    <!-- Same construction: second "mig". -->
    <rule>
      <pattern>
        <token>mig</token>
        <token skip="1"/>
        <marker>
          <token postag="RG">mig</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="RG"/>
    </rule>
  </rulegroup>
  <rule id="Prep_Inf" name="preposició + infinitiu">
    <!-- torna a encendre. 
Excep: amb poder, de poder, el cap militar-->
    <pattern>
      <token postag="SPS.*" postag_regexp="yes"/>
      <marker>
        <token postag="V.N.*" postag_regexp="yes"><exception regexp="yes">deure|poder|saber|militar</exception></token>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.N.*|complement|_GV_|_perfet|_obligacio"/>
  </rule>
  <!-- "vas" after de/un/el/l and before a V.P.*SM. token: keep the non-V readings. -->
  <rule id="de_vas" name="de vas">
    <!-- exception to the "Anar" rule -->
    <pattern>
      <token regexp="yes">de|un|el|l</token>
      <marker>
        <token>vas</token>
      </marker>
      <token postag="V.P.*SM." postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <!-- VM.* form of "anar" + V.[GP].* token: keep the VM.* / _GV_ readings of "anar". -->
  <rule id="Anar" name="Verb anar seguit de participi i gerundi">
    <pattern>
      <marker>
        <token postag="VM.*" postag_regexp="yes" inflected="yes">anar</token>
      </marker>
      <token postag="V.[GP].*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="VM.*|_GV_"/>
  </rule>
  <!-- VA.* form of "anar" + V.[GP].* token: keep the V.[GP].* / _GV_ readings of the second token. -->
  <rule id="Anar2" name="Verb anar seguit de participi i gerundi">
    <pattern>
      <token postag="VA.*" postag_regexp="yes" inflected="yes">anar</token>
      <marker>
        <token postag="V.[GP].*" postag_regexp="yes"/>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.[GP].*|_GV_"/>
  </rule>
  <!-- sense/poca/anti + "-" + a token with both V.[MSI].* and NC.* readings: keep the non-V readings. -->
  <rule id="sense_poca" name="sense-veu poca-vergonya">
    <pattern>
      <token regexp="yes">sense|poca|anti</token>
      <token>-</token>
      <marker>
        <and>
          <token postag="V.[MSI].*" postag_regexp="yes"/>
          <token postag="NC.*" postag_regexp="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <!-- "fins" (SPS00) + V.P.* form of "passar" agreeing with a following D[^R].* token: keep only the matched readings. -->
  <rule id="fins_passat_el" name="fins passat el">
    <pattern>
      <token postag="SPS00">fins</token>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token postag="V.P.*" postag_regexp="yes" inflected="yes">passar</token>
        <token postag="D[^R].*" postag_regexp="yes"/>
      </unify>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- Preposition + D[AIP].* token + a word with both nominal/adjectival and V.[MSIG].* readings: drop the verb readings. -->
  <rule id="prep_art_nomverb" name="preposició + article + nom/verb">
    <!-- e.g. "pels projectes", "malgrat una llista" -->
    <antipattern>
      <token>tot</token>
      <token>sou</token>
    </antipattern>
    <antipattern>
      <token 
postag="D...S." postag_regexp="yes"/>
      <token postag="PX.*" postag_regexp="yes" min="0"/>
      <token>cap</token>
    </antipattern>
    <pattern>
      <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception postag="RG"/></token>
      <token postag="D[AIP].*" postag_regexp="yes"><exception regexp="yes">es|s'|altres?|altra</exception></token>
      <!-- Require unification or not? (e.g. "amb un tesi", "d'un mitjana") -->
      <marker>
        <and>
          <token postag="NC.*|V.P.*|A.*" postag_regexp="yes"/>
          <token postag="V.[MSIG].*" postag_regexp="yes"><exception regexp="yes">era|fou|va</exception></token>
        </and>
      </marker>
    </pattern>
    <disambig action="remove" postag="V.[MSIG].*"/>
    <example type="untouched">Per a ambdues <marker>fou</marker> decisiva la seva negativa.</example>
    <example type="untouched">i per tant <marker>resta</marker> una tasca de recopilació</example>
    <example type="untouched">també, segons es <marker>baixa</marker>, des de Montsià</example>
    <example type="untouched">El que a uns <marker>va</marker> bé, a altres no.</example>
  </rule>
  <!-- Preposition + D[AIP].* + A.*/PX.*/V.P.* token + a word with both NC.* and V.[MSI].* readings, all agreeing: keep the non-V readings. -->
  <rule id="prep_art_adj_nomverb" name="preposició + article + adj + nom/verb">
    <!-- e.g. "amb la mateixa pasta" -->
    <pattern>
      <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception postag="RG"/></token>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token postag="D[AIP].*" postag_regexp="yes"/>
        <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes"/></token>
        <marker>
          <and>
            <token postag="NC.*" postag_regexp="yes"/>
            <token postag="V.[MSI].*" postag_regexp="yes"><exception regexp="yes">era|fou</exception></token>
          </and>
        </marker>
      </unify>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <!-- hi haver + noun/verb: "Hi ha alzines" -->
  <rulegroup id="haver_nom" name="haver + nom">
    <!-- "hi" + form of "haver" + a token with both V.* and N.* readings (not "era"): keep the non-V readings. -->
    <rule>
      <pattern>
        <token>hi</token>
        <token inflected="yes">haver</token>
        <marker>
          <and>
            <token postag="V.*" postag_regexp="yes"/>
            <token postag="N.*" postag_regexp="yes"><exception>era</exception></token>
          </and>
        </marker>
      </pattern>
      
<disambig action="filter" postag="[^V].*"/>
    </rule>
    <rule>
      <!-- e.g. "no hi haurà mai poder": same as above with an RG token in between -->
      <pattern>
        <token>hi</token>
        <token inflected="yes">haver</token>
        <token postag="RG"><exception postag="[CP].*" postag_regexp="yes"/></token>
        <marker>
          <and>
            <token postag="V.*" postag_regexp="yes"/>
            <token postag="N.*" postag_regexp="yes"><exception>era</exception></token>
          </and>
        </marker>
      </pattern>
      <disambig action="filter" postag="[^V].*"/>
      <example type="untouched">El que hi ha quan toca de peus a terra.</example>
    </rule>
  </rulegroup>
  <!-- tens: verb versus adjective readings of "tens". -->
  <rulegroup id="tens" name="tens (verb/adjectiu)">
    <!-- "el tens" + V.P.* or AQ.* token: drop the A.* readings. -->
    <rule>
      <pattern>
        <token>el</token>
        <marker>
          <token postag="V.*" postag_regexp="yes">tens</token>
        </marker>
        <token postag="V.P.*|AQ.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="remove" postag="A.*"/>
    </rule>
    <!-- A form of "posar" (at most one token skipped) + "tens" tagged AQ0MS0: keep the AQ.* / _GN_ readings. -->
    <rule>
      <pattern>
        <token inflected="yes" skip="1">posar</token>
        <marker>
          <token postag="AQ0MS0">tens</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="AQ.*|_GN_.*"/>
    </rule>
    <!-- A form of "quin" ... N.* token ... "tens" (one skipped token allowed at each step): drop the A.* readings. -->
    <rule>
      <pattern>
        <token inflected="yes" skip="1">quin</token>
        <token postag="N.*" postag_regexp="yes" skip="1"/>
        <marker>
          <token postag="V.*" postag_regexp="yes">tens</token>
        </marker>
      </pattern>
      <disambig action="remove" postag="A.*"/>
    </rule>
  </rulegroup>
  <!-- continuar, seguir, estar, acabar... 
+ gerundi Va continuar ocupant-->
  <!-- Non-participle form of acabar/començar/anar/... + V.G.* token (without the _perfet tag). -->
  <rulegroup id="verb_gerundi" name="verb + gerundi">
    <!-- First keep only the readings matched by the pattern on both tokens. -->
    <rule>
      <pattern>
        <marker>
          <token postag="V.[^P].*" postag_regexp="yes" inflected="yes" regexp="yes">acabar|començar|anar|continuar|seguir|prosseguir|estar</token>
          <token postag="V.G.*" postag_regexp="yes"><exception postag="_perfet"/></token>
        </marker>
      </pattern>
      <disambig action="filterall"/>
    </rule>
    <!-- Then add the _GV_ tag to both tokens. -->
    <rule>
      <pattern>
        <marker>
          <token postag="V.[^P].*" postag_regexp="yes" inflected="yes" regexp="yes">acabar|començar|anar|continuar|seguir|prosseguir|estar</token>
          <token postag="V.G.*" postag_regexp="yes"><exception postag="_perfet"/></token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GV_"/>
        <wd pos="_GV_"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- a gerund with attached weak pronouns is not an adjective -->
  <rule id="GERUNDI" name="Gerundi no adjectiu">
    <pattern>
      <marker>
        <and>
          <token postag="V.G.*" postag_regexp="yes"/>
          <token postag="V.G.*" postag_regexp="yes" negate_pos="yes"><exception postag="_GV_"/></token>
        </and>
      </marker>
      <token postag="P.*" postag_regexp="yes" regexp="yes">-.*</token>
    </pattern>
    <disambig action="filter" postag="V.G.*"/>
  </rule>
  <!-- quan/com/però right after one of the listed punctuation marks: keep the readings whose tag does not start with R. -->
  <rulegroup id="NoAdverbi" name="no adverbi darrere de puntuació">
    <rule>
      <pattern>
        <token regexp="yes">[,;:—–…]</token>
        <marker>
          <token regexp="yes">quan|com|però</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="[^R].*"/>
    </rule>
  </rulegroup>
  <!-- "bastant"/"imponent": drop the V.G.* readings, except for "imponent" + D.* token. -->
  <rule id="BASTANT" name="bastant (no gerundi)">
    <antipattern>
      <token>imponent</token>
      <token postag="D.*" postag_regexp="yes"/>
    </antipattern>
    <pattern>
      <!-- TODO: exceptions -->
      <token regexp="yes">bastant|imponent</token>
    </pattern>
    <disambig action="remove" postag="V.G.*"/>
  </rule>
  <!-- two adverbs together: "una molt ben nodrida"; "molt més assolellada" -->
  <rule id="adv_adv" name="adverbis junts">
    <pattern>
      <marker>
        <token postag="RG_anteposat"/>
      </marker>
      <token postag="RG"/>
      <token postag="A.*|V.P.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="RG.*"/>
  </rule>
<rule id="tot_adjgerund" name="tot + adjectiu/gerundi">
    <!-- "tot" (RG) + a token with both V.G.* and A.* readings: keep V.G.*. (Original note: "tan important".) -->
    <pattern>
      <token postag="RG">tot</token>
      <marker>
        <and>
          <token postag="V.G.*" postag_regexp="yes"/>
          <token postag="A.*" postag_regexp="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.G.*"/>
  </rule>
  <!-- A token with both V.G.* and A.* readings before an NC.P.* token, not preceded by NC.*, SPS00 or D.*: keep V.G.*. -->
  <rule id="adjgerund_nom" name="adjectiu/gerundi + nom">
    <pattern>
      <token><exception postag="NC.*|SPS00|D.*" postag_regexp="yes"/></token>
      <marker>
        <and>
          <token postag="V.G.*" postag_regexp="yes"/>
          <token postag="A.*" postag_regexp="yes"/>
        </and>
      </marker>
      <token postag="NC.P.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="V.G.*"/>
  </rule>
  <!-- "parlant" after an RG_anteposat or LOC_ADV token: keep V.G.*. -->
  <rule id="tecnicament_parlant" name="tècnicament parlant">
    <pattern>
      <token postag="RG_anteposat|.*LOC_ADV.*" postag_regexp="yes"/>
      <marker>
        <token postag="V.G.*" postag_regexp="yes">parlant</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.G.*"/>
  </rule>
  <!-- RG_anteposat or LOC_ADV token + a token with both V.G.* and A.* readings (not "portant"): keep A.*. -->
  <rule id="adv_adjgerund" name="adverbi + adjectiu/gerundi">
    <!-- e.g. "tan important"; skipped when a VM.* form of estar/anar precedes the gerund (see antipattern) -->
    <antipattern>
      <token postag_regexp="yes" postag="VM.*" regexp="yes" skip="3" inflected="yes">estar|anar</token>
      <token min="0" max="3" postag="RG_anteposat|LOC_ADV" postag_regexp="yes"><exception postag="PR.*" postag_regexp="yes"/><exception regexp="yes">tant?</exception></token>
      <token postag="V.G.*" postag_regexp="yes"/>
    </antipattern>
    <pattern>
      <token postag="RG_anteposat|.*LOC_ADV.*" postag_regexp="yes"/>
      <marker>
        <and>
          <token postag="V.G.*" postag_regexp="yes"/>
          <token postag="A.*" postag_regexp="yes"><exception regexp="yes">portant</exception></token>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="A.*"/>
  </rule>
  <!-- "tan"/"tant" (RG_anteposat) + a token with both V.[MIS].* and A.* readings: keep the non-V readings. -->
  <rule id="adv_adjverb" name="adverbi + adjectiu/verb">
    <!-- e.g. "tan complexa", "tant planes de sabana com regions de jungla", "tan baixa com", "tan seré" -->
    <pattern>
      <token postag="RG_anteposat" regexp="yes">tant?</token>
      <marker>
        <and>
          <token postag="V.[MIS].*" postag_regexp="yes"/>
          <token postag="A.*" postag_regexp="yes"/>
          <!-- es contradiu amb 
la regla adv_adj. Potser no és "desambiguable" -->
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <!-- DA.* token + PX.* form of "nostre": keep the PX.* readings. -->
  <rule id="DA_PX" name="article + possessiu(nostre)">
    <pattern>
      <token postag="DA.*" postag_regexp="yes"/>
      <marker>
        <token postag="PX.*" postag_regexp="yes" inflected="yes">nostre</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="PX.*"/>
  </rule>
  <!-- "en aparença": keep the N.* readings of "aparença". -->
  <rule id="en_aparenca" name="en aparença">
    <pattern>
      <token>en</token>
      <marker>
        <token>aparença</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
  <!-- After SENT_START, CC or punctuation, a token with both V.[IS].* and NC.* readings followed by de/entre: keep the non-V readings. -->
  <rule id="verbnom_sentstart" name="verb i nom a principi de frase">
    <!-- e.g. "Copa del món", "Rates de laboratori", "Formes de vida"... "I objectes de valor" -->
    <pattern>
      <token postag="SENT_START|CC|_PUNCT.*" postag_regexp="yes"/>
      <marker>
        <and>
          <token postag="V.[IS].*" postag_regexp="yes"><exception regexp="yes">surts?</exception></token>
          <token postag="NC.*" postag_regexp="yes"/>
        </and>
      </marker>
      <token inflected="yes" regexp="yes">de|entre</token>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
    <!-- e.g. "les dues meitats dreta i esquerra" (A+N+V) -->
  </rule>
  <!-- After a P020S000/P0300000 pronoun and a weak pronoun, the listed words drop their NC.* / AQ.* readings. -->
  <rule id="VerbReflexiu" name="paraules que no són verb reflexiu">
    <pattern>
      <token postag="P020S000|P0300000" postag_regexp="yes"><exception regexp="yes">['-].+</exception></token>
      <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">-.+</exception></token>
      <marker>
        <and>
          <token postag="NC.*|AQ.*" postag_regexp="yes" regexp="yes">suïcidi|persona|persones|digna|dignes?</token>
          <token postag="V.[SI].*" postag_regexp="yes"><exception postag="_GV_"/></token>
        </and>
      </marker>
    </pattern>
    <disambig action="remove" postag="NC.*|AQ.*"/>
  </rule>
  <!-- Without such a pronoun before or after, the listed words keep only their non-V readings. -->
  <rule id="NoVerbReflexiu" name="paraules que no són verb sense pronom (verb reflexiu)">
    <pattern>
      <token><exception postag="P020S000|P0300000" postag_regexp="yes" regexp="yes">[^'-].+</exception></token>
      <marker>
        <and>
          <token postag="NC.*|AQ.*" postag_regexp="yes" 
regexp="yes">adient|fuga|fugues|arrossar|broma|bromes|vergonya|vergonyes|vergonyant|suïcidi|arròs|tinya|tinyes|esperit|salina|salines|persona|persones|olives|oliva|olivar|amiga|amigues|boira|boires|roja|roges|digna|dignes?|octubres?</token>
        <token postag="V.[GMNSI].*" postag_regexp="yes"><exception postag="_GV_"/></token>
      </and>
    </marker>
    <token><exception postag="P020S000|P0300000" postag_regexp="yes" regexp="yes">['-].+</exception></token>
  </pattern>
  <disambig action="filter" postag="[^V].*"/>
</rule>
<rule id="nom_noverb_seguit_de" name="nom no verb seguit de de">
  <!-- Forms of nota/signe/barreja/mescla/taxa followed by "de"/"d'": keep only the non-verb readings.
       The antipattern protects "de [adjective] manera". -->
  <antipattern>
    <token regexp="yes">de|d'</token>
    <token min="0" postag="A..[FC]S." postag_regexp="yes"/>
    <token>manera</token>
  </antipattern>
  <pattern>
    <marker>
      <and>
        <token postag="V.*" postag_regexp="yes"/>
        <token postag="N.*" postag_regexp="yes" regexp="yes" inflected="yes">nota|signe|barreja|mescla|taxa</token>
      </and>
    </marker>
    <token regexp="yes">de|d'</token>
  </pattern>
  <disambig action="filter" postag="[^V].*"/>
</rule>
<rulegroup id="qui_les_porta" name="qui pronom verb 3a persona sing">
  <!-- After "qui"/"que"/"què" plus a pronoun, "hom" or "un", a token with a VM..3S reading keeps only
       its verb readings and the chunk tags listed in the disambig element. -->
  <antipattern>
    <token regexp="yes">la|les</token>
    <token regexp="yes">carbonara|persona|persones</token>
  </antipattern>
  <rule>
    <pattern>
      <token><exception regexp="yes">allò|després|abans|malgrat</exception><exception postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">fer|aconseguir</exception></token>
      <token regexp="yes">qui|que|què<exception postag=".*LOC_CONJ.*" postag_regexp="yes"/></token>
      <token postag="&pronom_feble;" postag_regexp="yes"/>
      <token min="0" postag="_QM_OPEN"/>
      <marker>
        <token postag="VM..3S..?" postag_regexp="yes" regexp="yes">\p{Ll}.*<exception regexp="yes">seu|.+e|tema|fera|país|divisa|nous?|baixa|dona|esquerra|extrema</exception></token>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.*|_GV_|_obligacio|_perfet"/>
  </rule>
  <rule>
    <pattern>
      <token regexp="yes">qui|que|què</token>
      <token>hom</token>
      <marker>
        <token postag="VM..3S..?" postag_regexp="yes"/>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.*|_GV_|_obligacio|_perfet"/>
  </rule>
  <rule>
    <pattern>
      <!-- <token><exception regexp="yes">allò|després|abans</exception></token> -->
      <token regexp="yes">qui|que|què</token>
      <token>un</token>
      <marker>
        <token postag="VM..3S..?" postag_regexp="yes"><exception postag="NC[MC][SN].*" postag_regexp="yes"/></token>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.*|_GV_|_obligacio|_perfet"/>
  </rule>
</rulegroup>
<rulegroup id="molt" name="molt adv">
  <rule>
    <!-- "qui molt [pronoun] verb": "molt" keeps only its RG reading. -->
    <pattern>
      <token>qui</token>
      <marker>
        <token>molt</token>
      </marker>
      <token min="0" max="1" postag="&pronom_feble;" postag_regexp="yes"/>
      <token postag="V.[SI].*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="RG"/>
  </rule>
  <rule>
    <!-- Adverb after a verb and before a preposition, punctuation, plural determiner or conjunction:
         remove the DI0[MC]S0 reading. -->
    <pattern>
      <token postag="V.[SI].*" postag_regexp="yes"/>
      <token min="0" postag="V.[NP].*" postag_regexp="yes"/>
      <marker>
        <token postag="RG.*" postag_regexp="yes"/>
      </marker>
      <token postag="RG.*|LOC_ADV" postag_regexp="yes" min="0" max="4"/>
      <token postag="SP.*|_PUNCT.*|D...P.|CC" postag_regexp="yes"><exception inflected="yes">de</exception></token>
    </pattern>
    <disambig action="remove" postag="DI0[MC]S0"/>
  </rule>
  <rule>
    <!-- Same context, but closed by a token that starts with an uppercase letter. -->
    <pattern>
      <token postag="V.[SI].*" postag_regexp="yes"/>
      <token min="0" postag="V.[NP].*" postag_regexp="yes"/>
      <marker>
        <token postag="RG.*" postag_regexp="yes"/>
      </marker>
      <token postag="RG.*|LOC_ADV" postag_regexp="yes" min="0" max="4"/>
      <token regexp="yes">\p{Lu}.*</token>
    </pattern>
    <disambig action="remove" postag="DI0[MC]S0"/>
  </rule>
</rulegroup>
<!-- Disabled rule, kept for reference (original note: could be generalized...):
  <rule id="el_troba" name="el troba">
    <pattern> <token postag="P.*" postag_regexp="yes">el</token> <token postag="V.*" postag_regexp="yes" regexp="yes">(trob|torn)(a|es)</token> </pattern>
    <disambig action="filterall"/>
  </rule>
-->
<rule id="es_diu" name="es diu Corredor (verb dir)">
  <!-- "diu"/"dius" after a weak pronoun other than "el"/"els": keep only the verb readings. -->
  <pattern>
    <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">els?</exception></token>
    <marker>
      <token postag="V.[^MNGP].*" postag_regexp="yes" regexp="yes">dius?</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rule id="informe" name="informe (nom)">
  <!-- "informe" before "anual": keep only the noun readings (and _GN_ chunk tags). -->
  <pattern>
    <marker>
      <token>informe</token>
    </marker>
    <token>anual</token>
  </pattern>
  <disambig action="filter" postag="N.*|_GN_.*"/>
</rule>
<rulegroup id="estima" name="l'informe estima, estima provat">
  <rule>
    <!-- Word after "informe": keep only the verb readings.
         NOTE(review): the marker also lists "anual", for which a V.* filter looks odd; confirm. -->
    <pattern>
      <token>informe</token>
      <marker>
        <token regexp="yes">estima|anual</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.*"/>
  </rule>
  <rule>
    <!-- "estima" before provat(s)/demostrat(s): keep only the verb readings. -->
    <pattern>
      <marker>
        <token>estima</token>
      </marker>
      <token regexp="yes">provats?|demostrats?</token>
    </pattern>
    <disambig action="filter" postag="V.*"/>
  </rule>
</rulegroup>
<rule id="voltant" name="voltant (nom)">
  <!-- "voltant" after a determiner: keep only the noun readings. -->
  <pattern>
    <token postag="D.*" postag_regexp="yes"/>
    <marker>
      <token>voltant</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="N.*"/>
</rule>
<rule id="son_pare" name="son pare">
  <!-- "pare" after "son" (itself not preceded by a D[^R].* determiner): keep only the non-verb readings. -->
  <pattern>
    <token><exception postag="D[^R].*" postag_regexp="yes"/></token>
    <token>son</token>
    <marker>
      <token>pare</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="[^V].*"/>
</rule>
<rule id="son_germa" name="son germà">
  <!-- Same context with "germà": keep only the noun readings. -->
  <pattern>
    <token><exception postag="D[^R].*" postag_regexp="yes"/></token>
    <token>son</token>
    <marker>
      <token postag="NCMS000">germà</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="N.*"/>
</rule>
<rule id="val" name="val (no nom)">
  <!-- "val" after "quant": keep only the non-noun readings. -->
  <pattern>
    <token>quant</token>
    <marker>
      <token>val</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="[^N].*"/>
</rule>
<rule id="tema" name="tema (nom)">
  <pattern>
    <token
postag="SENT_START"/>
    <token regexp="yes" min="0" max="3">\p{P}</token>
    <marker>
      <token postag="N.*" postag_regexp="yes" inflected="yes">tema</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="N.*"/>
</rule>
<rule id="costa" name="costa (no nom)">
  <!-- "costa" not preceded by a feminine singular determiner or a preposition: keep only the verb readings. -->
  <pattern>
    <token><exception postag="D[^D].FS.|SPS00|LOC_PREP" postag_regexp="yes"/></token>
    <marker>
      <token>costa</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rule id="resulta" name="resulta (no nom)">
  <!-- Same context as rule "costa", applied to "resulta". -->
  <pattern>
    <token><exception postag="D[^D].FS.|SPS00|LOC_PREP" postag_regexp="yes"/></token>
    <marker>
      <token>resulta</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rule id="mostra" name="mostra (no nom)">
  <!-- "mostra" followed by a determiner, adjective or noun: keep only the verb readings.
       The antipattern protects a feminine singular determiner + adjective sequence. -->
  <antipattern>
    <token postag="D..[FC]S." postag_regexp="yes"/>
    <token postag="A..[FC]S." postag_regexp="yes"><exception postag="N.*" postag_regexp="yes"/></token>
  </antipattern>
  <pattern>
    <token><exception postag="D[^D].FS.|SPS00|LOC_PREP" postag_regexp="yes"/></token>
    <marker>
      <token>mostra</token>
    </marker>
    <token postag="[DAN].*" postag_regexp="yes"/>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rule id="si_conjuncio" name="si conjunció">
  <!-- "si" not preceded by "el"/"un" and followed by an adverb, verb or pronoun: keep only the non-noun readings. -->
  <pattern>
    <token><exception regexp="yes">el|un</exception></token>
    <marker>
      <token>si</token>
    </marker>
    <token postag="R.*|V.[MSI].*|PP.*|P0.*" postag_regexp="yes"/>
  </pattern>
  <disambig action="filter" postag="[^N].*"/>
</rule>
<rule id="infinitiu_nomverb_nom0" name="infinitiu + verb/nom + nom">
  <!-- Infinitive + verb/noun word + lowercase common noun: keep only the verb readings.
       Example: "Per a berenar menges pa". -->
  <pattern>
    <token postag="V.N.*" postag_regexp="yes"/>
    <marker>
      <and>
        <token postag="V.[IS].*" postag_regexp="yes"><exception inflected="yes" regexp="yes">nom|persona|ritme</exception><exception regexp="yes">dona|dones</exception></token>
        <token postag="NC.*" postag_regexp="yes"><exception postag="_GN.*|A.*|PX.*|V.P.*|D.*|SPS.*" postag_regexp="yes"/></token>
      </and>
    </marker>
    <token postag="NC.*" postag_regexp="yes" regexp="yes">[\p{Ll}·]+<exception postag="N.*" postag_regexp="yes" negate_pos="yes"/><exception regexp="yes">\d.*|p|propietat|consort|mare|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|estrela|model|hoste|base</exception><exception inflected="yes" regexp="yes">&dies_setmana;</exception></token>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rulegroup id="verb_nomverb0" name="verb + verb/no_verb">
  <!-- After an unambiguous verb, a word that is both a finite verb and noun/adjective/participle/numeral
       keeps only its participle or non-verb readings. -->
  <rule>
    <pattern>
      <token postag="V.[NMIS].*" postag_regexp="yes"><exception postag="V.[NMIS].*|complement" postag_regexp="yes" negate_pos="yes"/><exception>men</exception></token>
      <marker>
        <and>
          <token postag="V.[IS].*" postag_regexp="yes"><exception postag="DI.*" postag_regexp="yes"/></token>
          <!-- example: "no té cap quantitat" -->
          <token postag="NC.*|A.*|V.P.*|DN.*" postag_regexp="yes"><exception regexp="yes">som|era|va|seré|fou|recull|queda|resulta|estic|troba|estaria|estaries</exception></token>
        </and>
      </marker>
      <token><exception postag="P[P0].*" postag_regexp="yes" regexp="yes">['-].+</exception></token>
    </pattern>
    <disambig action="filter" postag="V.P.*|[^V].*"/>
  </rule>
  <rule>
    <!-- verb + verb/non-verb with an adverb in between, e.g. "que fos més escàs" -->
    <pattern>
      <token postag="V.[NMIS].*" postag_regexp="yes"><exception postag="V.[NMIS].*|complement" postag_regexp="yes" negate_pos="yes"/></token>
      <token postag="RG_anteposat"/>
      <marker>
        <and>
          <token postag="V.[IS].*" postag_regexp="yes"><exception postag="DI.*" postag_regexp="yes"/></token>
          <!-- example: "no té cap quantitat" -->
          <token postag="NC.*|A.*|V.P.*|DN.*" postag_regexp="yes"><exception regexp="yes">som|era|va|fou|recull|estic</exception></token>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.P.*|[^V].*"/>
  </rule>
  <rule>
    <!-- with an enclitic pronoun, e.g. "fer-se palesa" -->
    <pattern>
      <token postag="V.[NMIS].*" postag_regexp="yes" skip="1"><exception postag="V.[NMIS].*|complement" postag_regexp="yes" negate_pos="yes"/><exception scope="next" postag="P[P0].*" postag_regexp="yes"
regexp="yes">[^'-].+</exception></token>
      <token postag="P.*" postag_regexp="yes" regexp="yes">['-].+</token>
      <marker>
        <and>
          <token postag="V.[IS].*" postag_regexp="yes"><exception postag="DI.*" postag_regexp="yes"/></token>
          <!-- example: "no té cap quantitat" -->
          <token postag="NC.*|A.*|V.P.*|DN.*" postag_regexp="yes"><exception regexp="yes">era|va|seré|fou|recull|estic</exception></token>
        </and>
      </marker>
      <token><exception postag="P[P0].*" postag_regexp="yes" spacebefore="no"/></token>
    </pattern>
    <disambig action="filter" postag="V.P.*|[^V].*"/>
  </rule>
  <rule>
    <!-- Enclitic pronoun plus a fronted adverb before the ambiguous word. -->
    <pattern>
      <token postag="V.[NMIS].*" postag_regexp="yes" skip="1"><exception postag="V.[NMIS].*|complement" postag_regexp="yes" negate_pos="yes"/></token>
      <token postag="P.*" postag_regexp="yes" regexp="yes">['-].+</token>
      <token postag="RG_anteposat"/>
      <marker>
        <and>
          <token postag="V.[IS].*" postag_regexp="yes"><exception postag="DI.*" postag_regexp="yes"/></token>
          <!-- example: "no té cap quantitat" -->
          <token postag="NC.*|A.*|V.P.*|DN.*" postag_regexp="yes"><exception regexp="yes">era|va</exception></token>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.P.*|[^V].*"/>
  </rule>
</rulegroup>
<rule id="nomverb_verb0" name="verb/no_verb + verb">
  <!-- Verb/non-verb word followed (optionally after weak pronouns or RN) by an unambiguous finite verb:
       remove its gerund and finite-verb readings.
       Example: "Quan no hi era respiràvem més a gust." -->
  <antipattern>
    <token>va</token>
    <token postag="VMIS3S00"/>
  </antipattern>
  <pattern>
    <token><exception postag="&pronom_feble;|RN" postag_regexp="yes"/></token>
    <marker>
      <and>
        <token postag="V.[GIMS].*" postag_regexp="yes"/>
        <token postag="NC.*|A.*|V.P.*|PX.*" postag_regexp="yes"><exception regexp="yes">fan|som|era|creixen</exception></token>
      </and>
    </marker>
    <token min="0" max="3" postag="&pronom_feble;|RN" postag_regexp="yes"><exception regexp="yes">['-].+</exception></token>
    <token postag="V.[SI].*" postag_regexp="yes"><exception postag="V.[MSI].*|_GV_" postag_regexp="yes" negate_pos="yes"/><exception postag="VMIP1S0B"/></token>
  </pattern>
  <disambig action="remove" postag="V.[GMSI].*"/>
</rule>
<rule id="nomverb_verb0b" name="verb/no_verb + verb">
  <!-- Variant: the following token carries the _GV_ chunk tag and is not an infinitive. -->
  <pattern>
    <token><exception postag="RG.*|&pronom_feble;" postag_regexp="yes"/></token>
    <marker>
      <and>
        <token postag="V.[GIMS].*" postag_regexp="yes"><exception postag="_GV_"/></token>
        <token postag="NC.*|A.*|V.P.*" postag_regexp="yes"><exception>creixen</exception></token>
      </and>
    </marker>
    <token postag="_GV_"><exception postag="V.N.*" postag_regexp="yes"/></token>
  </pattern>
  <disambig action="remove" postag="V.[GMSI].*"/>
</rule>
<!-- <rule id="nomverb_nomverb0" name="art det + nom/verb + verb/nom"> la creu estima. El metges estima (inclosos errors). ¿Aquesta deu era sagrada? Eliminada per problema: que els publicà fou. CAL PROVAR.
<pattern> <token postag="DA.*" postag_regexp="yes"></token> <marker> <and> <token postag="V.[MIS].*" postag_regexp="yes"/> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN.*|A.*|PX.*|V.P.*" postag_regexp="yes"/></token> </and> </marker> <and> <token postag="V.[IS].*" postag_regexp="yes"/> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN.*|A.*|PX.*|V.P.*|DI.*" postag_regexp="yes"/></token> </and> </pattern> <disambig action="filter" postag="N.*"></disambig> </rule> -->
<rule id="gerundi_nomverb" name="gerundi + verb/nom">
  <!-- Gerund + word that is both finite verb and common noun: keep only the non-verb readings.
       Examples: "menjant ou", "donant forma". -->
  <pattern>
    <token postag="V.G.*" postag_regexp="yes"><exception postag="_GN_.*|AQ.*" postag_regexp="yes"/><exception regexp="yes">corrent|estudiant</exception></token>
    <marker>
      <and>
        <token postag="V.[IS].*" postag_regexp="yes"><exception regexp="yes">era|eres|fou</exception></token>
        <token postag="NC.*" postag_regexp="yes"><exception postag="A.*|V.P.*" postag_regexp="yes"/></token>
      </and>
    </marker>
  </pattern>
  <disambig action="filter" postag="[^V].*"/>
</rule>
<rule id="tota_la_tarda" name="tota la tarda">
  <!-- Form of "tot" + determiner + noun, unified on number and gender: the noun keeps only non-verb readings. -->
  <pattern>
    <unify>
      <feature id="nombre"/>
      <feature id="genere"/>
      <token postag="DI.*" postag_regexp="yes" inflected="yes">tot</token>
      <token postag="D.*" postag_regexp="yes"/>
      <marker>
        <token postag="N.*" postag_regexp="yes"><exception postag="PX.*|V.P.*" postag_regexp="yes"/></token>
      </marker>
    </unify>
  </pattern>
  <disambig action="filter" postag="[^V].*"/>
</rule>
<rule id="quin_punt" name="quin punt">
  <!-- D[TE].* determiner + agreeing noun: the noun keeps only non-verb readings. -->
  <pattern>
    <unify>
      <feature id="nombre"/>
      <feature id="genere"/>
      <token postag="D[TE].*" postag_regexp="yes"/>
      <marker>
        <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token>
      </marker>
    </unify>
  </pattern>
  <disambig action="filter" postag="[^V].*"/>
</rule>
<rule id="nomverb_nom0" name="nom + verb/nom">
  <!-- Verb/noun word followed by a lowercase common noun: keep only the verb readings.
       Example: "la segona porta accent". Exceptions: "el seu germà", "necessità deu anys".
       The antipatterns protect nouns introduced by a preposition, determiner or possessive, and "forma"/"base". -->
  <antipattern>
    <token postag="SPS00|D[DI].*|PX.*|.*LOC_PREP.*" postag_regexp="yes"/>
    <token min="0" postag="_QM_OPEN"/>
    <token postag="NC.*" postag_regexp="yes"/>
  </antipattern>
  <antipattern>
    <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/>
    <token postag="D.*|PX.*" max="2" postag_regexp="yes"/>
    <token min="0" postag="_QM_OPEN"/>
    <token postag="NC.*" postag_regexp="yes"/>
  </antipattern>
  <antipattern>
    <token postag="D..FS." postag_regexp="yes"/>
    <token regexp="yes">forma|base</token>
  </antipattern>
  <pattern>
    <marker>
      <and>
        <token postag="V.[GIS].*" postag_regexp="yes"><exception inflected="yes" regexp="yes">nom|persona|ritme|sexe</exception><exception postag="VMIP1S0B"/><exception regexp="yes">dona|dones</exception></token>
        <token postag="NC.*" postag_regexp="yes"><exception postag="_GN.*|A.*|PX.*|V.P.*|D.*|SPS.*" postag_regexp="yes"/></token>
      </and>
    </marker>
    <token postag="NC.*" postag_regexp="yes" regexp="yes">[\p{Ll}·]+<exception postag="N.*" postag_regexp="yes" negate_pos="yes"/><exception regexp="yes">\d.*|p|propietat|consort|mare|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|estrela|model|hoste|base|nomes</exception><exception inflected="yes" regexp="yes">&dies_setmana;</exception></token>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rule id="nomadj_verbnomadj_nom" name="nom + verb/nom/adj + nom">
  <!-- Unambiguous noun/adjective + verb/noun/adjective word + lowercase common noun: keep only the verb readings.
       Example: "l'art expressa emocions". Exceptions: "la darrera gran inundació", "la greu doble crisi". -->
  <pattern>
    <token postag="N.*|A.*" postag_regexp="yes"><exception postag="N.*|A.*" postag_regexp="yes" negate_pos="yes"/></token>
    <marker>
      <and>
        <token postag="V.[NIS].*" postag_regexp="yes"><exception regexp="yes">gran|doble|sol|major|lliure|mitjana|quarta</exception></token>
        <token postag="NC.*|A.*|V.P.*" postag_regexp="yes"><exception postag="_GN.*|PX.*|D.*|SPS.*|VMIP1S0B" postag_regexp="yes"/></token>
      </and>
    </marker>
    <token postag="NC.*" postag_regexp="yes" regexp="yes">[\p{Ll}·]+<exception postag="N.*|SENT_END" postag_regexp="yes" negate_pos="yes"/><exception regexp="yes">propietat|consort|mare|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|estrela|model|hoste|base|nomes</exception></token>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rulegroup id="ens_nom" name="ens (nom)">
  <!-- Contexts in which "ens" keeps only its noun readings. -->
  <rule>
    <pattern>
      <token regexp="yes">un|altre|aquest|aqueix|este|eixe|aquell</token>
      <token>nou</token>
      <marker>
        <token postag="N.*" postag_regexp="yes">ens</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*|_GN_.*"/>
  </rule>
  <rule>
    <pattern>
      <token regexp="yes">un|aquest|aqueix|este|eixe|aquell</token>
      <token postag="AQ.MS." postag_regexp="yes"/>
      <marker>
        <token postag="N.*" postag_regexp="yes">ens</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*|_GN_.*"/>
  </rule>
  <rule>
    <pattern>
      <token>l'</token>
      <marker>
        <token postag="N.*" postag_regexp="yes">ens</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*|_GN_.*"/>
  </rule>
  <rule>
    <pattern>
      <marker>
        <token postag="N.*" postag_regexp="yes">ens</token>
      </marker>
      <token postag="V.P..[SP]M.|A..[MC][SPN]."
postag_regexp="yes" regexp="yes" inflected="yes">gestor|crear|territorial|públic|local|metropolità|administratiu|representar|supramunicipal|supraestatal|interestatal|nacional|internacional|provincial|estatal|racional|televisiu|normatiu|autonòmic|polític|institucional|abstracte|parroquial|associatiu|sindical|matemàtic</token>
    </pattern>
    <disambig action="filter" postag="N.*|_GN_.*"/>
  </rule>
  <rule>
    <!-- "ens" after a preposition; the antipattern protects "/a" written without spaces. -->
    <antipattern>
      <token spacebefore="no">/</token>
      <token spacebefore="no">a</token>
    </antipattern>
    <pattern>
      <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/>
      <marker>
        <token>ens</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
  <rule>
    <!-- preposition + determiner (not "tot"/"tots") + "ens" -->
    <pattern>
      <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/>
      <token postag="D[^R].[CM][SP]." postag_regexp="yes"><exception regexp="yes">tots?</exception></token>
      <marker>
        <token>ens</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
  <rule>
    <!-- article + possessive + "ens", not followed by a finite verb or weak pronoun -->
    <pattern>
      <token postag="DA.MS." postag_regexp="yes"/>
      <token postag="PX.*" postag_regexp="yes"/>
      <marker>
        <token>ens</token>
      </marker>
      <token><exception postag="V.[IS].*|&pronom_feble;" postag_regexp="yes"/></token>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
  <rule>
    <!-- "ens de" + determiner + noun/adjective -->
    <pattern>
      <marker>
        <token>ens</token>
      </marker>
      <token>de</token>
      <token postag="D.*" postag_regexp="yes" skip="0"/>
      <token postag="[NA].*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
  <rule>
    <!-- "ens" coordinated with a form of òrgan/comitè/organització -->
    <pattern>
      <marker>
        <token>ens</token>
      </marker>
      <token postag="CC|_PUNCT_CONT" postag_regexp="yes"/>
      <token inflected="yes" regexp="yes">òrgan|comitè|organització</token>
    </pattern>
    <disambig action="filter" postag="N.*"/>
  </rule>
</rulegroup>
<rulegroup id="ens_pronom" name="ens (pronom)">
  <!-- Contexts in which "ens" keeps only its pronoun readings. -->
  <rule>
    <pattern>
      <token postag="RG"/>
      <marker>
        <token postag="P.*" postag_regexp="yes">ens</token>
      </marker>
      <token postag="V.[SI].*|P.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="P.*"/>
  </rule>
  <rule>
    <pattern>
      <marker>
        <token postag="P.*" postag_regexp="yes">ens</token>
      </marker>
      <token postag="V...1P.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="P.*"/>
  </rule>
</rulegroup>
<rule id="PronomNom" name="nom i pronom">
  <!-- Word that is both personal pronoun and noun, not preceded by a D[AID].* determiner or "de":
       keep only the non-noun readings. Examples: jo, mi, la, te, ens. Exception: "de te". -->
  <pattern>
    <token><exception postag="D[AID].*" postag_regexp="yes"/><exception>de</exception></token>
    <marker>
      <and>
        <token postag="PP.*" postag_regexp="yes"/>
        <token postag="N.*" postag_regexp="yes"><exception>te</exception></token>
      </and>
    </marker>
  </pattern>
  <disambig action="filter" postag="[^N].*"/>
</rule>
<rule id="sere" name="seré">
  <!-- "seré" with no finite verb or _GV_ token on either side: keep only the verb readings. -->
  <pattern>
    <token><exception postag="V.[MSI].*|_GV_" postag_regexp="yes"/></token>
    <marker>
      <token postag="V.*" postag_regexp="yes">seré</token>
    </marker>
    <token><exception postag="V.[MSI].*|_GV_" postag_regexp="yes"/></token>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rule id="poc" name="poc (no nom)">
  <!-- "poc" not preceded by a masculine singular determiner and not followed by "que":
       keep only the non-noun readings. -->
  <pattern>
    <token><exception postag="D[^R].MS.*" postag_regexp="yes"/></token>
    <marker>
      <token>poc</token>
    </marker>
    <token><exception>que</exception></token>
  </pattern>
  <disambig action="filter" postag="[^N].*"/>
</rule>
<rule id="doble_moral" name="doble_moral">
  <!-- "doble" as adjective + "moral" as noun: each token keeps only the readings matched here. -->
  <pattern>
    <token postag="A.*" postag_regexp="yes" inflected="yes">doble</token>
    <token postag="N.*" postag_regexp="yes" inflected="yes">moral</token>
  </pattern>
  <disambig action="filterall"/>
</rule>
<rule id="pobre_adj" name="pobre adjectiu">
  <pattern>
    <token postag="A.*" postag_regexp="yes" inflected="yes">pobre</token>
    <token postag="N.*" postag_regexp="yes"><exception postag="V...3S.."
postag_regexp="yes"/></token>
  </pattern>
  <disambig action="filterall"/>
</rule>
<rule id="alt_baix" name="alt/baix adjectius davant de nom">
  <!-- Listed adjectives before an agreeing noun: keep only the adjective readings.
       The antipattern protects weak pronoun + "baixa". -->
  <antipattern>
    <token postag="&pronom_feble;" postag_regexp="yes"/>
    <token>baixa</token>
  </antipattern>
  <pattern>
    <unify>
      <feature id="nombre"/>
      <feature id="genere"/>
      <marker>
        <token postag="AQ.*" postag_regexp="yes" regexp="yes" inflected="yes">alt|baix|doble|principal|gran|pobre</token>
      </marker>
      <token postag="N.*" postag_regexp="yes"/>
    </unify>
  </pattern>
  <disambig action="filter" postag="AQ.*"/>
</rule>
<rule id="corrent_pendent_noms" name="corrent/pendent no adjectius davant d'adjectiu">
  <!-- Listed nouns before an agreeing adjective, participle or NPCN000 token:
       keep only the readings that are neither adjective nor verb. -->
  <pattern>
    <unify>
      <feature id="nombre"/>
      <feature id="genere"/>
      <marker>
        <token postag="N.*" postag_regexp="yes" regexp="yes" inflected="yes">vessant|corrent|pendent|germà|partit|empresa</token>
      </marker>
      <token postag="AQ.*|V.P.*|NPCN000" postag_regexp="yes"/>
    </unify>
  </pattern>
  <disambig action="filter" postag="[^AV].*"/>
</rule>
<rule id="corrent_pendent_noms2" name="corrent/pendent no adjectius darrere d'adjectiu">
  <!-- Determiner + "suau"/"diferent" + vessant/corrent/pendent, unified on number only. -->
  <pattern>
    <unify>
      <feature id="nombre"/>
      <token postag="D[^R].*" postag_regexp="yes"/>
      <token inflected="yes" regexp="yes">suau|diferent</token>
      <!--<exception postag="N.*" postag_regexp="yes"/></token>-->
      <marker>
        <token postag="N.*" postag_regexp="yes" regexp="yes" inflected="yes">vessant|corrent|pendent</token>
      </marker>
    </unify>
  </pattern>
  <disambig action="filter" postag="[^AV].*"/>
</rule>
<rule id="corrent_pendent_adjectius" name="corrent/pendent adjectius darrere de nom">
  <!-- Common noun + one of the listed words read as an agreeing adjective:
       both tokens keep only the readings matched here. -->
  <pattern>
    <unify>
      <feature id="nombre"/>
      <feature id="genere"/>
      <marker>
        <token postag="NC.*" postag_regexp="yes"><exception postag="PX.*|A.*|DN.*" postag_regexp="yes"/><exception regexp="yes">torna|massa|troba|queda|resta</exception></token>
        <token postag="A.*" postag_regexp="yes" regexp="yes" inflected="yes">vessant|corrent|pendent|germà|partit</token>
      </marker>
    </unify>
  </pattern>
  <disambig action="filterall"/>
</rule>
<rule id="corrent_politic" name="corrent polític">
  <!-- "corrent"/"vessant" as noun + "polític" as adjective. -->
  <pattern>
    <token postag="NC.*" postag_regexp="yes" regexp="yes" inflected="yes">corrent|vessant</token>
    <token postag="A.*" postag_regexp="yes" inflected="yes">polític</token>
  </pattern>
  <disambig action="filterall"/>
</rule>
<rule id="adj_costum" name="adj + costum">
  <!-- Adjective before a form of "costum": keep only the adjective readings. -->
  <pattern>
    <marker>
      <token postag="A.*" postag_regexp="yes"/>
    </marker>
    <token inflected="yes">costum</token>
  </pattern>
  <disambig action="filter" postag="A.*"/>
</rule>
<rule id="amic_nom" name="amic nom darrere d'adjectiu">
  <!-- Adjective/possessive/participle (with no noun reading) + agreeing form of "amic" read as noun. -->
  <pattern>
    <unify>
      <feature id="nombre"/>
      <feature id="genere"/>
      <marker>
        <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes"/></token>
        <token postag="N.*" postag_regexp="yes" inflected="yes">amic</token>
      </marker>
    </unify>
  </pattern>
  <disambig action="filterall"/>
</rule>
<rule id="corrent_gerundi" name="corrent (gerundi)">
  <!-- "corrent" after a form of anar/fugir/escapar: keep only the VMG00000 reading. -->
  <pattern>
    <token inflected="yes" regexp="yes">anar|fugir|escapar</token>
    <marker>
      <token postag="VMG00000">corrent</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="VMG00000"/>
</rule>
<rule id="petit" name="petit: adjectiu davant de nom">
  <!-- Forms of petit/màxim/mínim/major/menor before a noun: keep only the adjective readings. -->
  <antipattern>
    <!-- ambiguous -->
    <token>a</token>
    <token>l</token>
    <token>màxim</token>
  </antipattern>
  <pattern>
    <marker>
      <token postag="AQ.*" postag_regexp="yes" inflected="yes" regexp="yes">petit|màxim|mínim|major|menor</token>
    </marker>
    <token postag="N.*" postag_regexp="yes"/>
  </pattern>
  <disambig action="filter" postag="AQ.*"/>
  <example type="untouched">Delegarà al màxim funcions i responsabilitats.</example>
</rule>
<rule id="vessant" name="vessant: gerundi">
  <!-- "vessant" before a form of aigua/vi/líquid: keep only the verb readings. -->
  <pattern>
    <marker>
      <token>vessant</token>
    </marker>
    <token regexp="yes" inflected="yes">aigua|vi|líquid</token>
  </pattern>
  <disambig action="filter" postag="V.*"/>
</rule>
<rule id="general_nonom" name="general/fiscal no noms darrere de nom">
  <pattern>
    <!-- example: "de caràcter general" -->
    <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/>
    <unify>
      <feature
id="nombre"/>
      <feature id="genere"/>
      <token postag="N.*" postag_regexp="yes"><exception>múltiples</exception></token>
      <marker>
        <and>
          <token postag="AQ.C.*" postag_regexp="yes"/>
          <token postag="NCC.*" postag_regexp="yes"/>
        </and>
      </marker>
    </unify>
  </pattern>
  <disambig action="filter" postag="[^N].*"/>
</rule>
<rule id="vers" name="vers (preposició)">
  <!-- "vers" before an article or an NP..G.* proper noun: keep only the preposition readings. -->
  <pattern>
    <marker>
      <token>vers</token>
    </marker>
    <token postag="DA.*|NP..G.*" postag_regexp="yes"/>
  </pattern>
  <disambig action="filter" postag="SP.*"/>
</rule>
<rulegroup id="FORCA" name="força: nom, adjectiu, adverbi">
  <rule>
    <!-- Noun reading. Examples: "amb força indestructible", "de força major". -->
    <pattern>
      <token postag="SPS00|DI0FS0" postag_regexp="yes"/>
      <marker>
        <token postag="NCFS000">força</token>
      </marker>
      <token postag="AQ.[FC]S.|V.P..SF." postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="N.*|_GN_.*"/>
  </rule>
  <rule>
    <!-- Adverb reading. Original note: in ambiguous cases preference is given to the adjective,
         e.g. "força comuns". -->
    <pattern>
      <token><exception postag="D[^R].FS." postag_regexp="yes"/><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].*</exception></token>
      <marker>
        <token postag="RG">força</token>
      </marker>
      <token postag="AQ.*|V.P.*|RG" postag_regexp="yes"><exception regexp="yes">que|major|social</exception></token>
    </pattern>
    <disambig action="filter" postag="R.*"/>
  </rule>
  <rule>
    <!-- Determiner reading (DI0CN0) before a noun. -->
    <pattern>
      <token><exception postag="D[^R].FS." postag_regexp="yes"/><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].*</exception></token>
      <marker>
        <token postag="DI0CN0">força</token>
      </marker>
      <token postag="N.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="DI.*"/>
  </rule>
</rulegroup>
<rulegroup id="vora" name="vora (preposició)">
  <!-- Contexts in which "vora" keeps only its SPS00 reading. -->
  <rule>
    <pattern>
      <token><exception postag="D.*|PX.*" postag_regexp="yes"/></token>
      <marker>
        <token>vora</token>
      </marker>
      <token postag="D.*" postag_regexp="yes"><exception>es</exception></token>
      <token><exception postag="V.[MSI].*" postag_regexp="yes"/></token>
    </pattern>
    <disambig action="filter" postag="SPS00"/>
  </rule>
  <rule>
    <!-- masculine plural determiner + "vora" + numeral + masculine/common plural noun -->
    <pattern>
      <token postag="D..MP." postag_regexp="yes"/>
      <marker>
        <token>vora</token>
      </marker>
      <token postag="DN.*" postag_regexp="yes"><exception>es</exception></token>
      <token postag="NC[MC]P000" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="SPS00"/>
  </rule>
  <rule>
    <!-- feminine plural determiner + "vora" + numeral + feminine/common plural noun -->
    <pattern>
      <token postag="D..FP." postag_regexp="yes"/>
      <marker>
        <token>vora</token>
      </marker>
      <token postag="DN.*" postag_regexp="yes"><exception>es</exception></token>
      <token postag="NC[FC]P000" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="SPS00"/>
  </rule>
</rulegroup>
<!--<rule id="en_preposicio" name="en (preposició) + article"> <pattern> <marker> <token>en</token> </marker> <token postag="_GN.*" postag_regexp="yes"></token> </pattern> <disambig action="filter" postag="SPS00"></disambig> </rule> <rule id="en_preposicio2" name="en (preposició) + article"> <pattern> <token>en</token> <marker> <token postag="_GN.*" postag_regexp="yes"></token> </marker> </pattern> <disambig action="filter" postag="D.*"></disambig> </rule> -->
<rule id="en_preposicio3" name="en (preposició) + article">
  <!-- "en" + article + adjective/noun/possessive/numeral: "en" keeps only its SPS00 reading. -->
  <pattern>
    <marker>
      <token>en</token>
    </marker>
    <token postag="DA.*" postag_regexp="yes"/>
    <token postag="(A|N|PX|DN).*" postag_regexp="yes"/>
  </pattern>
  <disambig action="filter" postag="SPS00"/>
</rule>
<rule
id="en_preposicio4" name="en (preposició) + article">
  <!-- Counterpart of en_preposicio3: the article after "en" keeps only its DA.* readings
       (the following token may also be a participle). -->
  <pattern>
    <token>en</token>
    <marker>
      <token postag="DA.*" postag_regexp="yes"/>
    </marker>
    <token postag="(A|N|PX|DN|V.P).*" postag_regexp="yes"/>
  </pattern>
  <disambig action="filter" postag="DA.*"/>
</rule>
<rulegroup id="elimina_alguns_balears" name="elimina verb balear en alguns casos">
  <rule>
    <!-- For a non-Balearic variety this rule is clearly right; for Balearic it could be wrong. -->
    <pattern>
      <token postag_regexp="yes" postag="D.*"/>
      <marker>
        <and>
          <token postag="VMIP1S0B"/>
          <token postag="NC.*" postag_regexp="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="remove" postag="VMIP1S0B"/>
  </rule>
  <rule>
    <!-- For a non-Balearic variety this rule is clearly right; for Balearic it could be wrong. -->
    <pattern>
      <!-- misspelling case: em -> hem -->
      <token>em</token>
      <marker>
        <and>
          <token postag="VMIP1S0B"/>
          <token postag="V.P.*" postag_regexp="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="remove" postag="VMIP1S0B"/>
  </rule>
</rulegroup>
<rule id="en_practica" name="posar en pràctica">
  <!-- posar/tenir + "en" + marxa/pràctica/compte: remove the pronoun readings of "en". -->
  <pattern>
    <token inflected="yes" regexp="yes">posar|tenir</token>
    <marker>
      <token postag="SPS00">en</token>
    </marker>
    <token regexp="yes" inflected="yes">marxa|pràctica|practica|compte</token>
  </pattern>
  <disambig action="remove" postag="P.*"/>
</rule>
<rule id="ES_GRATIS" name="es gratis (excepcions regles següents)">
  <!-- "gratis" after "es": keep only the RG reading (per the rule name, an exception to the rules below). -->
  <pattern>
    <token>es</token>
    <marker>
      <token postag="RG">gratis</token>
    </marker>
  </pattern>
  <disambig action="filter" postag="RG"/>
</rule>
<!-- examples: "en l'obra", "en la causa", "en(s) el porten" -->
<!-- personal pronoun + personal pronoun + verb -->
<rulegroup id="PPdos_VERB" name="dos o més pronoms personals i verb">
  <antipattern>
    <token>en</token>
    <token regexp="yes">la|el|l'|els|les|en</token>
  </antipattern>
  <antipattern>
    <token postag="SPS00"/>
    <!-- error: vos -> vós -->
    <token>vos</token>
  </antipattern>
  <antipattern>
    <token>te</token>
    <token>en</token>
  </antipattern>
  <rule id="dosPP_VERB" name="dos pronoms personals més verb">
    <!-- Two pronouns + finite verb: every token keeps only the readings matched here. -->
    <antipattern>
      <!-- 'els' l': valid pronoun combination -->
      <token regexp="yes">la|el|les|l|ls</token>
      <token regexp="yes">l'|la|el</token>
    </antipattern>
    <antipattern>
      <token>l'</token>
      <token>ho</token>
    </antipattern>
    <antipattern>
      <token regexp="yes">ho|hi|la|lo|el|nos|los</token>
      <token>en</token>
    </antipattern>
    <antipattern>
      <token postag="SPS00|LOC_PREP" postag_regexp="yes"/>
      <token postag="DA.*" postag_regexp="yes"/>
      <token postag="DA.*" postag_regexp="yes"/>
      <token postag="[NA].*|V.P.*" postag_regexp="yes"/>
    </antipattern>
    <pattern>
      <marker>
        <token postag="&pronom_feble;|PP[12]C[SP]000" postag_regexp="yes"><exception regexp="yes">['-].+|nosaltres|vosaltres|tu|mi</exception></token>
        <token postag="&pronom_feble;|PP[12]C[SP]000" postag_regexp="yes"><exception regexp="yes">[-].+|nosaltres|vosaltres|tu|mi</exception></token>
        <token postag="V.[^MNPG].*|_GV_|_perfet|_obligacio" postag_regexp="yes"/>
      </marker>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <rule id="tresPP_VERB" name="tres pronoms personals més verb">
    <!-- Three pronouns + finite verb. -->
    <pattern>
      <marker>
        <token postag="&pronom_feble;|PP[12]C[SP]000" postag_regexp="yes"><exception regexp="yes">['-].+|nosaltres|vosaltres|tu|mi</exception></token>
        <token postag="&pronom_feble;|PP[12]C[SP]000" postag_regexp="yes"><exception regexp="yes">[-].+|nosaltres|vosaltres|tu|mi</exception></token>
        <token postag="&pronom_feble;|PP[12]C[SP]000" postag_regexp="yes"><exception regexp="yes">[-].+|nosaltres|vosaltres|tu|mi</exception></token>
        <token postag="V.[^MNPG].*|_GV_|_perfet|_obligacio" postag_regexp="yes"/>
      </marker>
    </pattern>
    <disambig action="filterall"/>
  </rule>
</rulegroup>
<rule id="ELS_DEU" name="els deu quantitats">
  <!-- "els" + "deu" (numeral and verb readings) + feminine plural noun; the disambig element follows. -->
  <pattern>
    <token>els</token>
    <marker>
      <and>
        <token postag="DN0CP0">deu</token>
        <token postag="V.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token>
      </and>
    </marker>
    <token postag="NCFP.*" postag_regexp="yes"/>
  </pattern>
  <disambig
action="filter" postag="V.*"/> </rule> <rule id="en_conserva" name="en conserva (no verb)"> <pattern> <token>en</token> <marker> <token>conserva</token> </marker> <token><exception postag="D[^R].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="va_noadj" name="va (no adjectiu)"> <pattern> <token postag="&pronom_feble;" postag_regexp="yes"/> <marker> <token postag="V.*" postag_regexp="yes">va</token> </marker> </pattern> <disambig action="filter" postag="V.*|_GV_"/> </rule> <rule id="nova" name="nova, bona (adjectiu)"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="AQ.*" postag_regexp="yes" regexp="yes">nova|noves|bon|bona</token> </marker> <token postag="NC.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="filter" postag="AQ.*"/> <example type="untouched">la cara <marker>era</marker> d'un color gris</example> </rule> <rulegroup id="verbnom_de" name="art+verb_nom+de"> <!-- L'era de... 
No va bé per a verbs que regeixen "de" --> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="DA.*|AQ.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes"/><exception>es</exception><exception scope="previous">s</exception></token> <marker> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="V.[SIN].*" postag_regexp="yes"><exception inflected="yes">prendre</exception></token> </and> </marker> </unify> <token regexp="yes">de|d'</token> </pattern> <disambig action="filter" postag="N.*"/> <example type="untouched">la cara <marker>era</marker> d'un color gris</example> </rule> <rule> <!-- a l'altre punta de carrer --> <pattern> <token inflected="yes">altre</token> <marker> <and> <token postag="V.[SI].*" postag_regexp="yes"><exception inflected="yes">prendre</exception><exception>era</exception></token> <token postag="NC.*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">de|d'</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule id="objecte_de" name="objecte de"> <!-- es pot generalitzar? 
--> <antipattern> <token>què</token> <token>creus</token> </antipattern> <pattern> <marker> <token regexp="yes">objectes?|creus?</token> </marker> <token regexp="yes">de|d'<exception postag=".*LOC_.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> </rulegroup> <rule id="SET" name="set"> <pattern> <token postag="D...P.*" postag_regexp="yes"/> <token postag="A...P.*" postag_regexp="yes" min="0"/> <marker> <token>set</token> </marker> </pattern> <disambig action="remove" postag="NC.S.*"/> </rule> <rulegroup id="ALTRE" name="l'altre determinant/adjectiu/pronom"> <rule> <pattern> <token inflected="yes" regexp="yes">el|un</token> <marker> <token postag="[AP].*" postag_regexp="yes" inflected="yes">altre</token> </marker> </pattern> <disambig action="filter" postag="[AP].*"/> </rule> <rule> <pattern> <marker> <token postag="P.*" postag_regexp="yes" inflected="yes">altre<exception scope="previous" regexp="yes">ningú|algú|cadascú</exception></token> </marker> <token><exception postag="[NA].*|PX.*|V.P.*|DN.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="P.*"/> </rule> <rule> <pattern> <token inflected="yes">el</token> <token inflected="yes">un</token> <token>a</token> <token inflected="yes">el</token> <marker> <token postag="P.*" postag_regexp="yes" inflected="yes">altre</token> </marker> </pattern> <disambig action="filter" postag="P.*"/> </rule> <rule> <pattern> <token>cap</token> <marker> <token postag="D.*" postag_regexp="yes" inflected="yes">altre</token> </marker> <token postag="[NA].*|PX.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="D.*"/> </rule> </rulegroup> <rule id="es_queda" name="es queda (verb)"> <pattern> <token regexp="yes">es|se<exception scope="previous" postag="SPS00"/></token> <marker> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="V.[SI].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="NC.*"/> 
</rule>
  <!-- Sentence-initial "baixa" carrying an adjective reading that fails number/gender
       unification with the following noun (negated unify): the adjective and noun
       readings ([AN].*) of "baixa" are removed. -->
  <rule id="baixa_paquets" name="baixa paquets">
    <pattern>
      <token postag="SENT_START"/>
      <unify negate="yes">
        <feature id="nombre"/>
        <feature id="genere"/>
        <marker>
          <token postag="A.*" postag_regexp="yes">baixa</token>
        </marker>
        <token postag="N.*" postag_regexp="yes"/>
      </unify>
    </pattern>
    <disambig action="remove" postag="[AN].*"/>
  </rule>
  <!-- A form of "causar" (verb reading) followed by a form of "baixa" (noun reading):
       filterall restricts each token to the reading named in the pattern. -->
  <rule id="causar_baixa" name="causar baixes">
    <pattern>
      <token postag="V.*" postag_regexp="yes" inflected="yes">causar</token>
      <token postag="N.*" postag_regexp="yes" inflected="yes">baixa</token>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- Disabled rule (mal as adjective + noun), kept exactly as found. -->
  <!--<rule id="mal_adj_nom" name="mal (adj) + nom"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="A.*" postag_regexp="yes" inflected="yes">mal</token> <token postag="N.*" postag_regexp="yes"><exception inflected="yes">entès</exception></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule>-->
  <!-- Noun "pres" followed by adjective "polític" (any inflection) agreeing in number and
       gender: both tokens are filtered to the readings named in the pattern. -->
  <rule id="pres_politic" name="pres polític">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token postag="NC.*" postag_regexp="yes" inflected="yes">pres</token>
        <token postag="AQ.*" postag_regexp="yes" inflected="yes">polític</token>
      </unify>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- "via" with a preposition reading (SPS00), not preceded by a token tagged D..FS. and
       followed by a common noun: only the preposition reading is kept. -->
  <rule id="via" name="via (preposició)">
    <pattern>
      <token><exception postag="D..FS." postag_regexp="yes"/></token>
      <marker>
        <token postag="SPS00">via</token>
      </marker>
      <token postag="NC.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="SPS00"/>
  </rule>
  <!-- "segons" with a preposition reading, followed by a determiner (other than "es") and
       a token tagged [NA].* or PR.*: only the preposition reading is kept. -->
  <rule id="segons" name="segons (preposició)">
    <pattern>
      <marker>
        <token postag="SPS00">segons</token>
      </marker>
      <token postag="D.*" postag_regexp="yes"><exception>es</exception></token>
      <token postag="[NA].*|PR.*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="SPS00"/>
  </rule>
  <!-- "segons" with a conjunction reading (CS), followed by zero to three tokens matching
       the pronom_feble entity or RN and then a verb tagged V.[SI].*: only CS is kept. -->
  <rule id="segons_CS" name="segons (conjunció)">
    <!-- May be counterproductive when the text contains a noun/verb error. -->
    <pattern>
      <marker>
        <token postag="CS">segons</token>
      </marker>
      <token postag="&pronom_feble;|RN" min="0" max="3" postag_regexp="yes"/>
      <token postag="V.[SI].*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="CS"/>
  </rule>
  <!-- "fons" followed by a token tagged A...P.* or V.P..PM.: the readings of "fons" are
       replaced by the single reading lemma "fons", tag NCMP000. -->
  <rule id="fons" name="fons (singular o plural)">
    <pattern>
      <marker>
        <token>fons</token>
      </marker>
      <token postag="A...P.*|V.P..PM." postag_regexp="yes"/>
    </pattern>
    <disambig action="replace">
      <wd lemma="fons" pos="NCMP000"/>
    </disambig>
  </rule>
  <rulegroup id="DetNom_exceptions" name="excepcions a DetNom">
    <!-- Determiner (not D R...) + a form of principal/diferent/actual with an adjective
         reading + noun: the marked token is filtered to A.* or _GN_.* readings. -->
    <rule>
      <!-- With an adjective-noun agreement error -->
      <pattern>
        <token postag="D[^R].*" postag_regexp="yes"/>
        <marker>
          <token postag="A.*" postag_regexp="yes" regexp="yes" inflected="yes">principal|diferent|actual</token>
        </marker>
        <token postag_regexp="yes" postag="N.*"/>
      </pattern>
      <disambig action="filter" postag="A.*|_GN_.*"/>
    </rule>
    <!-- A form of diplomar/llicenciar/doctorar/estar/ser (without a noun reading) followed
         by "en": "en" is filtered to the preposition reading SPS00. -->
    <rule>
      <pattern>
        <token inflected="yes" regexp="yes">diplomar|llicenciar|doctorar|estar|ser<exception postag="N.*" postag_regexp="yes"/></token>
        <marker>
          <token>en</token>
        </marker>
      </pattern>
      <disambig action="filter" postag="SPS00"/>
    </rule>
  </rulegroup>
  <!-- Groups of adjectives and nouns. -->
  <rulegroup id="grups_adj_n" name="grups d'adjectius i noms">
    <rule>
      <pattern>
        <token postag="NC.P.*" postag_regexp="yes"/>
        <token postag="A...S.*" postag_regexp="yes"/>
        <token postag="CC"/>
        <token postag="A...S.*" postag_regexp="yes"/>
        <token postag="A...P.*" 
postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token postag="NC.P.*" postag_regexp="yes"/> <token postag="A...S.*" postag_regexp="yes"/> <token>,</token> <token postag="A...S.*" postag_regexp="yes"/> <token postag="CC"/> <token postag="A...S.*" postag_regexp="yes"/> <token postag="A...P.*" postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token postag="NC[MC][SN].*|_GN_MS" postag_regexp="yes"/> <token>algun</token> <marker> <token postag="SPS00">sobre</token> </marker> <token postag="[PD].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="SPS00"/> </rule> </rulegroup> <rulegroup id="DDN" name="Det + Det + nom"> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="DA.[^F].*" postag_regexp="yes"/> <marker> <token postag="DI.*" postag_regexp="yes"><exception>cap</exception></token> </marker> <token postag="N.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="filter" postag="DI.*"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="DI.*" postag_regexp="yes" inflected="yes">poc</token> <token postag="N.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D.*" postag_regexp="yes" inflected="yes" regexp="yes">un|el</token> <token postag="DD.*" postag_regexp="yes" inflected="yes">tal</token> <token postag="N.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D..MS." 
postag_regexp="yes" inflected="yes" regexp="yes">un|el</token> <token postag="D.*" postag_regexp="yes" inflected="yes" regexp="yes">tal|poc</token> <token postag="N.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D..FS." postag_regexp="yes" inflected="yes" regexp="yes">un|el</token> <token postag="D.*" postag_regexp="yes" inflected="yes" regexp="yes">tal|poc</token> <token postag="N.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D..MP." postag_regexp="yes" inflected="yes" regexp="yes">un|el</token> <token postag="D.*" postag_regexp="yes" inflected="yes" regexp="yes">tal|poc</token> <token postag="N.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D..FP." 
postag_regexp="yes" inflected="yes" regexp="yes">un|el</token>
          <token postag="D.*" postag_regexp="yes" inflected="yes" regexp="yes">tal|poc</token>
          <token postag="N.*" postag_regexp="yes"/>
        </unify>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_FP"/>
        <wd pos="_GN_FP"/>
        <wd pos="_GN_FP"/>
      </disambig>
    </rule>
  </rulegroup>
  <rulegroup id="DetDet" name="det + det: una certa">
    <!-- A form of "un" (determiner, not D R...) followed by a form of "cert" tagged DI.*,
         agreeing in number and gender: both tokens are filtered to those readings. -->
    <rule>
      <pattern>
        <unify>
          <feature id="nombre"/>
          <feature id="genere"/>
          <marker>
            <token postag="D[^R].*" postag_regexp="yes" inflected="yes">un</token>
            <token postag="DI.*" postag_regexp="yes" inflected="yes">cert</token>
          </marker>
        </unify>
      </pattern>
      <disambig action="filterall"/>
    </rule>
    <!-- A DI.* determiner followed by a form of "altre" tagged DI.* and then a token tagged
         [NA].* or V.P.*, all agreeing: the two marked determiners are filtered. -->
    <rule>
      <pattern>
        <unify>
          <feature id="nombre"/>
          <feature id="genere"/>
          <marker>
            <token postag="DI.*" postag_regexp="yes"/>
            <token postag="DI.*" postag_regexp="yes" inflected="yes">altre</token>
          </marker>
          <token postag="[NA].*|V.P.*" postag_regexp="yes"/>
        </unify>
      </pattern>
      <disambig action="filterall"/>
    </rule>
  </rulegroup>
  <!-- Determiner + adjective/participle + noun + adjective/participle, all agreeing in
       number and gender. The two rules differ only in the first token: any determiner
       except D R... in the first, a DN.* numeral in the second. -->
  <rulegroup id="DANA" name="det + adj + nom + adj">
    <rule>
      <pattern>
        <unify>
          <feature id="nombre"/>
          <feature id="genere"/>
          <marker>
            <token postag="D[^R].*" postag_regexp="yes"/>
            <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="D[NI].*" postag_regexp="yes"/></token>
            <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">era|fou</exception></token>
            <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token>
          </marker>
        </unify>
      </pattern>
      <disambig action="filterall"/>
    </rule>
    <rule>
      <pattern>
        <unify>
          <feature id="nombre"/>
          <feature id="genere"/>
          <marker>
            <token postag="DN.*" postag_regexp="yes"/>
            <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token>
            <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">era|fou</exception></token>
            <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token>
          </marker>
        </unify>
      </pattern>
      <disambig action="filterall"/>
    </rule>
  </rulegroup>
  <!-- Example: "La característica mitja canya". Problematic case: "la part superior esquerra" -->
  <!-- Determiner (not itself preceded by a determiner) + two adjective/participle tokens
       (the first may also be a DN.* numeral) + noun, all agreeing in number and gender. -->
  <rule id="DAAN" name="det + adj + adj + nom">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <marker>
          <token postag="D[^R].*" postag_regexp="yes"><exception scope="previous" postag="D.*" postag_regexp="yes"/></token>
          <token postag="A.*|V.P.*|DN.*" postag_regexp="yes"><exception postag="AQ0CN0"/></token>
          <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="AQ0CN0"/></token>
          <token postag="N.*" postag_regexp="yes"><exception postag="DN.*|V.G.*" postag_regexp="yes"/><exception regexp="yes">si|passa|dins|era|quina|però|fou</exception></token>
        </marker>
      </unify>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- Determiner + possessive (PX.*) + two adjective/participle tokens + noun, all
       agreeing; the marked tokens are disambiguated with the unify action. -->
  <rule id="DPAAN" name="det + poss + adj + adj + nom">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <marker>
          <token postag="D[^R].*" postag_regexp="yes"/>
          <token postag="PX.*" postag_regexp="yes"/>
          <token postag="A.*|V.P.*|DN.*" postag_regexp="yes"/>
          <token postag="A.*|V.P.*" postag_regexp="yes"/>
          <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">fou|era|mira|queda|cap|però</exception></token>
        </marker>
      </unify>
    </pattern>
    <disambig action="unify"/>
  </rule>
  <!-- Determiner + adjective/participle + numeral (DN.*) + adjective/participle + noun,
       all agreeing in number and gender. -->
  <rule id="DANumAN" name="det + adj + numeral + adj + nom">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <marker>
          <token postag="D[^R].*" postag_regexp="yes"/>
          <token postag="A.*|V.P.*" postag_regexp="yes"/>
          <token postag="DN.*" postag_regexp="yes"/>
          <token postag="A.*|V.P.*" postag_regexp="yes"/>
          <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token>
        </marker>
      </unify>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <rule id="DANumN" name="det + adj + numeral + nom">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature 
id="genere"/> <marker> <token postag="D[^R].*" postag_regexp="yes"/> <token postag="A.*|V.P.*" postag_regexp="yes"/> <token postag="DN.*" postag_regexp="yes"/> <token postag="N.*|V.P.*|A.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="DPAN" name="Det + Possessiu + Adj + Nom"> <!-- La seva mala intenció --> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].*" postag_regexp="yes"/> <token postag="PX.*" postag_regexp="yes"/> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="AQ0CN0"/></token> <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">era|mira|queda|cap</exception></token> </marker> </unify> </pattern> <disambig action="unify"/> </rule> <rule> <pattern> <marker> <token postag="D[^R].[MC][SN].*" postag_regexp="yes"/> <token postag="PX.[MC][SN].*" postag_regexp="yes"/> <token postag="A..[MC][SN].*|V.P.*SM.?" postag_regexp="yes"><exception postag="AQ0CN0"/></token> <token postag="N.[MC][SN].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[FC][SN].*" postag_regexp="yes"/> <token postag="PX.[FC][SN].*" postag_regexp="yes"/> <token postag="A..[FC][SN].*|V.P.*SF.?" 
postag_regexp="yes"><exception postag="AQ0CN0"/></token> <token postag="N.[FC][SN].*" postag_regexp="yes"><exception regexp="yes">era|mira|queda|cap</exception><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[MC][PN].*" postag_regexp="yes"/> <token postag="PX.[MC][PN].*" postag_regexp="yes"/> <token postag="A..[MC][PN].*|V.P.*PM.?" postag_regexp="yes"><exception postag="AQ0CN0"/></token> <token postag="N.[MC][PN].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[FC][PN].*" postag_regexp="yes"/> <token postag="PX.[FC][PN].*" postag_regexp="yes"/> <token postag="A..[FC][PN].*|V.P.*PF.?" 
postag_regexp="yes"><exception postag="AQ0CN0"/></token> <token postag="N.[FC][PN].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rule id="DPAA" name="det + poss + adj + adj"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].*" postag_regexp="yes"/> <token postag="PX.*" postag_regexp="yes"/> <token postag="A.*|V.P.*|DN.*" postag_regexp="yes"/> <token postag="A.*|V.P.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="unify"/> </rule> <rulegroup id="DNumN" name="Det + Numeral + Nom/Adj"> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[AIDE].*" postag_regexp="yes"/> <token postag="DN0.P0" postag_regexp="yes"/> <token postag="A.*|V.P.*|N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule> <!--<rule> <pattern> <token postag="D[AID].[MC][PN0].*" postag_regexp="yes"></token> <marker> <token postag="DN0CP0" /> </marker> <token postag="A..[MC][PN0].*|V.P..PM.?|N.[MC][PN0].*" postag_regexp="yes"></token> </pattern> <disambig action="filter" postag="DN0MP0"></disambig> </rule> <rule> <pattern> <token postag="D[AID].[FC][PN0].*" postag_regexp="yes"></token> <marker> <token postag="DN0CP0" /> </marker> <token postag="A..[FC][PN0].*|V.P..PF.?|N.[FC][PN0].*" postag_regexp="yes"></token> </pattern> <disambig action="filter" postag="DN0FP0"></disambig> </rule>--> <rule> <pattern> <marker> <token postag="D[AID].[MC][PN0].*" postag_regexp="yes"/> <token postag="DN0[CM]P0" postag_regexp="yes"/> <token postag="A..[MC][PN0].*|V.P..PM.?|N.[MC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd 
pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[AID].[FC][PN0].*" postag_regexp="yes"/> <token postag="DN0[CF]P0" postag_regexp="yes"/> <token postag="A..[FC][PN0].*|V.P..PF.?|N.[FC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rule id="DeDiN" name="Determinant exclamatiu + indeterminat + nom: quin poc seny"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[ET].*|PT.*" postag_regexp="yes"/> <token postag="DI.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="DNA" name="Det + Nom + Adj/Possessiu/participi"> <!--Falla amb nom neutre?: Aquest art expressa --> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception inflected="yes">meu</exception><exception postag="DN.*" postag_regexp="yes"/><exception inflected="yes" regexp="yes">poc|major</exception></token> <!-- --> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"><exception regexp="yes">som|presta|tens|comprés|després|muntà|va|segons|afecta|viu</exception></token> <!--<exception postag="V[MA]IP3S0" postag_regexp="yes"/>--> </marker> </unify> </pattern> <disambig action="unify"/> <example type="untouched">Són <marker>les dos alternatives</marker> bàsiques.</example> </rule> <!-- <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].*" postag_regexp="yes"></token> <token postag="N.*" postag_regexp="yes">deu</token> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="unify"/> </rule> --> <rule> <pattern> <marker> <token postag="D[^R].[MC][SN0].*" 
postag_regexp="yes"/> <token postag="N.[MC][SN0].*" postag_regexp="yes"/> <token postag="A..[MC][SN0].*|V.P..SM.?|PX.[MC][SN0].*" postag_regexp="yes"><exception postag="V[MA]IP3S0.?" postag_regexp="yes"/><exception regexp="yes">som|tens|comprés|muntà|va</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[FC][SN0].*" postag_regexp="yes"/> <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="A..[FC][SN0].*|V.P..SF.?|PX.[FC][SN0].*" postag_regexp="yes"><exception>afecta</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[MC][PN0].*" postag_regexp="yes"/> <token postag="N.[MC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception inflected="yes">meu</exception></token> <token postag="A..[MC][PN0].*|V.P..PM.?|PX.[MC][PN0].*" postag_regexp="yes"><exception>segons</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[FC][PN0].*" postag_regexp="yes"/> <token postag="N.[FC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="A..[FC][PN0].*|V.P..PF.?|PX.[FC][PN0].*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rulegroup id="DAN" name="Det + Adj + Nom"> <rule> <!-- fa la mateixa passa (sense excepcions) --> <pattern> <token postag="V.[SI].*" postag_regexp="yes"/> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].[MF].." 
postag_regexp="yes"/> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception postag="DN.*|CC" postag_regexp="yes"/></token> </marker> </unify> </pattern> <disambig action="unify"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].[MF].." postag_regexp="yes"/> <!--afegit: altres, bastants, qualssevol, qualssevulla--> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception regexp="yes">tants|recull|passi|quina|sabeu|surt|ara|fou|perquè|trenca|era|diu|si|però|escull|creix|dura|parla|mira|queda|estima|passa|escolta|troba|tots?|som</exception><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </unify> </pattern> <disambig action="unify"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].C.." postag_regexp="yes"/> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception regexp="yes">quina|sabeu|fan|ara|fou|perquè|diu|si|però|era|tots?|som</exception><exception postag="DN.*|V[MA]IP3S0.?" 
postag_regexp="yes"/></token>
          </marker>
        </unify>
      </pattern>
      <disambig action="unify"/>
    </rule>
    <!-- The four rules below add a chunk tag (_GN_MS, _GN_FS, _GN_MP, _GN_FP) to each of
         the three tokens of a determiner + adjective/participle/possessive + noun sequence
         whose tags are all compatible with that gender and number. -->
    <rule>
      <pattern>
        <marker>
          <token postag="D[^R].[MC][SN0].*" postag_regexp="yes"/>
          <token postag="A..[MC][SN0].*|V.P..SM.?|PX.[MC][SN0].*" postag_regexp="yes"/>
          <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception regexp="yes">recull|passi|sabeu|fan|surt|perquè|diu|si|però|escull|creix|escolta|troba|tot|som</exception></token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_MS"/>
        <wd pos="_GN_MS"/>
        <wd pos="_GN_MS"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token postag="D[^R].[FC][SN0].*" postag_regexp="yes"/>
          <token postag="A..[FC][SN0].*|V.P..SF.?|PX.[FC][SN0].*" postag_regexp="yes"/>
          <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception regexp="yes">ara|quina|fan|era|mira|queda|estima|passa|escolta|troba|fou</exception></token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_FS"/>
        <wd pos="_GN_FS"/>
        <wd pos="_GN_FS"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token postag="D[^R].[MC][PN0].*" postag_regexp="yes"/>
          <token postag="A..[MC][PN0].*|V.P..PM.?|PX.[MC][PN0].*" postag_regexp="yes"/>
          <token postag="N.[MC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">tots|tants</exception></token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_MP"/>
        <wd pos="_GN_MP"/>
        <wd pos="_GN_MP"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token postag="D[^R].[FC][PN0].*" postag_regexp="yes"/>
          <token postag="A..[FC][PN0].*|V.P..PF.?|PX.[FC][PN0].*" postag_regexp="yes"/>
          <token postag="N.[FC][PN0].*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_FP"/>
        <wd pos="_GN_FP"/>
        <wd pos="_GN_FP"/>
      </disambig>
    </rule>
  </rulegroup>
  <!-- Adjective/participle + noun + two adjective/participle tokens, all agreeing in
       number and gender. The first token must not carry an A.0CN0, _GV_ or DN.* reading;
       the noun must not carry a V.[MIS].* or DN.* reading. -->
  <rule id="ANAA" name="Adj + Nom + Adj + Adj">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <marker>
          <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="A.0CN0|_GV_" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token>
          <token postag="N.*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token>
          <token postag="A.*|V.P.*" postag_regexp="yes"/>
          <token postag="A.*|V.P.*" postag_regexp="yes"/>
        </marker>
      </unify>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <!-- Adjective/participle + noun + adjective/participle. The first rule filters the
       agreeing sequence; the following rules add the matching _GN_ chunk tag to each of
       the three tokens, one rule per gender/number combination. -->
  <rulegroup id="ANA" name="Adj + Nom + Adj">
    <rule>
      <pattern>
        <unify>
          <feature id="nombre"/>
          <feature id="genere"/>
          <marker>
            <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="A.0CN0|_GV_" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/><exception>tens</exception></token>
            <token postag="N.*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token>
            <token postag="A.*|V.P.*" postag_regexp="yes"/>
          </marker>
        </unify>
      </pattern>
      <disambig action="filterall"/>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token postag="A..[MC][SN0].*|V.P..SM.?" postag_regexp="yes"><exception postag="A.0CN0|_GV_" postag_regexp="yes"/><exception>tens</exception></token>
          <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token>
          <token postag="A..[MC][SN0].*|V.P..SM.?" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_MS"/>
        <wd pos="_GN_MS"/>
        <wd pos="_GN_MS"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token postag="A..[FC][SN0].*|V.P..SF.?" postag_regexp="yes"><exception postag="A.0CN0|_GV_" postag_regexp="yes"/></token>
          <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token>
          <token postag="A..[FC][SN0].*|V.P..SF.?" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_FS"/>
        <wd pos="_GN_FS"/>
        <wd pos="_GN_FS"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token postag="A..[MC][PN0].*|V.P..PM.?" 
postag_regexp="yes"><exception postag="A.0CN0|_GV_" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="N.[MC][PN0].*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="A..[MC][PN0].*|V.P..PM.?" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="A..[FC][PN0].*|V.P..PF.?" postag_regexp="yes"><exception postag="A.0CN0|_GV_" postag_regexp="yes"/></token> <token postag="N.[FC][PN0].*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes"/><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="A..[FC][PN0].*|V.P..PF.?" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rule id="Nom_3Adj" name="nom + tres adj abans de concordar"> <pattern> <token postag="N.*" postag_regexp="yes"/> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*|AQ.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/><exception regexp="yes">som|mal</exception></token> </and> </marker> <token postag="V.P.*|AQ.*" postag_regexp="yes"/> <token postag="V.P.*|AQ.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.P.*|AQ.*"/> </rule> <rulegroup id="NAA" name="Nom + Adj + Adj"> <antipattern> <token>va</token> <token postag="VMIS3S00"/> </antipattern> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">queda|troba|ret|torna|posa|veu|seus?</exception></token> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="AO0CN0"/><exception>seré</exception></token> <token postag="A.*|V.P.*" 
postag_regexp="yes"><exception regexp="yes">fer|som</exception></token> </marker> </unify> </pattern> <disambig action="filterall"/> <example type="untouched">si es pren vi acompanyat</example> </rule> <rule> <pattern> <token><exception postag="D..F..|D...P." postag_regexp="yes"/></token> <marker> <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception>ret</exception></token> <token postag="A..[MC][SN0].*|V.P..SM.?" postag_regexp="yes"><exception>seré</exception></token> <token postag="A..[MC][SN0].*|V.P..SM.?" postag_regexp="yes"><exception>fer</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <token><exception postag="D..M..|D...P." postag_regexp="yes"/></token> <marker> <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">seu|troba|torna|posa|veu</exception></token> <token postag="A..[FC][SN0].*|V.P..SF.?" postag_regexp="yes"/> <token postag="A..[FC][SN0].*|V.P..SF.?" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="N.[MC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="A..[MC][PN0].*|V.P..PM.?" postag_regexp="yes"/> <token postag="A..[MC][PN0].*|V.P..PM.?" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="N.[FC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="A..[FC][PN0].*|V.P..PF.?" postag_regexp="yes"/> <token postag="A..[FC][PN0].*|V.P..PF.?" 
postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rule id="DAA" name="det + adj + adj"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D[^R].*" postag_regexp="yes"/> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="D.*|V.[^P].*" postag_regexp="yes"/></token> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="V.[^P].*" postag_regexp="yes"/></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="part" name="part nom masculí o femení"> <rule> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">valor|vall|part|corrent|capital|ordre<exception postag="_GN_MS"/></token> <token postag="_GN_FS"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="NCMS000"/> </disambig> </rule> <rule> <pattern> <marker> <and> <token postag="A.*" postag_regexp="yes" regexp="yes">part|corrent<exception postag="_GN_MS"/></token> <token postag="_GN_FS"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="AQ0MS0"/> </disambig> </rule> <rule> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">valor|vall|part|corrent|capital|ordre<exception postag="_GN_FS"/></token> <token postag="_GN_MS"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="NCFS000"/> </disambig> </rule> <rule> <pattern> <marker> <and> <token postag="AQ0CS0">corrent<exception postag="_GN_FS"/></token> <token postag="_GN_MS"/> </and> </marker> </pattern> <disambig action="add"> <wd pos="AQ0MS0"/> </disambig> </rule> <rule> <pattern> <marker> <and> <token postag="AQ0CS0">corrent<exception postag="_GN_FS"/></token> <token postag="_GN_MS"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="AQ0CS0"/> </disambig> </rule> <rule> <!-- actes, alumnes --> <pattern> <marker> <and> <token postag="NCFP000"><exception 
postag="_GN_FP"/></token>
            <token postag="NCMP000"/>
            <token postag="_GN_MP"/>
          </and>
        </marker>
      </pattern>
      <disambig action="remove">
        <wd pos="NCFP000"/>
      </disambig>
    </rule>
    <rule>
      <!-- Token with both NCMP000 and NCFP000 readings that carries _GN_FP and has no _GN_MP reading: remove the NCMP000 reading. -->
      <pattern>
        <marker>
          <and>
            <token postag="NCMP000"><exception postag="_GN_MP"/></token>
            <token postag="NCFP000"/>
            <token postag="_GN_FP"/>
          </and>
        </marker>
      </pattern>
      <disambig action="remove">
        <wd pos="NCMP000"/>
      </disambig>
    </rule>
    <rule>
      <!-- e.g. "soprano": token with NCFS000 and NC[MC]S000 readings that carries _GN_MS and has no _GN_FS reading; remove the NCFS000 reading. -->
      <pattern>
        <marker>
          <and>
            <token postag="NCFS000"><exception postag="_GN_FS"/></token>
            <token postag="NC[MC]S000" postag_regexp="yes"/>
            <token postag="_GN_MS"/>
          </and>
        </marker>
      </pattern>
      <disambig action="remove">
        <wd pos="NCFS000"/>
      </disambig>
    </rule>
    <rule>
      <!-- Converse case: token with NCMS000 and NC[FC]S000 readings that carries _GN_FS and has no _GN_MS reading; remove the NCMS000 reading. -->
      <pattern>
        <marker>
          <and>
            <token postag="NCMS000"><exception postag="_GN_MS"/></token>
            <token postag="NC[FC]S000" postag_regexp="yes"/>
            <token postag="_GN_FS"/>
          </and>
        </marker>
      </pattern>
      <disambig action="remove">
        <wd pos="NCMS000"/>
      </disambig>
    </rule>
  </rulegroup>
  <rule id="article_adj_nom" name="article + adj neutre + nom/adj">
    <!-- e.g. "els principals implicades". Neutral adjectives with errors.
         Determiner + token readable as noun and as AQ.C adjective + noun, unified on number:
         the marked token keeps only its AQ readings. -->
    <pattern>
      <unify>
        <feature id="nombre"/>
        <token postag="D.*" postag_regexp="yes"/>
        <marker>
          <and>
            <token postag="N.*" postag_regexp="yes"><exception postag="V.[MSI].*" postag_regexp="yes"/></token>
            <token postag="AQ.C.*" postag_regexp="yes"><exception regexp="yes">corrent|pendent|comensal|activista</exception></token>
          </and>
        </marker>
        <token postag="N.*" postag_regexp="yes"><exception postag="V.[MSI].*|AQ.*|V.P.*|PX.*" postag_regexp="yes"/><exception regexp="yes">\p{Lu}.+</exception></token>
      </unify>
    </pattern>
    <disambig action="filter" postag="AQ.*"/>
  </rule>
  <!-- e.g. "el titular deixa", "el lateral mostra", "el central porta":
       after a D[AD] determiner and a noun / AQ.CS adjective token unified on number,
       a token readable as common noun and as conjugated verb keeps only its verb readings. -->
  <rule id="article_nom_verb" name="article + nom (adj neutre) + verb">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <token postag="D[AD].*" postag_regexp="yes"/>
        <and>
          <token postag="N.*" postag_regexp="yes"><exception postag="V.[MSI].*" postag_regexp="yes"/></token>
          <token postag="AQ.CS.*" postag_regexp="yes"/>
        </and>
      </unify>
      <marker>
        <and>
          <token postag="NC.*" postag_regexp="yes"><exception>dubte</exception></token>
          <token postag="V.[MSI].*" postag_regexp="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="V.*"/>
  </rule>
  <!-- Disabled rule:
  <rule id="article_nom_adj" name="article + nom (adj neutre) + adjectiu">
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token postag="D.*" postag_regexp="yes"></token>
        <marker>
          <and>
            <token postag="N.*" postag_regexp="yes"><exception postag="V.[MSI].*" postag_regexp="yes"/></token>
            <token postag="AQ.CS.*" postag_regexp="yes"></token>
          </and>
        </marker>
      </unify>
      <token postag="AQ.*|V.P.*" postag_regexp="yes"></token>
    </pattern>
    <disambig action="filter" postag="N.*"></disambig>
  </rule>
  -->
  <rulegroup id="que_causa" name="no nom darrere de relatiu. Ex: que causa, que pensa">
    <rule>
      <!-- PR or CS token (except "com", "segons") + token readable as noun and as VM verb: keep only the verb readings. -->
      <pattern>
        <token postag="PR.*|CS" postag_regexp="yes"><exception regexp="yes">com|segons</exception></token>
        <marker>
          <and>
            <token postag="N.*" postag_regexp="yes"><exception regexp="yes">nous?|reis|deu|temes</exception><exception regexp="yes">\p{Lu}.*</exception></token>
            <token postag="VM.*" postag_regexp="yes"><exception postag="VMIP1S0.?" postag_regexp="yes"/></token>
          </and>
        </marker>
      </pattern>
      <disambig action="filter" postag="V.*"/>
    </rule>
    <rule>
      <!-- Same idea with "no" between the PR token (except "com") and the noun/verb token. -->
      <pattern>
        <token postag="PR.*" postag_regexp="yes"><exception>com</exception></token>
        <token>no</token>
        <marker>
          <and>
            <token postag="N.*" postag_regexp="yes"><exception regexp="yes">nous?</exception></token>
            <token postag="VM.*" postag_regexp="yes"><exception postag="VMIP1S0.?" postag_regexp="yes"/></token>
          </and>
        </marker>
      </pattern>
      <disambig action="filter" postag="V.*"/>
    </rule>
  </rulegroup>
  <rulegroup id="NUMERALS_ENCADENATS" name="numerals encadenats">
    <rule>
      <pattern>
        <token postag="DN.[FC][PN]." postag_regexp="yes"/>
        <marker>
          <token postag="DN.[FC][PN]." postag_regexp="yes"/>
          <token postag="N.F[PN0].*|A..F[PN0].*" postag_regexp="yes"><exception postag="NCCN000|DN.*" postag_regexp="yes"/></token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_FP"/>
        <wd pos="_GN_FP"/>
      </disambig>
      <!-- e.g. "tres-centes cinquanta mil organitzacions", "nou mil organitzacions" -->
    </rule>
    <rule>
      <!-- Masculine counterpart: the second numeral and the following masculine noun/adjective both receive _GN_MP. -->
      <pattern>
        <token postag="DN.[MC][PN]." postag_regexp="yes"/>
        <marker>
          <token postag="DN.[MC][PN]." postag_regexp="yes"/>
          <token postag="N.M[PN0].*|A..M[PN0].*" postag_regexp="yes"><exception postag="NCCN000|DN.*" postag_regexp="yes"/></token>
        </marker>
      </pattern>
      <disambig action="add">
        <wd pos="_GN_MP"/>
        <wd pos="_GN_MP"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token postag="DN.[FC][PN]." postag_regexp="yes"/>
        </marker>
        <token regexp="yes">i|ni|o|,</token>
        <token postag="DN.[FC][PN]."
postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="DN.*"/>
    </rule>
    <rule>
      <!-- Masculine/common numeral, then "i", "ni", "o" or a comma, then another such numeral: the first keeps only its DN readings. -->
      <pattern>
        <marker>
          <token postag="DN.[MC][PN]." postag_regexp="yes"/>
        </marker>
        <token regexp="yes">i|ni|o|,</token>
        <token postag="DN.[MC][PN]." postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="DN.*"/>
    </rule>
  </rulegroup>
  <rule id="AIXO_ADJ" name="això + adjectiu">
    <!-- After a PD0NS000 token, the next token (skipped if it has a V.[IMS] or SPS00 reading) keeps only its A, V.P, PX or RG readings. -->
    <pattern>
      <token postag="PD0NS000"/>
      <marker>
        <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="V.[IMS].*|SPS00" postag_regexp="yes"/></token>
      </marker>
    </pattern>
    <disambig action="filter" postag="A.*|V.P.*|PX.*|RG.*"/>
  </rule>
  <rule id="tot_son" name="tot son (són)">
    <!-- An inflected form of "tot" with a PI reading, directly before "son", keeps only its PI readings. -->
    <pattern>
      <marker>
        <token postag="PI.*" postag_regexp="yes" inflected="yes">tot</token>
      </marker>
      <token>son</token>
    </pattern>
    <disambig action="filter" postag="PI.*"/>
  </rule>
  <rule id="DET_POSS_NOM0" name="excepció a la regla següent">
    <!-- Exception to the rule that follows: DA determiner + "seu" with a noun reading + optional RG + adjective,
         unified on number and gender; the PX readings of "seu" are removed. -->
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <token postag="DA.*" postag_regexp="yes"/>
        <marker>
          <token postag="N.*" postag_regexp="yes">seu</token>
        </marker>
        <token min="0" postag="RG"/>
        <token postag="A.*" postag_regexp="yes"/>
      </unify>
    </pattern>
    <disambig action="remove" postag="PX.*"/>
  </rule>
  <rule id="DET_POSS_NOM" name="Det + possessiu + Nom/adj">
    <!-- DA determiner + PX token + optional RG + adjective or noun: the marked token keeps only its PX readings. -->
    <pattern>
      <token postag="DA.*" postag_regexp="yes"/>
      <marker>
        <token postag="PX.*" postag_regexp="yes"/>
      </marker>
      <token min="0" postag="RG"/>
      <token postag="[AN].*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="PX.*"/>
    <example type="untouched">I la seu també ha sigut expropiada.</example>
    <example type="untouched">perquè fos la seu sempre fixa dels déus</example>
  </rule>
  <rulegroup id="que" name="que (no adv)">
    <rule>
      <!-- "que" with an RG reading and at least one non-RG reading, followed by a token without A or V.P readings: remove the RG readings. -->
      <pattern>
        <marker>
          <and>
            <token postag="RG.*" postag_regexp="yes">que</token>
            <token postag="RG.*" postag_regexp="yes" negate_pos="yes"/>
          </and>
        </marker>
        <token><exception postag="A.*|V.P.*" postag_regexp="yes"/></token>
      </pattern>
      <disambig action="remove" postag="RG.*"/>
    </rule>
    <rule>
      <!-- Same removal when "que" follows a DA determiner; here the extra reading must be neither RG nor SENT_END/PARA_END. -->
      <pattern>
        <token postag="DA.*" postag_regexp="yes"/>
        <marker>
          <and>
            <token postag="RG.*" postag_regexp="yes">que</token>
            <token postag="RG.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/>
          </and>
        </marker>
      </pattern>
      <disambig action="remove" postag="RG.*"/>
    </rule>
  </rulegroup>
  <rule id="aviat" name="aviat adverbi">
    <!-- "aviat" with an RG reading and no _GV_ reading keeps only its R readings. -->
    <pattern>
      <!-- Disabled context token: <token regexp="yes">ben|més|tan|massa</token> -->
      <marker>
        <token postag="RG">aviat<exception postag="_GV_"/></token>
      </marker>
    </pattern>
    <disambig action="filter" postag="R.*"/>
  </rule>
  <rule id="desperta_adj" name="desperta (adj)">
    <!-- V.[ISPN] verb + one to three RG/LOC_ADV tokens + "desperta" with an AQ0FS0 reading: remove its verb readings. -->
    <pattern>
      <token postag="V.[ISPN].*" postag_regexp="yes"/>
      <token min="1" max="3" postag_regexp="yes" postag="RG|LOC_ADV"/>
      <marker>
        <token postag="AQ0FS0">desperta</token>
      </marker>
    </pattern>
    <disambig action="remove" postag="V.*"/>
  </rule>
  <rule id="amic_nom0" name="amic nom davant d'adjectiu">
    <!-- Inflected form of "amic" with a noun reading + adjective, possessive or participle, unified on number and gender. -->
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="genere"/>
        <marker>
          <token postag="N.*" postag_regexp="yes" inflected="yes">amic</token>
          <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/>
        </marker>
      </unify>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <rule id="prep_mesmenys_nom" name="preposició + més/menys + nom">
    <!-- Preposition + "més"/"menys" + token readable as N..P noun and as adjective/participle: keep the noun and _GN_ readings.
         The antipattern covers an adjective/participle followed by an N..P noun. -->
    <antipattern>
      <token postag="A.*|V.P.*" postag_regexp="yes"/>
      <token postag="N..P.*" postag_regexp="yes"/>
    </antipattern>
    <pattern>
      <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/>
      <token regexp="yes">més|menys</token>
      <marker>
        <and>
          <token postag="N..P.*" postag_regexp="yes"/>
          <token postag="A.*|V.P.*" postag_regexp="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="N.*|_GN_.*"/>
  </rule>
  <rule id="gaire_no_adv" name="gaire no adverbi">
    <!-- "gaire" with RG and DI.CS readings before a singular or invariable noun: keep the readings whose tag does not start with R. -->
    <pattern>
      <marker>
        <and>
          <token postag="RG.*" postag_regexp="yes">gaire</token>
          <token postag="DI.CS.*" postag_regexp="yes"/>
        </and>
      </marker>
      <token postag="N.[FMC][SN].*" postag_regexp="yes"><exception postag="AQ.[FMC][SN].|V.N.*" postag_regexp="yes"/><exception
regexp="yes">fons|si</exception></token>
    </pattern>
    <disambig action="filter" postag="[^R].*"/>
  </rule>
  <rulegroup id="nom_adv_adj" name="nom + adverbi + adjectiu que concorden">
    <!-- Noun + adverb + adjective that agree in gender and number. The group-level antipattern covers the sequence "tens que". -->
    <antipattern>
      <token>tens</token>
      <token>que</token>
    </antipattern>
    <rule id="aa2" name="aa1: Era la feina més dura ">
      <!-- NC / _GN_ / DA token (without CC or RG readings) + RG_anteposat + adjective, participle or possessive:
           the marked last token keeps only its AQ, V.P, PX and _GN_ readings. -->
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <token postag="NC.*|_GN_.*|DA.*" postag_regexp="yes"><exception postag="CC|RG" postag_regexp="yes"/></token>
          <token postag="RG_anteposat"/>
          <marker>
            <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"/>
          </marker>
        </unify>
      </pattern>
      <disambig action="filter" postag="AQ.*|V.P.*|PX.*|_GN_.*"/>
    </rule>
    <rule id="aa2b" name="aa1: Era un home força misteriós">
      <!-- Same three-token context (first token NC or _GN_, without a CC reading); here the middle RG_anteposat token is marked and keeps only its RG readings. -->
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <token postag="NC.*|_GN_.*" postag_regexp="yes"><exception postag="CC"/></token>
          <marker>
            <token postag="RG_anteposat"/>
          </marker>
          <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"/>
        </unify>
      </pattern>
      <disambig action="filter" postag="RG.*"/>
    </rule>
  </rulegroup>
  <!-- Adverbs followed by an adjective or participle.
REVISAR: tant català, tant catalana --> <rulegroup id="adv_adj" name="adverbi + adjectiu"> <rule id="quelcom" name="quelcom"> <pattern> <token postag="PI0CS000">quelcom</token> <token postag="AQ0[MC]S0" postag_regexp="yes"/> </pattern> <disambig action="filterall"/> </rule> <rule id="aa1" name="aa1"> <!-- excep: més aviat complexes --> <pattern> <token>més</token> <marker> <token>aviat</token> </marker> <token postag="AQ.*|NC.*|SPS.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule id="molt_fi" name="molt fi"> <pattern> <marker> <token postag="RG.*" postag_regexp="yes" regexp="yes">molt|poc|tan|força|massa|tot</token> <token postag="AQ.*" postag_regexp="yes">fi</token> </marker> </pattern> <disambig action="filterall"/> </rule> <rule id="aa3" name="aa1"> <pattern> <marker> <token postag="RG_anteposat"><exception regexp="yes">molt|poc|tant|tan|força|massa|tot|també|quelcom</exception><exception postag="N.*" postag_regexp="yes"/></token> </marker> <token postag="AQ.*|V.P.*" postag_regexp="yes"><exception postag="V.[NMIS].*|_GV_" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="R.*"/> </rule> <rule id="aa4" name="aa1"> <pattern> <token postag="RG_anteposat|.*LOC_ADV.*" postag_regexp="yes"><exception regexp="yes">molt|poc|tant|tan|força|massa|tot|més|també</exception></token> <marker> <token postag="AQ.*|V.P.*" postag_regexp="yes"><exception postag="V.[NMIS].*|_GV_|RG" postag_regexp="yes"/><exception inflected="yes" regexp="yes">estat|part</exception><exception>nou</exception></token> <!--|N.*<exception regexp="yes">parts?</exception>--> <!-- exc. 
força restaurants que seria en pocs anys força hegemònica a Catalunya.--> <!-- ací hi ha contradicció amb la regla adv_adjverb --> </marker> <token><exception regexp="yes">seus?|de|d'</exception></token> </pattern> <disambig action="filter" postag="A.*|V.P.*|DP.*"/> <example type="untouched">Són massivament admiradors seus.</example> </rule> <rule id="aa4b" name="aa1"> <antipattern> <token postag="VM.*" postag_regexp="yes" regexp="yes" skip="3" inflected="yes">estar|anar</token> <token min="0" max="3" postag="RG_anteposat|LOC_ADV" postag_regexp="yes"><exception postag="PR.*" postag_regexp="yes"/><exception regexp="yes">tant?</exception></token> <token postag="V.G.*" postag_regexp="yes"/> </antipattern> <pattern> <token regexp="yes" inflected="yes">ser|estar|parèixer|semblar|quedar</token> <marker> <token postag="RG.*" postag_regexp="yes" regexp="yes">molt|poc|tant|tan|força|massa|tot|més|també</token> <token postag="AQ.*|V.P.*" postag_regexp="yes"><exception postag="V.[NMIS].*|_GV_|RG" postag_regexp="yes"/><exception inflected="yes" regexp="yes">estat|part</exception><exception>nou</exception></token> </marker> <token><exception regexp="yes">seus?|de|d'</exception></token> </pattern> <disambig action="filterall"/> <example type="untouched">Són massivament admiradors seus.</example> </rule> <rule id="aa4a" name="aa1"> <!-- res de més inútil que--> <pattern> <token>res</token> <token inflected="yes">de</token> <token postag="RG_anteposat"/> <marker> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="D.*|PI.*|VS.*" postag_regexp="yes"/></token> </marker> <token regexp="yes">com|que</token> </pattern> <disambig action="filter" postag="A.*|V.P.*|_GN_.*"/> </rule> <rule id="aa5" name="aa1"> <!-- amb més públic, per a tal objectiu. 
Excep: en gairebé tots els; de més alta qualitat --> <antipattern> <token>mal</token> <token postag="A.*|V.P.*" postag_regexp="yes"/> </antipattern> <pattern> <token postag="SPS00"><exception>cap</exception></token> <token postag="RG_anteposat"><exception regexp="yes">molt|poc|tant|tan|.+ment|massa|ben</exception></token> <marker> <token postag="NC.*" postag_regexp="yes"><exception postag="D.*|PI.*|VS.*" postag_regexp="yes"/></token> </marker> <token><exception postag="NC.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="NC.*"/> </rule> <!-- cas: molt comunes. Però: tal objectiu--> <rule id="aa6" name="aa1"> <pattern> <!-- <token postag="SPS00" negate_pos="yes"/> PROVISIONAL!!! --> <marker> <and> <token postag="RG"/> <token postag="D.*" postag_regexp="yes"/> </and> </marker> <and> <token postag="AQ.*|V.P.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception postag="N.[MC][SN].*" postag_regexp="yes"/></token> </and> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule id="aa6b" name="aa1"> <pattern> <token>de</token> <marker> <and> <token postag="RG">molt</token> <token postag="D.*" postag_regexp="yes"/> </and> </marker> <and> <token postag="AQ.*|V.P.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception postag="N.[MC][SN].*" postag_regexp="yes"/></token> </and> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule id="aa7" name="la molt astuta"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="DA.*" postag_regexp="yes"/> <token postag="RG_anteposat"/> <token postag="AQ.*|V.P.*" postag_regexp="yes"><exception postag="V.[SI].*" postag_regexp="yes"/><exception>mal</exception></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule> <rule id="aa8" name="aa1"> <pattern> <token postag="D.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" 
postag_regexp="yes"/> <marker> <token postag="AQ.*|V.P.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="A.*|V.P.*|_GN_.*"/> </rule> <rule id="aa9" name="aa1"> <pattern> <token postag="D.*|N.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <marker> <token postag="AQ.*|V.P.*" postag_regexp="yes"><exception>som</exception></token> </marker> </pattern> <disambig action="filter" postag="A.*|V.P.*|_GN_.*"/> </rule> <!-- <rule id="aa10" name="aa1"> <pattern> <token postag="N.*|_GN_.*" postag_regexp="yes"><exception postag="CC"/></token> <token postag="RG.*" postag_regexp="yes"></token> <marker> <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="V.[^P].*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="A.*|V.P.*|PX.*|_GN_.*"></disambig> </rule> --> <!--<rule id="aa17" name="característiques molt particulars"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="NC.*|_GN_.*" postag_regexp="yes"><exception postag="D.*|V[SA].*|RG" postag_regexp="yes"></exception><exception regexp="yes">serè|coma</exception></token> <unify-ignore> <token postag="RG_anteposat"/> </unify-ignore> <token postag="AQ.*|V.P.*" postag_regexp="yes"><exception>seré</exception></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule>--> <rule id="aa11" name="aa1"> <!-- ampliar a LOC_ADV Però han de concordar??: que seria en pocs anys força hegemònica a Catalunya. 
Aquesta regla permet errors: "una alineació poc habitual"--> <pattern> <token postag="RG.*|V.[SI].*|PI.*|_PUNCT.*" postag_regexp="yes"/> <marker> <token postag="RG_anteposat"><exception postag="NC.*" postag_regexp="yes">força</exception><exception>quelcom</exception></token> </marker> <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="N.[MC][SN].*" postag_regexp="yes"/></token> <!--<exception postag="V.[^P].*" postag_regexp="yes"/> --> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule id="aa12" name="aa1"> <!-- ampliar a LOC_ADV --> <!-- Haurien de concordar?? --> <pattern> <token postag="N.*|_GN_.*|RG.*|V.[SI].*|PI.*" postag_regexp="yes"/> <token postag="_PUNCT.*" postag_regexp="yes"/> <marker> <token postag="RG_anteposat"><exception regexp="yes">força|tot</exception></token> </marker> <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="N.[MC][SN].*" postag_regexp="yes"/></token> <!--<exception postag="V.[^P].*" postag_regexp="yes"/> --> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule id="aa13" name="aa1"> <antipattern> <token>a</token> <token>més</token> </antipattern> <pattern> <token postag="N.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <marker> <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="V.[^P].*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="A.*|V.P.*|PX.*|_GN_.*"/> </rule> <rule id="aa14" name="aa1"> <pattern> <token postag="N.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <marker> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> </marker> <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="V.[^P].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag=".*LOC_ADV.*|RG.*"/> </rule> <rule id="aa15" name="aa1"> <pattern> <token postag="N.*" 
postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <token postag=".*LOC_ADV.*|RG.*" postag_regexp="yes"/> <marker> <token postag="AQ.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="V.[^P].*" postag_regexp="yes"/><exception>som</exception></token> </marker> </pattern> <disambig action="filter" postag="A.*|V.P.*|PX.*|_GN_.*"/> </rule> <rule id="aa16" name="aa1"> <!-- tan regular, molt dur, etc. --> <pattern> <token postag="RG_anteposat"/> <marker> <and> <token postag="AQ.*" postag_regexp="yes"/> <token postag="V.N.*" postag_regexp="yes"><exception>fer</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="A.*|_GN_.*"/> </rule> </rulegroup> <rule id="molts_mes_adj_n" name="molts més + adj + nom"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="DI.*" postag_regexp="yes" inflected="yes">molt</token> <token>més</token> <token postag="A.*" postag_regexp="yes"/> <token postag="NC.*" postag_regexp="yes"><exception postag="V.N.*" postag_regexp="yes"/></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule> <rule id="molts_mes" name="molts més + nom"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="DI.*" postag_regexp="yes" inflected="yes">molt</token> <token>més</token> <token postag="NC.*" postag_regexp="yes"><exception postag="V.N.*" postag_regexp="yes"/></token> </marker> </unify> </pattern> <disambig action="filterall"/> </rule> <rule id="via_no_prep" name="via no preposició"> <pattern> <token postag="D..FS." postag_regexp="yes"/> <marker> <token postag="NCFS000">via</token> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule id="PREP_VERB" name="no Verb conjugat darrere de preposició"> <!-- "de sumes": "sumes" no és verb. Mogut per "En forma part". 
Mogut amunt per "d'escriptura comú" Excep: per dintre sou, el vers diu --> <pattern> <token postag="SP.*|LOC_PREP" postag_regexp="yes"><exception postag="PP.*|P0.*|RG.*|_GN.*|CS" postag_regexp="yes"/></token> <token min="0" regexp="yes">[“‘«"']</token> <marker> <and> <token postag="N.*|A.*|RG|V.[NGP].*" postag_regexp="yes"><exception>diu</exception></token> <token postag="V.[MSI].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[SIM].*"/> <example type="untouched">Quants segons triga a arribar-hi?</example> </rule> <rule id="PREP_ART_VERB" name="no Verb conjugat darrere de preposició i article"> <!-- "a l'esquerra": "esquerra" no és verb . Mogut per "De les dites baronies"--> <pattern> <token postag="SP.*" postag_regexp="yes"><exception postag="RG"/></token> <token min="0" regexp="yes">[“‘«"']</token> <token postag="DA.*" postag_regexp="yes"><exception inflected="yes">es</exception></token> <token min="0" regexp="yes">[“‘«"']</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.[^NGP].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="PREP_VERBGERUND" name="no Verb gerundi darrere de preposició"> <pattern> <token postag="SP.*|.*LOC_PREP.*" postag_regexp="yes"><exception postag="PP.*|P0.*|RG.*|_GN.*|CS" postag_regexp="yes"/><exception>en</exception></token> <token min="0" postag="DA.*" postag_regexp="yes"><exception inflected="yes">es</exception></token> <marker> <and> <token postag="N.*|A.*|RG" postag_regexp="yes"/> <token postag="V.G.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.G.*"/> <example type="untouched">En acabant se'n va anar a casa.</example> </rule> <!-- gerundi/adj + nom "Ocupant llocs" Canviat de lloc per: "D'eixa important època" --> <rule id="adv_geradj_nom" name="adverbi + gerundi/adjectiu + nom"> <pattern> <token postag="RG.*" postag_regexp="yes"/> <unify> <feature 
id="nombre"/>
        <feature id="genere"/>
        <marker>
          <and>
            <token postag="V.G.*" postag_regexp="yes"/>
            <token postag="A.*" postag_regexp="yes"/>
          </and>
        </marker>
        <token postag="N.*" postag_regexp="yes"/>
      </unify>
    </pattern>
    <disambig action="filter" postag="A.*"/>
  </rule>
  <rule id="en_costes" name="en costes">
    <!-- After a V.[SI] verb or a _GV_ token: "en" read as SPS00 followed by "costes" read as NCFP000. -->
    <pattern>
      <token postag="V.[SI].*|_GV_" postag_regexp="yes"/>
      <marker>
        <token postag="SPS00">en</token>
        <token postag="NCFP000">costes</token>
      </marker>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <rule id="els_dona" name="els dona">
    <!-- "els" read as PP3CP000 followed by "dona" read as VMIP3S00. -->
    <pattern>
      <marker>
        <token postag="PP3CP000">els</token>
        <token postag="VMIP3S00">dona</token>
      </marker>
    </pattern>
    <disambig action="filterall"/>
  </rule>
  <rule id="caure_la_bava" name="caure la bava">
    <!-- An inflected verb form of "caure" before "la bava" keeps only its verb readings. -->
    <pattern>
      <marker>
        <token inflected="yes" postag="V.*" postag_regexp="yes">caure</token>
      </marker>
      <token>la</token>
      <token>bava</token>
    </pattern>
    <disambig action="filter" postag="V.*"/>
  </rule>
  <rulegroup id="verbnom_verb" name="verb/nom + verb">
    <!-- verb/noun + verb, e.g. "El diu és un dispositiu", "Aquella era havia estat" -->
    <antipattern>
      <token regexp="yes">si|quan</token>
      <token min="0">no</token>
      <token postag="&pronom_feble;" postag_regexp="yes"/>
      <token postag="V.[IS].*" postag_regexp="yes"/>
    </antipattern>
    <rule>
      <!-- D[DAI] determiner + token readable as V.[IS] verb and as noun + V.[IS] verb: the marked token keeps its non-verb readings.
           NOTE(review): the negate_pos exception appears to require that the last token has only V.[MIS] readings; confirm. -->
      <pattern>
        <token postag="D[DAI].*" postag_regexp="yes"/>
        <marker>
          <and>
            <token postag="V.[IS].*" postag_regexp="yes"/>
            <token postag="N.*" postag_regexp="yes"/>
          </and>
        </marker>
        <token postag="V.[IS].*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes" negate_pos="yes"/></token>
      </pattern>
      <disambig action="filter" postag="[^V].*"/>
    </rule>
    <rule>
      <!-- Variant with one PP/P0 pronoun between the noun/verb token (except "duran") and the verb (except VMIP1S0B). -->
      <pattern>
        <token postag="D[DAI].*" postag_regexp="yes"/>
        <marker>
          <and>
            <token postag="V.[IS].*" postag_regexp="yes"/>
            <token postag="N.*" postag_regexp="yes"><exception>duran</exception></token>
          </and>
        </marker>
        <token postag="(PP|P0).*" postag_regexp="yes"/>
        <token postag="V.[IS].*" postag_regexp="yes"><exception postag="VMIP1S0B"/></token>
      </pattern>
<disambig action="filter" postag="[^V].*"/> </rule> <rule> <pattern> <token postag="D[DAI].*" postag_regexp="yes"/> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"/> </and> </marker> <token postag="(PP|P0).*" postag_regexp="yes"/> <token postag="(PP|P0).*" postag_regexp="yes"/> <token postag="V.[IS].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule> <!-- el pare no hi és; la porta ja s'havia tancat--> <pattern> <token postag="D[DAI].*" postag_regexp="yes"/> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"><exception regexp="yes" inflected="yes">llevar|treure</exception></token> <token postag="N.*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">no|ja</token> <token postag="(PP|P0).*|V.[IS].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> </rulegroup> <rulegroup id="verb_verbGN" name="verb + GN (art+nom)"> <rule> <!-- mantenir la calma --> <pattern> <token postag="V.[ISNG].*|_GV_" postag_regexp="yes"><exception postag="N.*|AQ.*" postag_regexp="yes"/></token> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="DA.*" postag_regexp="yes"/> <marker> <and> <token postag="N.*|A.*|PX.*|V.P.*" postag_regexp="yes"/> <token postag="V.[IS].*" postag_regexp="yes"/> </and> </marker> </unify> </pattern> <disambig action="filter" postag="N.*|A.*|PX.*|V.P.*"/> </rule> <rule> <!-- retorna en paga --> <pattern> <token postag="V.[IS].*|_GV_" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes"/></token> <token>en</token> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"/> <token postag="N.*|A.*|PX.*|V.P.*" postag_regexp="yes"><exception regexp="yes">queda|resta</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="N.*|A.*|PX.*|V.P.*"/> </rule> <rule> <pattern> <token postag="(PP|P0).*" postag_regexp="yes" regexp="yes">['-].+</token> <token postag="DA.*" 
postag_regexp="yes"/> <marker> <and> <token postag="N.*|A.*|PX.*|V.P.*" postag_regexp="yes"/> <token postag="V.[IS].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="N.*|A.*|PX.*|V.P.*"/> </rule> <rule> <!-- retorna'ls en paga --> <pattern> <token postag="(PP|P0).*" postag_regexp="yes" regexp="yes">['-].+</token> <token>en</token> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> </rulegroup> <!-- eliminat per: passar les tanques correctament primer --> <!-- <rulegroup id="verbnom_adv" name="verb_nom+adverbi"> <rule> <pattern> <marker> <and> <token postag="V.[SI].*" postag_regexp="yes"></token> <token postag="NC.*" postag_regexp="yes"></token> </and> </marker> <token>de</token> <token>manera</token> <token postag="AQ0[FC]S.*" postag_regexp="yes"></token> </pattern> <disambig action="filter" postag="V.*"></disambig> </rule> <rule> <pattern> <marker> <and> <token postag="V.[SI].*" postag_regexp="yes"></token> <token postag="NC.*" postag_regexp="yes"></token> </and> </marker> <token postag="RG" postag_regexp="yes" regexp="yes">.+ment</token> <token postag="V.[SI].*" postag_regexp="yes" negate_pos="yes"></token> </pattern> <disambig action="filter" postag="V.*"></disambig> </rule> <rule> <pattern> <marker> <and> <token postag="V.[SI].*" postag_regexp="yes"></token> <token postag="NC.*" postag_regexp="yes"></token> </and> </marker> <token postag="RG" postag_regexp="yes" regexp="yes">.+ment</token> <token postag="V.[SI].*" postag_regexp="yes"></token> </pattern> <disambig action="filter" postag="N.*"></disambig> </rule> </rulegroup> --> <rule id="nom_nomverb" name="nom + verb/nom"> <pattern> <!-- a quina xifra correspon; punts dobles volien dir; a petita escala --> <token postag="N.*" postag_regexp="yes"><exception postag="V.*|D.*|A.*|V.P.*|_GV_|C.*|RG.*|complement|.*LOC.*" postag_regexp="yes"/><exception 
inflected="yes" regexp="yes">mot|paraula|terme|expressió|vocable|nom|tipus|denominació|numeral</exception></token> <token min="0">no</token> <marker> <and> <token postag="V.*" postag_regexp="yes"><exception regexp="yes">força|\p{Lu}.*|brossa</exception></token> <token postag="N.*" postag_regexp="yes"><exception postag="_GN_.*|A.*|V.P.*|PX.*|VMIP1S0.?" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> <!-- sobre --> </rule> <!-- el seu disseny també queda Però: posar en explotació prou terres--> <!--<rule id="nom_nomverb2" name="nom + adv + verb/nom"> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="V.*|D.*|A.*|V.P.*|_GV_|C.*|RG.*|complement" postag_regexp="yes" /></token> <token postag="RG_anteposat"/> <marker> <and> <token postag="V.*" postag_regexp="yes" /> <token postag="N.*" postag_regexp="yes"><exception postag="_GN_.*|A.*|V.P.*|PX.*|VMIP1S0.?" postag_regexp="yes" /></token> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"></disambig> </rule>--> <!-- sobre --> <rule id="infinitiu_nomverb" name="infinitiu + verb/nom"> <!-- és típic menjar ou --> <pattern> <token postag="V.N.*" postag_regexp="yes"><exception postag="complement"/></token> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"><exception regexp="yes">era|eres</exception></token> <token postag="NC.*" postag_regexp="yes"><exception postag="A.*|V.P.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="sota0" name="sota preposició"> <pattern> <marker> <token postag="SPS00">sota<exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="D.*" postag_regexp="yes"><exception inflected="yes">es</exception></token> <token postag="[AN].*|V.P.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filterall"/> </rule> <rule id="nomverb_nom" name="nom + verb/nom"> <antipattern> <token postag="SPS00|D[DI].*|PX.*|.*LOC_PREP.*" 
postag_regexp="yes"/> <token min="0" postag="_QM_OPEN"/> <token postag="NC.*" postag_regexp="yes"/> </antipattern> <pattern> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"><exception inflected="yes" regexp="yes">nom|persona|ritme|sexe</exception><exception postag="VMIP1S0B"/><exception regexp="yes">dona|dones</exception></token> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN.*|A.*|PX.*|V.P.*|D.*|SPS.*|NP.*" postag_regexp="yes"/></token> </and> </marker> <token postag="NC.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes" negate_pos="yes"/><exception regexp="yes">\d.*|p|propietat|consort|mare|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|estrela|model|hoste|base</exception></token> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="nomverb_verb" name="nom/verb + verb"> <antipattern> <token>va</token> <token postag="VMIS3S00"/> </antipattern> <pattern> <token><exception postag="&pronom_feble;|RN" postag_regexp="yes"/></token> <marker> <and> <token postag="V.[GMSI].*" postag_regexp="yes"/> <token postag="NC.*|A.*|V.P.*|PX.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/><exception regexp="yes">som|fan|creixen</exception></token> </and> </marker> <!-- No està ben resolt?? 
--> <token min="0" max="3" postag="&pronom_feble;|RN" postag_regexp="yes"><exception regexp="yes">['-].+</exception></token> <token postag="V.[SI].*" postag_regexp="yes"><exception postag="V.[MSI].*|_GV_" postag_regexp="yes" negate_pos="yes"/><exception postag="VMIP1S0B"/></token> </pattern> <disambig action="remove" postag="V.[GMSI].*"/> </rule> <rule id="verb_nomverb" name="verb + nom/verb"> <pattern> <!--<exception postag="V.[NMSI].*|PP.*|P0.*|_GV_" postag_regexp="yes" negate_pos="yes" /> --> <token postag="V.[NMSI].*|_GV_|PP.*|P0.*" postag_regexp="yes"><exception postag="V.[NMSI].*|PP.*|P0.*|_GV_" postag_regexp="yes" negate_pos="yes"/><exception postag="PP.*|P0.*" postag_regexp="yes" regexp="yes">[^'-].+</exception><exception regexp="yes">jo|mi|tu|ella?|nosaltres|vosaltres|elle?s|vost[èé]s?|vós|men</exception></token> <marker> <and> <token postag="V.[SIM].*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"><exception regexp="yes">era|va|seré|fou|queda|troba|estaria|estaries</exception><exception postag="_GV_" postag_regexp="yes"/></token> <!--_GN_.*--> </and> </marker> <token><exception postag="P[P0].*" postag_regexp="yes" regexp="yes">['-].+</exception></token> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <!-- <rule> <pattern mark="1"> <token regexp="yes">al|del|pel</token> <token postag="N.[MC][SN].*|A..[MC][SN].*|V.P..SM" postag_regexp="yes"></token> </pattern> <disambig action="filter" postag="N.*|A.*|V.P.*"></disambig> </rule> <rule> <pattern mark="1"> <token regexp="yes">als|dels|pels|cals</token> <token postag="N.[MC][PN].*|A..[MC][PN].*|V.P..PM" postag_regexp="yes"></token> </pattern> <disambig action="filter" postag="N.*|A.*|V.P.*"></disambig> </rule> </rulegroup> --> <rule id="segons1" name="segons + pronom"> <pattern> <marker> <token postag="CS">segons</token> </marker> <token postag="(DE|DT|PT).*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="CS"/> </rule> <rule id="EM_DEU" name="em deu: excepció a 
les regles següents"> <pattern> <token postag="&pronom_feble;" postag_regexp="yes"/> <marker> <and> <token postag="DN0CP0">deu</token> <token postag="V.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> <rule id="si_nom" name="si nom"> <pattern> <token postag="D[^R].MS.|PX.MS.*" postag_regexp="yes"/> <marker> <token>si</token> </marker> <token postag="SENT_END|_PUNCT.*|C.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule id="nNom0" name="no Nom"> <!-- no són noms si no han concordat amb determinants. Mogut per "ens ensenya"--> <antipattern> <token>personal</token> <token regexp="yes">de|d'</token> </antipattern> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">demà|liderats?|oi|queda|formi|baixa|porto|troba|trobes|ara|esper|vau|he|deixa|deixes|sap|pren|allò|breu|sec|personal|fou|crec|davant|darrere|damunt|davall|sota|ve|tornés|seré|estic|som|sou|amples?|creix|fem|res|si|bé|perquè|però|dins|real|era|eres|dius?|fals<exception postag="_GN.*" postag_regexp="yes"/><exception case_sensitive="yes">Era</exception></token> <token postag="[AVRIPC].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="N.*"/> </rule> <rule id="nNomMasculi" name="no Nom masculí si no ha concordat"> <pattern> <marker> <token postag="NCF.*" postag_regexp="yes" inflected="yes">por<exception postag="_GN_M.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="NCF.*|_GN_F.*"/> </rule> <rule id="nNomFemeni" name="no Nom femení si no ha concordat"> <!-- on té molt poc pes --> <pattern> <marker> <and> <token inflected="yes" regexp="yes">pe|posterior|estaria|truca|espera<exception postag="_GN_F.*" postag_regexp="yes"/></token> <token postag="NCF.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="remove" 
postag="NCF.*"/> </rule> <rulegroup id="som" name="què som"> <rule> <pattern> <token regexp="yes">qui|quins|què|quant|quants|com|nosaltres|pocs|poques|ja</token> <marker> <token postag="VSIP1P00">som</token> </marker> </pattern> <disambig action="remove" postag="A.*|N.*"/> </rule> <rule> <pattern> <marker> <token postag="VSIP1P00">som</token> </marker> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="A.*|N.*"/> </rule> <rule> <pattern> <marker> <token postag="VSIP1P00">som</token> </marker> <token postag="D.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="A.*|N.*"/> </rule> </rulegroup> <rule id="adj_punct" name="adjectiu no verb abans de puntuació"> <!-- Però: Quants anys tens, Ricard? ¿Quina edat tens..., seixanta-vuit?--> <antipattern> <token regexp="yes">contestà|tens</token> <token>:</token> </antipattern> <pattern> <token><exception regexp="yes">no|que|ja|perquè|encara|com</exception><exception postag="&pronom_feble;" postag_regexp="yes"/><exception postag="PI.*" postag_regexp="yes" inflected="yes">altre</exception></token> <marker> <and> <token postag="AQ.*" postag_regexp="yes"><exception regexp="yes">sabeu|tornés|bufa|som|molesta|viu|accepta|acceptes?|va|expressa|baixa|desperta</exception></token> <!--tens|plana. 
Exception: rates --> <token postag="V.[SI].*" postag_regexp="yes"/> </and> </marker> <token postag="_PUNCT.*" postag_regexp="yes"><exception regexp="yes">[\?!\(]</exception></token> </pattern> <disambig action="filter" postag="AQ.*|_GN_.*|N.*"/> </rule> <rulegroup id="NoAdj" name="no adjectiu si no han concordat"> <!-- excepció a la regla --> <rule> <pattern> <token regexp="yes">tan|molt|gens|lo</token> <!-- "tan amic", però "encara seré" --> <marker> <and> <token postag="A.*" postag_regexp="yes" regexp="yes">artista|artistes|amics?|amiga|amigues|seré|accepta|acceptes|fer<exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="[NV].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="[NV].*"/> </rule> <!-- no són adj si no han concordat amb determinants. Mogut per "ens ensenya"--> <rule> <pattern> <marker> <and> <token postag="A.*|V.P.*" postag_regexp="yes" regexp="yes">enllumenat|contractes?|contracta|artista|artistes|manca|donant|amics?|amiga|amigues|pega|muntà|corredors?|sabeu|xiquets?|muntés|accepta|envolta|tornés|seré|escolta|talar|afectes?|acceptes?|afecta<exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="N.*|V.[^P].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="A.*|V.P.*"/> </rule> <rule> <pattern> <token><exception postag="RG_anteposat"/></token> <marker> <and> <token postag="A.*" postag_regexp="yes" regexp="yes">som|tens<exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="A.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^A].*"/> </rule> <rule> <pattern> <token inflected="yes">fer</token> <marker> <token postag="AQ.*" postag_regexp="yes" inflected="yes">possible</token> </marker> </pattern> <disambig action="filter" postag="AQ.*"/> </rule> <rule> <pattern> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes">animal</token> </marker> <token 
regexp="yes">de|d'</token> </pattern> <disambig action="filter" postag="N.*"/> </rule> </rulegroup>
  <!-- Noun number after a number written in digits. -->
  <rulegroup id="numeral_nom" name="numeral + nom plural">
    <rule>
      <!-- Digits other than "1" (and not tagged _C_TEMPS) followed by a common noun
           whose number is P or N: the singular noun readings are removed. -->
      <pattern>
        <token regexp="yes">(\d[\d.,]+\d|\d+)<exception>1</exception><exception postag="_C_TEMPS"/></token>
        <marker>
          <token postag="NC.[PN].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token>
        </marker>
      </pattern>
      <disambig action="remove" postag="NC.S.*"/>
    </rule>
    <rule>
      <!-- The literal "1" followed by a common noun whose number is S or N:
           the plural noun readings are removed. -->
      <pattern>
        <token>1</token>
        <marker>
          <token postag="NC.[SN].*" postag_regexp="yes"/>
        </marker>
      </pattern>
      <disambig action="remove" postag="NC.P.*"/>
    </rule>
  </rulegroup>
  <!-- Numeral determinants (DN). The name previously read "deternimants"; it is now
       spelled like the name of the DetNum rulegroup further down the file. -->
  <rulegroup id="determinants_numerals" name="determinants numerals">
    <rule>
      <!-- Three DN tokens in a row: the first two (inside the marker) are
           filtered with "filterall". -->
      <pattern>
        <marker>
          <token postag="DN.*" postag_regexp="yes"/>
          <token postag="DN.*" postag_regexp="yes"/>
        </marker>
        <token postag="DN.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="filterall"/>
    </rule>
    <rule>
      <!-- A DN token directly before a plural noun: only the DN and _GN readings are kept. -->
      <pattern>
        <marker>
          <token postag="DN.*" postag_regexp="yes"/>
        </marker>
        <token postag="N..P.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="filter" postag="DN.*|_GN.*"/>
    </rule>
  </rulegroup>
  <rulegroup id="nou" name="nou (adj/nom/numeral)"> <rule> <pattern> <token>altres</token> <marker> <token>nou</token> </marker> </pattern> <disambig action="remove" postag="V.*|NC.S000|AQ..S."/> </rule> <rule> <pattern> <token>el</token> <marker> <token>nou</token> </marker> </pattern> <disambig action="remove" postag="V.*|NCFS000"/> </rule> <rule> <pattern> <token>tan</token> <marker> <token>nou</token> </marker> </pattern> <disambig action="remove" postag="V.*|NCFS000|DN.*|NC.*"/> </rule> <rule> <pattern> <marker> <token postag="NCFS000">nou</token> <token postag="AQ0FS0">moscada</token> </marker> </pattern> <disambig action="filterall"/> </rule> <rule> <pattern> <token postag="DA..P." postag_regexp="yes"/> <marker> <token>nou</token> </marker> </pattern> <disambig action="remove"> <wd pos="AQ0MS0"/> </disambig> </rule> <rule> <pattern> <token postag="D[^R].FS."
postag_regexp="yes"/> <marker> <token>nou</token> </marker> </pattern> <disambig action="filter" postag="NCFS.*|_GN_FS"/> </rule> <rule> <pattern> <token><exception postag="D[^R].*" postag_regexp="yes"/></token> <marker> <token>nou</token> </marker> <token postag="N.[MC][SN].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="AQ.MS.*|_GN_MS"/> </rule> <rule> <pattern> <marker> <and> <token>nou</token> <token postag="_GN_MS" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="NCFS000"/> </disambig> </rule> <rule> <pattern> <token>tot</token> <marker> <token>nou</token> </marker> <token><exception postag="[AN].*[FMC][PN].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="AQ.MS.*|_GN_MS"/> </rule> </rulegroup> <rulegroup id="molt_no_adverbi" name="molt no adverbi"> <rule> <pattern> <marker> <and> <token postag="RG.*" postag_regexp="yes"><exception>massa</exception></token> <token postag="DI.[MC][SN].*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">de|d'</token> <token postag="N.[MC][SN].*" postag_regexp="yes"><exception regexp="yes">fons|si|acord</exception></token> </pattern> <disambig action="filter" postag="[^R].*"/> </rule> <rule> <pattern> <marker> <and> <token postag="RG.*" postag_regexp="yes"><exception>massa</exception></token> <token postag="DI.[MC][SN].*" postag_regexp="yes"/> </and> </marker> <token postag="N.[MC][SN].*" postag_regexp="yes"><exception postag="AQ.[MC][SN].|V.N.*" postag_regexp="yes"/><exception regexp="yes">fons|si</exception></token> </pattern> <disambig action="filter" postag="[^R].*"/> </rule> <rule> <!-- massa coses --> <!-- massa material: ambiguous --> <pattern> <marker> <and> <token postag="RG.*" postag_regexp="yes">massa</token> <token postag="DI.CN.*" postag_regexp="yes"/> </and> </marker> <token postag="N.*" postag_regexp="yes"><exception regexp="yes">fons|si|fondo</exception></token> </pattern> <disambig action="filter" postag="[^R].*"/> 
</rule> </rulegroup> <rule id="massa" name="massa no nom"> <pattern> <token><exception postag="D[^R].FS." postag_regexp="yes"/></token> <marker> <token postag="DI.CN.*" postag_regexp="yes">massa<exception postag="_GN_FS"/></token> </marker> <token postag="N.*|A.*" postag_regexp="yes"><exception>nul·la</exception></token> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule id="TOT_gerundi" name="tot + gerundi"> <pattern> <token>tot</token> <marker> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="V.G.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule id="gens" name="gens + adj"> <antipattern> <token postag="D..FS." postag_regexp="yes"/> <token>massa</token> </antipattern> <pattern> <token postag="RG.*" postag_regexp="yes" regexp="yes">gens|massa</token> <token postag="AQ.*|RG.*" postag_regexp="yes"><exception postag="C.*|P[0P].*" postag_regexp="yes"/></token> </pattern> <disambig action="filterall"/> </rule> <rule id="poc_capital" name="poc capital"> <pattern> <token postag="DI0MS0">poc</token> <token postag="NCMS000">capital</token> </pattern> <disambig action="filterall"/> </rule> <rule id="en_prep" name="en (preposició)"> <pattern> <token postag="V.P.*" postag_regexp="yes"/> <marker> <token postag="SPS00">en</token> </marker> <token regexp="yes">\p{Lu}.*</token> </pattern> <disambig action="filter" postag="SPS00"/> </rule> <rule id="JO" name="jo mateixa"> <pattern> <token postag="PP1CSN00">jo</token> <token postag="AQ0FS0">mateixa</token> </pattern> <disambig action="filterall"/> </rule> <rulegroup id="DetNom" name="Determinant + nom"> <!-- TODO: some cases should be distinguished or eliminated, for example DN + DI. 
The DA+NC case must be handled separately: it is the only problematic one. --> <antipattern> <token inflected="yes">un</token> <token inflected="yes">poc</token> <token postag="N.*" postag_regexp="yes"/> </antipattern> <antipattern> <token regexp="yes">uns|unes</token> <token postag="DN.*" postag_regexp="yes"/> </antipattern> <antipattern> <token postag="V.[MGN].*" postag_regexp="yes"/> <!-- a hyphen is missing --> <token>la</token> <token>a</token> <token postag="V.N.*|contraccio|D.*" postag_regexp="yes"/> </antipattern> <rule> <pattern> <marker> <token postag="D[^RA].[M][SN0].*" postag_regexp="yes"><exception postag="RG" regexp="yes">tant|molt|poc</exception></token> </marker> <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception>la</exception></token> </pattern> <disambig action="filter" postag="D.*"/> </rule> <rule> <pattern> <token postag="D[^RA].[M][SN0].*" postag_regexp="yes"><exception postag="RG" regexp="yes">tant|molt|poc</exception></token> <marker> <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception regexp="yes">passi|la</exception><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <!-- exception to the next rule --> <pattern> <token postag="D[^RA].[F][SN0].*" postag_regexp="yes">sa</token> <marker> <token postag="N.[FC][SN0].*" postag_regexp="yes">casa</token> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <marker> <token postag="D[^RA].[F][SN0].*" postag_regexp="yes"/> </marker> <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception postag="VMIP3S0.?" 
postag_regexp="yes"/></token> <!-- quan aquesta vibra --> </pattern> <disambig action="filter" postag="D.*"/> </rule> <rule> <pattern> <token postag="D[^RA].[F][SN0].*" postag_regexp="yes"/> <marker> <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception postag="VMIP3S0.?" postag_regexp="yes"/><exception>nova</exception></token> <!-- quan aquesta vibra --> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <marker> <token postag="D[^RAN].[M][PN0].*" postag_regexp="yes"/> </marker> <token postag="N.[MC][PN0].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="D.*"/> </rule> <rule> <pattern> <token postag="D[^RAN].[M][PN0].*" postag_regexp="yes"/> <marker> <token postag="N.[MC][PN0].*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <pattern> <marker> <token postag="D[^RAN].[F][PN0].*" postag_regexp="yes"/> </marker> <token postag="N.[FC][PN0].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="D.*"/> </rule> <rule> <pattern> <token postag="D[^RAN].[F][PN0].*" postag_regexp="yes"/> <marker> <token postag="N.[FC][PN0].*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <rule> <!-- He canviat (N|A.|PX) per (N). Per què no hi ha V.P.* ? No cal? --> <pattern> <marker> <token postag="D[^R].[MC][SN0].*" postag_regexp="yes"><exception postag="RG" regexp="yes">força|tant|molt|poc</exception></token> <token postag="(N|A.|PX).[MC][SN0].*|V.P..SM." postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[FC][SN0].*" postag_regexp="yes"><exception>força</exception></token> <token postag="(N|A.|PX).[FC][SN0].*|V.P..SF." 
postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <!-- excep: massa temps --> <pattern> <marker> <token postag="D[^R].[MC][PN0].*" postag_regexp="yes"><exception regexp="yes">força|gens</exception></token> <token postag="(N|A.|PX).[MC][PN0].*|V.P..PM." postag_regexp="yes"><exception postag="DN.*|_GN_MS" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="D[^R].[FC][PN0].*" postag_regexp="yes"><exception>força</exception></token> <token postag="(N|A.|PX).[FC][PN0].*|V.P..PF." postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rulegroup id="nom_neutre" name="desambigua nom neutre o masculí i femení alhora"> <!-- Desambigua un nom neutre o masculí i femení alhora. El llum, els alumnes. 
Excepció: L'intel·lectual --> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_MS"><exception postag="_GN_FS"/></token> </and> <marker> <and> <token postag="NCCS.*|NCMN.*|NCCN.*" postag_regexp="yes"/> <token postag="_GN_MS"/> </and> </marker> </pattern> <disambig action="add"> <wd pos="NCMS000"/> </disambig> </rule> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_FS"><exception postag="_GN_MS"/></token> </and> <marker> <and> <token postag="NCCS.*|NCFN.*|NCCN.*" postag_regexp="yes"/> <token postag="_GN_FS"/> </and> </marker> </pattern> <disambig action="add"> <wd pos="NCFS000"/> </disambig> </rule> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_MP"/> </and> <marker> <and> <token postag="NCCP.*|NCMN.*|NCCN.*" postag_regexp="yes"/> <token postag="_GN_MP"/> </and> </marker> </pattern> <disambig action="add"> <wd pos="NCMP000"/> </disambig> <!-- how to preserve the lemma? 
--> </rule> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_FP"/> </and> <marker> <and> <token postag="NCCP.*|NCFN.*|NCCN.*" postag_regexp="yes"/> <token postag="_GN_FP"/> </and> </marker> </pattern> <disambig action="add"> <wd pos="NCFP000"/> </disambig> </rule> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_MS"><exception postag="_GN_FS"/></token> </and> <marker> <and> <token postag="NC[MC][SN].*" postag_regexp="yes"><exception postag="V.[NSI].*|PX.*" postag_regexp="yes"/></token> <token postag="_GN_MS"><exception>passi</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="NCMS000|_GN_MS"/> </rule> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_FS"><exception postag="_GN_MS"/></token> </and> <marker> <and> <token postag="NC[FC][SN].*" postag_regexp="yes"><exception>nova</exception></token> <token postag="_GN_FS"><exception postag="V.[SI].*" postag_regexp="yes"/></token> <!-- quan aquesta vibra --> </and> </marker> </pattern> <disambig action="filter" postag="NCFS000|_GN_FS"/> </rule> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_MP"><exception postag="_GN_FP"/></token> </and> <marker> <and> <token postag="NC[MC][PN].*" postag_regexp="yes"/> <token postag="_GN_MP"/> </and> </marker> </pattern> <disambig action="filter" postag="NCMP000|_GN_MP"/> </rule> <rule> <pattern> <and> <token postag="D.*|PX.*" postag_regexp="yes"/> <token postag="_GN_FP"><exception postag="_GN_MP"/></token> </and> <marker> <and> <token postag="NC[FC][PN].*" postag_regexp="yes"/> <token postag="_GN_FP"/> </and> </marker> </pattern> <disambig action="filter" postag="NCFP000|_GN_FP"/> </rule> </rulegroup> <rulegroup id="ordinal_parts" name="ordinal + parts"> <rule> <pattern> <marker> <token postag="AO.*" postag_regexp="yes"/> </marker> <token regexp="yes">parts?</token> </pattern> <disambig 
action="filter" postag="AO.*|_GN_.*"/> </rule> <rule> <pattern> <token postag="AO.*" postag_regexp="yes"/> <marker> <token regexp="yes">parts?</token> </marker> </pattern> <disambig action="filter" postag="NC.*|_GN_.*"/> </rule> </rulegroup> <!-- numeral seguit de nom o adjectiu--> <rulegroup id="DetNum" name="determinants numerals"> <rule> <pattern> <marker> <token postag="DN.*" postag_regexp="yes"><exception postag="[NA].*" postag_regexp="yes"/></token> </marker> <token postag="(N|A|RG).*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="DN.*|_GN.*"/> </rule> <rule> <pattern> <token postag="DN.*" postag_regexp="yes"/> <marker> <token postag="DN.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="DN.*|_GN.*"/> </rule> <rule> <pattern> <marker> <token postag="DN.*" postag_regexp="yes"/> </marker> <token postag="DN.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="DN.*|_GN.*"/> </rule> </rulegroup> <rulegroup id="TOT" name="tot (determinant, nom o pronom)"> <rule> <!-- Nom si ha concordat--> <pattern> <and> <token postag="N.*" postag_regexp="yes">tot</token> <token postag="_GN_MS"/> </and> </pattern> <disambig action="filter" postag="N.*|_GN.*"/> </rule> <rule> <!-- No nom si no ha concordat--> <pattern> <and> <token postag="N.*" postag_regexp="yes">tot</token> <token postag="N.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule> <!-- pronom (en algun cas) si no concorda amb les paraules següents --> <pattern> <token postag="V.*" postag_regexp="yes" skip="1"/> <token>entre</token> <unify negate="yes"> <feature id="nombre"/> <feature id="genere"/> <marker> <token regexp="yes">tote?s</token> </marker> <and> <token postag="D.*" postag_regexp="yes"/> <token postag="_GN_.*" postag_regexp="yes"/> </and> </unify> </pattern> <disambig action="filter" postag="P.*"/> <!-- destacaren entre tots la figura de Joan Amades --> <!-- 
ens volen fer pagar entre tots la mala gestió --> </rule> <rule> <!-- pronom (en algun cas) si no concorda amb les paraules següents --> <pattern> <token postag="V.*|SPS00" postag_regexp="yes" skip="1"/> <unify negate="yes"> <feature id="nombre"/> <feature id="genere"/> <marker> <token regexp="yes">tote?s</token> </marker> <and> <token postag="D.*" postag_regexp="yes"/> <token postag="_GN_.S" postag_regexp="yes"/> </and> </unify> </pattern> <disambig action="filter" postag="P.*"/> <!-- Espero que trobeu totes la pàgina --> <!-- ens volen fer pagar entre tots la mala gestió --> </rule> <rule> <!--determinant si concorda amb les paraules següents--> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="D.*" postag_regexp="yes" inflected="yes">tot</token> </marker> <and> <token postag="D.*" postag_regexp="yes"/> <token postag="_GN_.*" postag_regexp="yes"/> </and> </unify> </pattern> <disambig action="filter" postag="D.*|_GN_.*"/> </rule> <rule> <!-- tot això--> <pattern> <marker> <token postag="DI.*" postag_regexp="yes">tot</token> </marker> <token postag="PD0NS000"/> </pattern> <disambig action="filter" postag="DI.*"/> </rule> <!-- eren tots família --> <rule> <pattern> <token postag="V.[MSI]..P.." postag_regexp="yes"/> <token min="0" max="1" postag="V.P.*" postag_regexp="yes"/> <marker> <token postag="PI..P..." postag_regexp="yes" inflected="yes">tot<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="PI.*"/> </rule> <rule> <pattern> <token postag="V.[MSI]..P.." postag_regexp="yes"/> <token min="0" max="1" postag="V.P.*" postag_regexp="yes"/> <token>pas</token> <marker> <token postag="PI..P..." postag_regexp="yes" inflected="yes">tot<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="PI.*"/> </rule> <rule> <pattern> <token postag="V.[MSI]..S.." 
postag_regexp="yes"/> <token min="0" max="1" postag="V.P.*" postag_regexp="yes"/> <marker> <token postag="PI..S..." postag_regexp="yes" inflected="yes">tot<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="PI.*"/> </rule> <rule> <pattern> <token postag="V.[MSI]..S.." postag_regexp="yes"/> <token min="0" max="1" postag="V.P.*" postag_regexp="yes"/> <token>pas</token> <marker> <token postag="PI..S..." postag_regexp="yes" inflected="yes">tot<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="PI.*"/> </rule> <rule> <pattern> <token regexp="yes">ho|-ho</token> <token min="0" max="3" postag="V.*|SPS.*" postag_regexp="yes"/> <marker> <token>tot<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="PI.*"/> </rule> <!-- amb locucions preposicionals --> <rule id="baix_de_tot" name="baix de tot"> <pattern> <token regexp="yes">baix|dalt|capdavall|sobre|damunt</token> <token>de</token> <marker> <token postag="PI.*" postag_regexp="yes">tot<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="PI.*"/> </rule> <rule> <!-- totes de--> <pattern> <marker> <token postag="PI.*" postag_regexp="yes" inflected="yes">tot</token> </marker> <token regexp="yes">de|d'</token> </pattern> <disambig action="filter" postag="PI.*"/> </rule> <rule> <!-- tot, --> <pattern> <marker> <token postag="PI.*" postag_regexp="yes" inflected="yes">tot</token> </marker> <token postag="_PUNCT.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="PI.*"/> </rule> </rulegroup> <rule id="P0_DA" name="pronom feble i article: pronom feble"> <antipattern> <token postag="SPS00|LOC_PREP" postag_regexp="yes"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="[NA].*|V.P.*" postag_regexp="yes"/> </antipattern> <!--mogut per 
"L'ens"--> <pattern> <marker> <and> <token postag="DA.*" postag_regexp="yes"><exception regexp="yes">en|n'</exception></token> <token postag="P[0P].*" postag_regexp="yes"/> </and> </marker> <token postag="P[0P].*" postag_regexp="yes"><exception regexp="yes">si|jo|mi|tu|ella?|nosaltres|vosaltres|elle?s|vostès?|vós</exception></token> </pattern> <disambig action="filter" postag="P0.*|PP.*"/> </rule> <rulegroup id="seu_de" name="seu (nom) de"> <rule> <pattern> <marker> <token postag="_GN_F." postag_regexp="yes" regexp="yes">seus?</token> </marker> <token regexp="yes">de|d'|i</token> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> </rulegroup> <rule id="nNom0a" name="no Nom"> <!-- no són noms si no han concordat. --> <antipattern> <token>manca</token> <token regexp="yes">de|d'</token> </antipattern> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">ocupa|ocupes|surts?|sobre|caus?|resulta|manca|sabeu<exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="N.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule id="nNomMasculi2" name="no Nom masculí si no ha concordat"> <pattern> <marker> <token postag="NCF.*" postag_regexp="yes" inflected="yes">base1<exception postag="_GN_M.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="NCF.*|_GN_F.*|V.*"/> </rule> <rule id="forma_verb" name="forma (verb) excepció a la regla següent"> <pattern> <marker> <token postag="V.*" postag_regexp="yes" regexp="yes">forma|tomba<exception postag="_GN_FS"/></token> </marker> <token postag="N.*|D.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.*|_GV_"/> </rule> <rulegroup id="AdjNom" name="adj + nom"> <antipattern> <token regexp="yes">\p{Lu}.*<exception scope="previous" postag="SENT_START"/></token> <token postag="V.[IS].*" postag_regexp="yes"/> </antipattern> <rule> <pattern> <marker> 
<token postag="A..[MC][SN0].*|V.P..SM.?|PX.[MC][SN0].*" postag_regexp="yes"><exception postag="AQ0CN0|_GV_|N.CN.*|VAP00SM0" postag_regexp="yes"/><exception inflected="yes" regexp="yes">poder|voler|saber</exception></token> <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception regexp="yes">recull|ens|estic|tant|cap|son|ser</exception><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="A..[FC][SN0].*|V.P..SF.?|PX.[FC][SN0].*" postag_regexp="yes"><exception postag="AQ0CN0|_GV_|N.CN.*" postag_regexp="yes"/><exception inflected="yes" regexp="yes">poder|voler|saber</exception></token> <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">parla|cap|son</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="A..[MC][PN0].*|V.P..PM.?|PX.[MC][PN0].*" postag_regexp="yes"><exception postag="AQ0CN0|_GV_|N.CN.*" postag_regexp="yes"/><exception inflected="yes" regexp="yes">poder|voler|saber</exception></token> <token postag="N.[MC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="A..[FC][PN0].*|V.P..PF.?|PX.[FC][PN0].*" postag_regexp="yes"><exception postag="AQ0CN0|_GV_|N.CN.*" postag_regexp="yes"/><exception inflected="yes" regexp="yes">poder|voler|saber</exception></token> <token postag="N.[FC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rule id="nNom0b" name="no Nom"> <!-- no són noms si no han concordat. 
--> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">quina|quines|trobar|pega|mostra|mostres|conserva|conserves|donant|racista|racistes<exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="N.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="N.*"/> </rule> <rulegroup id="NomAdj" name="nom + adj"> <!-- falta participi+nom: requereix tractament especial --> <!-- QUÈ PASSA: en les seves múltiples disciplines. --> <!-- la teva brillant llum // les seves múltiples disciplines<exception postag="A..C.*" postag_regexp="yes"></exception> "Dura massa" --> <!-- les seves múltiples disciplines<exception postag="A..C.*" postag_regexp="yes"></exception> --> <rule> <pattern> <marker> <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">estic|seré</exception></token> <token postag="A..[MC][SN0].*|V.P..SM.?|PX.[MC][SN0].*" postag_regexp="yes"><exception postag="AO.*|AQ0CN0" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <!-- fill meu, fill seu--> <pattern> <token postag="N.[MC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> <marker> <token postag="PX.[MC][SN0].*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="PX.*"/> </rule> <rule> <!-- fills meus, fills seus --> <pattern> <token postag="N.[MC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> <marker> <token postag="PX.[MC][PN0].*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="PX.*"/> </rule> <rule> <pattern> <marker> <token postag="N.[FC][SN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception regexp="yes">fou|queda</exception></token> <token postag="A..[FC][SN0].*|V.P..SF.?|PX.[FC][SN0].*" 
postag_regexp="yes"><exception postag="AO.*|AQ0CN0" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> <wd pos="_GN_FS"/> </disambig> </rule> <!-- Noun followed by an agreeing adjective, participle or possessive (masculine/common, plural): both words get the _GN_MP tag. --> <rule> <pattern> <marker> <token postag="N.[MC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/><exception inflected="yes">més</exception></token> <token postag="A..[MC][PN0].*|V.P..PM.?|PX.[MC][PN0].*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> <wd pos="_GN_MP"/> </disambig> </rule> <!-- Feminine/common plural counterpart: both words get the _GN_FP tag. --> <rule> <pattern> <marker> <token postag="N.[FC][PN0].*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> <token postag="A..[FC][PN0].*|V.P..PF.?|PX.[FC][PN0].*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <!-- ser_atribut_adjectiu: after a form of ser/estar/parèixer/semblar, a word that is tagged both as adjective and as noun is treated as an attribute and loses its noun readings. The two lexical rules below run first and do the opposite for fixed noun expressions. --> <rulegroup id="ser_atribut_adjectiu" name="ser + atribut (adjectiu)"> <!--exceptions--> <!-- "mitjà de comunicació|transport|informació": the noun reading of "mitjà" is kept by removing its adjective readings. --> <rule> <pattern> <marker> <token postag="N.*" postag_regexp="yes" inflected="yes">mitjà</token> </marker> <token>de</token> <token regexp="yes" inflected="yes">comunicació|transport|informació</token> </pattern> <disambig action="remove" postag="A.*"/> </rule> <!-- "divisòria d'aigües": adjective readings of "divisòria" are removed. --> <rule> <pattern> <marker> <token postag="N.*" postag_regexp="yes">divisòria</token> </marker> <token>d'</token> <token>aigües</token> </pattern> <disambig action="remove" postag="A.*"/> </rule> <!-- main rule --> <!-- The verb and the marked word must unify in number. The marked word must carry both an A.* and an N.* reading, must not already belong to a noun group (_GN.*), and its noun lemma must not be in the exception list. Antipatterns: "fora" followed by a finite verb, and noun + coordinator/comma + noun. --> <rule> <antipattern> <token>fora</token> <token postag="V.[ISM].*" postag_regexp="yes"/> </antipattern> <antipattern> <token postag="NC.*" postag_regexp="yes"/> <token postag_regexp="yes" postag="CC|_PUNCT_CONT"/> <token postag="NC.*" postag_regexp="yes"/> </antipattern> <pattern> <unify> <feature id="nombre"/> <token inflected="yes" regexp="yes">ser|estar|parèixer|semblar</token> <marker> <and> <token postag="A.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="N.*" postag_regexp="yes"><exception inflected="yes" 
regexp="yes" postag="N.*" postag_regexp="yes">reflex|desert|motiu|foguera|mestre|director|corba|sinònim|part|líder|mà|iniciativa</exception></token> </and> </marker> </unify> <!-- The exception above is matched against lemmas (inflected="yes"), so every alternative has to be a real lemma; "part" protects sentences such as "és part de…". --> <!--<token><exception inflected="yes">de</exception></token>--> </pattern> <disambig action="remove" postag="N.*"/> <example type="untouched">Aquesta impressió és reflex de la situació.</example> <example type="untouched">Són mones albines.</example> <example type="untouched">Si fora bufa vent, ens quedem a casa.</example> <example type="untouched">Aquest capítol és part del llibre.</example> <!--<example type="untouched">Són mitjans de comunicació.</example>--> </rule> <!-- Same removal of noun readings for the adjective lemma "alt", without number unification and without the noun + coordinator antipattern. --> <rule> <antipattern> <token>fora</token> <token postag="V.[ISM].*" postag_regexp="yes"/> </antipattern> <pattern> <token inflected="yes" regexp="yes">ser|estar|parèixer|semblar</token> <marker> <and> <token postag="A.*" postag_regexp="yes" inflected="yes">alt<exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="N.*"/> </rule> </rulegroup> <!-- GerAdj_Nom: a word tagged both as gerund (V.G.*) and as adjective, not preceded by SPS00 and followed by a noun, keeps only its verb readings. --> <rule id="GerAdj_Nom" name="gerundi/adjectiu + nom"> <pattern> <marker> <and> <token postag="V.G.*" postag_regexp="yes"><exception>corrent</exception><exception scope="previous" postag="SPS00"/></token> <token postag="A.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> </and> </marker> <token postag="N.*" postag_regexp="yes"><exception postag="V.[SI].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="V.*"/> </rule> <!-- ser_fan: "fan" right after a form of "ser" keeps only its NCCS000 reading. --> <rule id="ser_fan" name="ser fan"> <pattern> <token inflected="yes">ser</token> <marker> <token postag="NCCS000">fan</token> </marker> </pattern> <disambig action="filter" postag="NCCS000"/> </rule> <rule id="nNom1" name="no Nom"> <!-- repeated after DetNom because of "pel vers de tradició" --> <antipattern> <token>personal</token> <token regexp="yes">de|d'</token> </antipattern> <pattern> <marker> <and> <token postag="N.*" postag_regexp="yes" 
regexp="yes">pinte|jo|fan|demà|ahir|avui|hui|totals?|vius?|veus?|saps?|sola|soles|vessant|sec|personal|vers|creu|cau|fou|crec|davant|darrere|damunt|davall|sota|ve|tornés|seré|estic|som|sou|amples?|creix|fem|res|si|bé|perquè|però|dins|sobre|real|era|eres|dius?<exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="N.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <!-- EncadenaAdj: chains adjectives onto an existing noun group. The first four rules add the _GN_xx tag of the preceding token to an immediately following adjective or participle whose tag fits the same gender/number pattern and that does not carry that tag yet. --> <rulegroup id="EncadenaAdj" name="encadena adjectius"> <!-- after _GN_MS (the word form "fer" is excluded) --> <rule> <pattern> <token postag="_GN_MS"/> <marker> <token postag="A..[MC][SN0].*|V.P..SM.?" postag_regexp="yes"><exception postag="_GN_MS"/><exception>fer</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> </disambig> </rule> <!-- after _GN_FS --> <rule> <pattern> <token postag="_GN_FS"/> <marker> <token postag="A..[FC][SN0].*|V.P..SF.?" postag_regexp="yes"><exception postag="_GN_FS"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> </disambig> </rule> <!-- after _GN_MP --> <rule> <pattern> <token postag="_GN_MP"/> <marker> <token postag="A..[MC][PN0].*|V.P..PM.?" postag_regexp="yes"><exception postag="_GN_MP"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> </disambig> </rule> <!-- after _GN_FP --> <rule> <pattern> <token postag="_GN_FP"/> <marker> <token postag="A..[FC][PN0].*|V.P..PF.?" postag_regexp="yes"><exception postag="_GN_FP"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> </disambig> </rule> <!-- Coordinated variant: the previous word is an adjective already inside the noun group (first character lowercase, more than one character), then one of i, o, ni, comma, però, sinó, then the adjective or participle to be tagged. --> <rule> <pattern> <and> <token postag="_GN_MS" regexp="yes">\p{Ll}.+</token> <token postag="A.*" postag_regexp="yes"/> </and> <token regexp="yes">i|o|ni|,|però|sinó</token> <marker> <token postag="A..[MC][SN0].*|V.P..SM.?" 
postag_regexp="yes"><exception postag="_GN_MS"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <and> <token postag="_GN_FS" regexp="yes">\p{Ll}.+</token> <token postag="A.*" postag_regexp="yes"/> </and> <token regexp="yes">i|o|ni|,|però|sinó</token> <marker> <token postag="A..[FC][SN0].*|V.P..SF.?" postag_regexp="yes"><exception postag="_GN_FS"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <pattern> <and> <token postag="_GN_MP" regexp="yes">\p{Ll}.+</token> <token postag="A.*" postag_regexp="yes"/> </and> <token regexp="yes">i|o|ni|,|però|sinó</token> <marker> <token postag="A..[MC][PN0].*|V.P..PM.?" postag_regexp="yes"><exception postag="_GN_MP"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> </disambig> </rule> <rule> <pattern> <and> <token postag="_GN_FP" regexp="yes">\p{Ll}.+</token> <token postag="A.*" postag_regexp="yes"/> </and> <token regexp="yes">i|o|ni|,|però|sinó</token> <marker> <token postag="A..[FC][PN0].*|V.P..PF.?" postag_regexp="yes"><exception postag="_GN_FP"/></token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> </disambig> </rule> <!-- Cas particular: no aplicar la regla COMPLEXES --> <rule> <pattern> <token postag="AQ0[FC][PN]0|VMP00PF.?" postag_regexp="yes"><exception postag="_GN_MP|NCMP.*" postag_regexp="yes"/></token> <token regexp="yes" skip="1">i|o|ni|,|però|sinó</token> <marker> <token>complexes</token> </marker> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> </disambig> </rule> <rule> <pattern> <marker> <token>complexes</token> </marker> <token regexp="yes" skip="1">i|o|ni|,|però|sinó</token> <token postag="AQ0[FC][PN]0|VMP00PF.?" 
postag_regexp="yes"><exception postag="_GN_MP|NCMP.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> </disambig> </rule> <!-- adjectius --> <!-- Encadena numerals --> <rule> <pattern> <marker> <token postag="DN.[FC][PN]." postag_regexp="yes"/> </marker> <token regexp="yes">i|ni|o|,</token> <and> <token postag="DN.[FC][PN]." postag_regexp="yes"/> <token postag="_GN_FP"/> </and> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="DN.[MC][PN]." postag_regexp="yes"/> </marker> <token regexp="yes">i|ni|o|,</token> <and> <token postag="DN.[MC][PN]." postag_regexp="yes"/> <token postag="_GN_MP"/> </and> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> </disambig> </rule> </rulegroup> <rulegroup id="filtra_noms_masculins_femenins" name="filtra noms masculins i femenins"> <rule> <pattern> <and> <token postag="NCMS000|NCCS000|AQ0CS0" postag_regexp="yes"/> <token postag="_GN_MS"/> <token postag="NCFS000"><exception postag="_GN_FS"/></token> </and> </pattern> <disambig action="remove"> <wd pos="NCFS000"/> </disambig> </rule> <rule> <pattern> <and> <token postag="NCFS000|NCCS000|AQ0CS0" postag_regexp="yes"/> <token postag="_GN_FS"/> <token postag="NCMS000"><exception postag="_GN_MS"/></token> </and> </pattern> <disambig action="remove"> <wd pos="NCMS000"/> </disambig> </rule> <rule> <pattern> <and> <token postag="NCMP000|NCCP000|PX3MP0C0" postag_regexp="yes"/> <token postag="_GN_MP"/> <token postag="NCFP000"><exception postag="_GN_FP"/></token> </and> </pattern> <disambig action="remove"> <wd pos="NCFP000"/> </disambig> </rule> <rule> <pattern> <and> <token postag="NCFP000|NCCP000" postag_regexp="yes"/> <token postag="_GN_FP"/> <token postag="NCMP000"><exception postag="_GN_MP"/></token> </and> </pattern> <disambig action="remove"> <wd pos="NCMP000"/> </disambig> </rule> <rule> <pattern> <and> <token postag="NCFP000|NCCP000" postag_regexp="yes"/> <token postag="_GN_FP"/> 
<token postag="NCMS000"><exception postag="_GN_MS"/></token> </and> </pattern> <disambig action="remove"> <wd pos="NCMS000"/> </disambig> </rule> <!-- A token with a masculine or common singular noun reading that was tagged _GN_MS loses a competing NCFP000 reading, unless it was also tagged _GN_FP. --> <rule> <pattern> <and> <token postag="NCMS000|NCCS000" postag_regexp="yes"/> <token postag="_GN_MS"/> <token postag="NCFP000"><exception postag="_GN_FP"/></token> </and> </pattern> <disambig action="remove"> <wd pos="NCFP000"/> </disambig> </rule> </rulegroup> <!-- pols: once the word form "pols" has received a noun-group tag, keep only the readings whose tag contains the same gender/number letters (the _GN_ tag itself also matches the filter). NOTE(review): there is no rule for _GN_MP here; confirm that this is intentional. --> <rulegroup id="pols" name="pols"> <rule> <pattern> <token postag="_GN_MS">pols</token> </pattern> <disambig action="filter" postag=".*MS.*"/> </rule> <rule> <pattern> <token postag="_GN_FS">pols</token> </pattern> <disambig action="filter" postag=".*FS.*"/> </rule> <rule> <pattern> <token postag="_GN_FP">pols</token> </pattern> <disambig action="filter" postag=".*FP.*"/> </rule> </rulegroup> <!-- nou_adj: "nou" with an AQ.* reading and the _GN_MS tag, followed by a masculine/common noun, keeps only its AQ.* and _GN_MS readings. --> <rule id="nou_adj" name="nou adjectiu"> <pattern> <marker> <and> <token postag="AQ.*" postag_regexp="yes">nou</token> <token postag="_GN_MS" postag_regexp="yes"/> </and> </marker> <token postag="N.[MC][SN].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="AQ.*|_GN_MS"/> </rule> <!-- <rule id="NomParticipiParticipi" name="nom + participi + participi, que no han concordat"> <pattern> <token postag="NC.*" postag_regexp="yes"></token> <marker> <and> <token postag="N.*" postag_regexp="yes"><exception postag="_GN.*|SPS00" postag_regexp="yes" /></token> <token postag="V.P.*|AQ.*" postag_regexp="yes"><exception postag="V.[MIS].*|RG.*" postag_regexp="yes"/></token> </and> </marker> <token postag="V.P.*|AQ.*" postag_regexp="yes"><exception postag="V.[MIS].*" postag_regexp="yes" /></token> </pattern> <disambig action="filter" postag="V.P.*|AQ.*"></disambig> </rule> --> <!-- VERB_PREPOSICIO: a token with an SPS00 reading that directly follows a verb or a _GV_ token is narrowed to the readings listed in the filter below. --> <rule id="VERB_PREPOSICIO" name="verb + preposició"> <!-- moved because of "haver acabat"; exception: per tal d'aconseguir els seus fins; per a aconseguir fins dignes d'aconseguir-se--> <!-- moved because of "aconseguir fins dignes";--> <pattern> <token postag="V.[SING].*|_GV_" postag_regexp="yes"><exception 
postag="N.*|_GN_.*|RG.*" postag_regexp="yes"/></token> <marker> <token postag="SPS00"><exception postag="_GN_.*|PI.*|DI.*" postag_regexp="yes"/></token> </marker> <token><exception postag="V.[MSI].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="SP.*|RG.*|CS|_obligacio"/> </rule> <rule id="PARTICIPI_PREPOSICIO" name="verb compost (participi) + preposició"> <pattern> <and> <token postag="V.P.*" postag_regexp="yes"><exception postag="N.*|_GN_.*" postag_regexp="yes"/></token> <token postag="_GV_"/> </and> <marker> <token postag="SPS00"><exception postag="_GN_.*|PI.*|DI.*" postag_regexp="yes"/></token> </marker> <token><exception postag="V.[MSI].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="SP.*|RG.*"/> </rule> <rule id="sota" name="sota preposició"> <pattern> <marker> <and> <token postag="RG"><exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="SPS00"/> </and> </marker> <token postag="D.*" postag_regexp="yes"><exception inflected="yes">es</exception></token> <token postag="[AN].*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="S.*"/> </rule> <rule id="PREP_VERBbis" name="no Verb conjugat darrere de preposició"> <!-- "de sumes": "sumes" no és verb. Mogut per "En forma part". Mogut amunt per "d'escriptura comú" --> <pattern> <token postag="SP.*|.*LOC_PREP.*" postag_regexp="yes"><exception postag="PP.*|P0.*" postag_regexp="yes"/></token> <marker> <and> <token postag="N.*|RG|V.[NGP].*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[MSI].*"/> </rule> <rule id="PREP_ART_VERBbis" name="no Verb conjugat darrere de preposició i article"> <!-- "a l'esquerra": "esquerra" no és verb . 
Mogut per "De les dites baronies"--> <pattern> <token postag="SP.*" postag_regexp="yes"><exception postag="RG"/></token> <token postag="DA.*" postag_regexp="yes"><exception inflected="yes">es</exception></token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.[^NGP].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rulegroup id="prep_participinom" name="prep + participi_nom"> <rule> <!-- punt de vista, condemnat a mort --> <antipattern> <token>a</token> <token>perdut</token> </antipattern> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"/> <marker> <and> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="V.P.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="NC.*|_GN_.*"/> </rule> <rule> <!-- en realitat funciona com a adjectiu --> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> <marker> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="V.P.*" postag_regexp="yes"/> <token postag="_GN_.*" postag_regexp="yes"/> </and> </marker> <token><exception postag="N.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="NC.*|_GN_.*"/> </rule> </rulegroup> <!-- "en contacte" és verb o nom? 
--> <!-- EN_VerbNom: after "en" (not preceded by que/què), a word that is both noun and conjugated verb keeps only its non-verb readings, except for the listed word forms. The antipattern protects "no en dona". --> <rulegroup id="EN_VerbNom" name="verb/nom darrere de preposició en"> <rule> <antipattern> <token>no</token> <token>en</token> <token>dona</token> </antipattern> <pattern> <token><exception regexp="yes">que|què</exception></token> <token>en</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.[^NGP].*" postag_regexp="yes"><exception regexp="yes">surt|parla|paga|saps|pren|passa|trama|porta|treu|trau|faig</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> </rulegroup> <!-- NoVerb: the listed word forms, when tagged as part of a noun group and not as part of a verb group, keep only non-verb readings. --> <rule id="NoVerb" name="no verb si no és en grup verbal"> <pattern> <token postag="_GN_.*" postag_regexp="yes" regexp="yes">diputats?|diputad(a|es)|negativa|negatives|brossa<exception postag="_GV_"/></token> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <!-- noVerbBalear0: after "es", a token with both a VMIP1S0B reading and a noun/adjective/interjection reading loses the VMIP1S0B reading. --> <rule id="noVerbBalear0" name="es estiu (no balear)"> <pattern> <token>es</token> <marker> <and> <token postag="VMIP1S0B"/> <token postag="[NAI].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="VMIP1S0B"/> </disambig> </rule> <!-- PP_VERB: weak pronoun directly followed by a verb. The group-level antipatterns below apply to every rule of the group. --> <rulegroup id="PP_VERB" name="pronom personal seguit de verb"> <!-- personal pronoun + verb. Moved because of "en obres properes" --> <!-- TODO: study person and number agreement!!!!!!<exception postag="D.*" postag_regexp="yes"/> --> <!-- se sent sola; s'havia fet.. how to handle: el metges, es fan... --> <!--created for "ens ensenya". Exception: en complexes perspectives--> <antipattern> <token>l'</token> <token>ho</token> </antipattern> <antipattern> <token>s'</token> <token><exception postag="V...3..." 
postag_regexp="yes"/></token> </antipattern> <antipattern> <token>es</token> <token regexp="yes">sobre|encara</token> </antipattern> <!-- NOTE(review): this antipattern uses plain LOC_PREP while other rules in this file match .*LOC_PREP.*, and it requires two consecutive DA.* tokens; confirm that both are intended. --> <antipattern> <token postag="SPS00|LOC_PREP" postag_regexp="yes"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="[NA].*|V.P.*" postag_regexp="yes"/> </antipattern> <!-- Rule 1: the pronoun (any weak pronoun except the listed ambiguous forms and forms starting with an apostrophe or hyphen) keeps only its P.* and _GV_ readings when a verb follows that is not capitalised. --> <rule> <pattern> <marker> <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">si|en|l'|el|la|els|les|['-].+</exception></token> </marker> <token postag="V.[^MNPG].*" postag_regexp="yes"><exception regexp="yes">\p{Lu}[\p{Ll}\-'·]+</exception></token> </pattern> <disambig action="filter" postag="P.*|_GV_"/> </rule> <!-- Rule 2: same context, but the verb is marked and keeps only its verb readings and the verb-related helper tags listed in the filter. --> <rule> <pattern> <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">si|en|l'|el|la|els|les|['-].+</exception></token> <marker> <token postag="V.[^MNPG].*" postag_regexp="yes"><exception regexp="yes">\p{Lu}[\p{Ll}\-'·]+|acord</exception></token> </marker> </pattern> <disambig action="filter" postag="V.[^MNPG].*|_GV_|_perfet|_obligacio|_loc_nosequi"/> </rule> <!-- Rule 3: pronoun + "ben"/"mig" + verb: the pronoun gets the _GV_ tag. --> <rule> <pattern> <marker> <token postag="&pronom_feble;" postag_regexp="yes"><exception regexp="yes">si|['-].+</exception></token> </marker> <token regexp="yes">ben|mig</token> <token postag="V.[^MNPG].*|_GV_|_perfet|_obligacio" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_GV_"/> </disambig> </rule> <!-- Rule 4: one of l', el, la, els, les, en with a pronoun reading, followed by a token with a V.[SI].* reading (except "bloc"): both tokens get the _GV_ tag. --> <rule> <pattern> <marker> <token postag="P0.*|PP.*" postag_regexp="yes" regexp="yes">l'|el|la|els|les|en</token> <token postag="V.[SI].*" postag_regexp="yes"><exception>bloc</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_GV_"/> <wd pos="_GV_"/> </disambig> </rule> </rulegroup> <!-- verbs_darrere_sino: removes conjugated-verb readings from words after "sinó" by keeping only the nominal readings listed in the filter. --> <rulegroup id="verbs_darrere_sino" name="neteja verbs darrere de 'sinó'"> <rule> <pattern> <token>sinó</token> <marker> <and> <token postag="_GN_.*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" 
postag="_GN_.*|A.*|N.*|D.*|V.P.*|PX.*"/> </rule> <rule> <pattern> <token skip="3">sinó<exception scope="next" regexp="yes">que|perquè</exception></token> <marker> <and> <token postag="_GN_.*|N.*|A.*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="_GN_.*|A.*|N.*|D.*|V.P.*|PX.*"/> </rule> <rule> <pattern> <token skip="3">sinó<exception scope="next" regexp="yes">que|perquè</exception></token> <marker> <and> <token postag="DA.*" postag_regexp="yes"/> <token postag="_GV_"/> </and> </marker> </pattern> <disambig action="filter" postag="_GN_.*|A.*|N.*|D.*|V.P.*|PX.*"/> </rule> </rulegroup> <rule id="NoVerb2" name="no verb si no és en grup verbal"> <pattern> <and> <token postag="V.[^P].*" postag_regexp="yes" regexp="yes">senzilles|senzilla|disperses|diputats?|diputad(a|es)|negativa|negatives|terminis?|brossa|ultra|rica|estesa|esteses<exception postag="_GV_"/></token> <token postag="[^V].*|V.P.*" postag_regexp="yes"/> </and> </pattern> <disambig action="filter" postag="[^V].*|V.P.*"/> </rule> <!-- <rule id="NoVerb3" name="no verb, enumeració"> la forma i la textura <pattern> <token postag="DA.*" postag_regexp="yes"/> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.[SI].*" postag_regexp="yes"/> </and> </marker> <token postag="CC|_PUNCT_CONT" postag_regexp="yes"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="V.[SIM].*"></disambig> </rule>--> <rulegroup id="Verb_adverbi" name="Verb i adverbi: encara sóc, sóc encara"> <rule> <!-- ATENCIÓ: quan el verb és també substantiu, poden haver-hi problemes: encara es "troba". Les excepcions no són fiables Ens encara i ens destrueix. Ell encara ho creu. 
--> <pattern> <marker> <and> <token postag="V.*" postag_regexp="yes" skip="4"><exception postag="_GV_"/><exception scope="next" postag="DA.*|R.*|.*LOC_ADV.*|PP.*|P0.*|SENT_END|V.*|_GV_" postag_regexp="yes" negate_pos="yes"/></token> <token postag="RG"/> </and> </marker> <token postag="V.[MSI].*|_GV_" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule> <pattern> <token postag="V.*" postag_regexp="yes" skip="3"><exception scope="next" postag="R.*|.*LOC_ADV.*|P0.*|PP.*|SENT_END|V.*|_GV_" postag_regexp="yes" negate_pos="yes"/></token> <marker> <and> <token postag="V.*" postag_regexp="yes"><exception postag="_GV_"/><exception>acabat</exception></token> <!-- excep: S'havien acabat--> <token postag="RG"/> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule> <pattern> <marker> <token>encara</token> </marker> <token regexp="yes">que|bo|gràcies|sort</token> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> </rulegroup> <rulegroup id="infinitiu_o_nom" name="infinitiu o nom"> <rule> <!-- excepcions a la regla següent --> <pattern> <token>tot</token> <token regexp="yes">el|l'</token> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="NCMS.*" postag_regexp="yes"><exception regexp="yes">\p{Lu}.+</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <token regexp="yes">l|el|l'</token> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="NCMS.*" postag_regexp="yes"/> </and> </marker> <token regexp="yes">que|on</token> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <token regexp="yes">l|el|l'</token> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="NCMS.*" postag_regexp="yes"/> </and> </marker> <token postag="A.0[MC][SN].|VMP00SM.?" 
postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <token regexp="yes">l|el|l'</token> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="NCMS.*" postag_regexp="yes"/> </and> </marker> <token postag="RG_anteposat"/> <token postag="A.0[MC][SN].|VMP00SM.?" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <marker> <and> <token postag="V.N.*" postag_regexp="yes" skip="4"><exception scope="next" postag="R.*|.*LOC_ADV.*|PP.*|P0.*|SENT_END|V.*|_GV_" postag_regexp="yes" negate_pos="yes"/></token> <token postag="N.*" postag_regexp="yes"/> </and> </marker> <token postag="V.[SI].*|_GV_" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <token postag="V.[NGSI].*|_GV_" postag_regexp="yes" skip="3"><exception scope="next" postag="SPS00|R.*|.*LOC_ADV.*|PP.*|P0.*|SENT_END|DA.*|_GN_MS|_GV_" postag_regexp="yes" negate_pos="yes"/></token> <token regexp="yes">l|el|l'</token> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <token postag="SPS00"/> <token regexp="yes">l|el|l'</token> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"/> </and> </marker> <token postag="SPS00"/> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <token regexp="yes">més|menys<exception scope="previous" inflected="yes">valer</exception></token> <marker> <and> <token postag="V.N.*" postag_regexp="yes"><exception>ser</exception></token> <token postag="N.*" postag_regexp="yes"/> </and> </marker> 
</pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <marker> <and> <token postag="_GN_.*" postag_regexp="yes">deure</token> <token postag="N.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <!-- excepcions a la regla següent --> <pattern> <marker> <token postag="N.*" postag_regexp="yes">deure</token> </marker> <token inflected="yes">de</token> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <pattern> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="NCMS.*" postag_regexp="yes"><exception regexp="yes">\p{Lu}.+|ésser|militar|titular|boiar|metre</exception></token> </and> </marker> <token postag="SPS00"/> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <antipattern> <token>de</token> <token>l</token> <token>saber</token> </antipattern> <pattern> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="NCMS.*" postag_regexp="yes"><exception regexp="yes">\p{Lu}.+|ésser|militar|boiar|metre</exception></token> </and> </marker> <token><exception postag="_PUNCT.*|CC|AQ0[MC][SN]0|V.P.*SM.|_GV_|&pronom_feble;" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> <rule> <pattern> <marker> <and> <token postag="V.N.*" postag_regexp="yes"/> <token postag="NCMS.*" postag_regexp="yes"/> </and> </marker> <token postag="PP3..A00" postag_regexp="yes"/> <token><exception postag="V.[SI].*|_GV_|&pronom_feble;" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="V.N.*"/> </rule> </rulegroup> <rule id="els_passa_igual" name="els passa igual"> <!-- excep: la roba encara no està seca; la taca més negra; narracions en vers sota els arbres --> <pattern> <token postag="_GV_"><exception postag="_GN_.*" postag_regexp="yes"/></token> <marker> <token postag="_GV_"/> </marker> <token postag="RG.*|.*LOC_ADV.*" 
postag_regexp="yes"><exception regexp="yes">no|encara|que|més</exception></token> </pattern> <disambig action="filter" postag="V.*|_GV_|_perfet"/> </rule> <!-- encara: "encara" with both an RG reading and a verb reading, not tagged _GV_, keeps only its RG.* readings. --> <rule id="encara" name="encara"> <pattern> <and> <token postag="RG">encara</token> <token postag="V.*" postag_regexp="yes"><exception postag="_GV_" postag_regexp="yes"/></token> </and> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <!-- siVerbBalear: a token that has a VMIP1S0B reading, a noun or adjective reading and the _GV_ tag, and that follows another _GV_ token (other than the word form "en"), keeps only its verb and _GV_ readings. --> <rule id="siVerbBalear" name="sí verb balear"> <!-- el calç--> <pattern> <token postag="_GV_"><exception>en</exception></token> <marker> <and> <token postag="VMIP1S0B"/> <token postag="N.*|A.*" postag_regexp="yes"><exception postag="_GN_.*|RG" postag_regexp="yes"/><exception>senyal</exception></token> <token postag="_GV_" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="V.*|_GV_"/> <example type="untouched">Va pensar que en cas que vingués ho faria.</example> </rule> <!--<exception regexp="yes">.+[oe]|faig|estic|dic|fenc|incloc|moc|predic|ric|sec|solc|coc|contradic|crec|duc|escórrec|hac|jac</exception>--> <rulegroup id="noVerbBalear" name="no verb balear"> <!-- Not a Balearic verb form unless something earlier has indicated it --> <!-- "van": when the token also has a reading other than VMIP1S0B, the readings with lemma "vanar" are removed. --> <rule> <pattern> <marker> <and> <token postag="VMIP1S0B">van</token> <token postag="VMIP1S0B" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="remove"> <wd lemma="vanar"/> </disambig> </rule> <!-- VMIP1S0B is removed from any token that also has a noun, adjective or interjection reading. --> <rule> <pattern> <marker> <and> <token postag="VMIP1S0B"/> <token postag="[NAI].*" postag_regexp="yes"/> <!--<token postag="V...[^1].*" postag_regexp="yes" negate_pos="yes"></token>--> </and> </marker> </pattern> <disambig action="remove"> <wd pos="VMIP1S0B"/> </disambig> </rule> <!-- VMIP1S0B is removed from any token that also has an RG reading. --> <rule> <pattern> <marker> <and> <token postag="VMIP1S0B"/> <token postag="RG"/> </and> </marker> </pattern> <disambig action="remove"> <wd pos="VMIP1S0B"/> </disambig> </rule> <!-- "al" directly followed, without spaces, by a hyphen and another token. --> <rule> <pattern> <marker> <token postag="VMIP1S0B">al</token> </marker> <token spacebefore="no">-</token> <token spacebefore="no"/> </pattern> <disambig 
action="remove"> <wd pos="VMIP1S0B"/> </disambig> </rule> </rulegroup> <rulegroup id="no_GV" name="neteja GV"> <rule> <pattern> <token postag="_GV_"><exception postag="P[P0].*|V.*" postag_regexp="yes"/><exception regexp="yes">acord|banda|part|llum|dubte|qüestió|pràctica|valor|marxa|escena|servei|servici|contacte|baixa|falta|terme|origen|camí|corrent|relleu|compte|consulta|alta|funcionament</exception></token> </pattern> <disambig action="remove"> <wd pos="_GV_"/> </disambig> </rule> <rule> <pattern> <token><exception postag="_GV_"/></token> <marker> <and> <token postag="DA.*" postag_regexp="yes"/> <token postag="_GV_"/> </and> </marker> <token><exception postag="_GV_"/></token> </pattern> <disambig action="filter" postag="D.*|_GN_.*"/> </rule> </rulegroup> <rule id="verb_verbadj" name="verb + verb/adj"> <antipattern> <token>fora</token> <token postag="V.[ISM].*" postag_regexp="yes"/> </antipattern> <pattern> <token postag="V.[MSI].*|_GV_" postag_regexp="yes"><exception postag="PP.*|P0.*|N.*" postag_regexp="yes"/><exception inflected="yes">haver</exception></token> <marker> <and> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="V.[SI].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> </pattern> <disambig action="remove" postag="V.[SIM].*"/> </rule> <rule id="verbadj_verb" name="verb/adj + verb"> <pattern> <marker> <and> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/><exception scope="previous">que</exception></token> <token postag="V.[SI].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> <token postag="V.[MSI].*|_GV_" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> <!-- <token postag="V.[MSI].*|PP.*|P0.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/><exception regexp="yes">jo|mi|tu|ella?|nosaltres|vosaltres|elle?s|vost[èé]s?|vós</exception></token> --> 
</pattern> <disambig action="filter" postag="A.*|V.P.*"/> </rule> <!-- <rule id="tant_nom_com_nom" name="desambigua tant+nom+com+nom"> tant grecs com romans. És excep. de la regla següent <pattern> <token>tant</token> <token postag="NC.*" postag_regexp="yes"/> <token>com</token> <marker> <token postag="NC.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="filter" postag="[^V].*"></disambig> </rule> --> <rulegroup id="NomnoVerb_en_enumeracions" name="paraules que no són verb en enumeracions"> <rule> <pattern> <token postag="NC.*|_GN_.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> <token regexp="yes">i|o|ni|,</token> <marker> <and> <token postag="NC.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> <token postag="V.[MSIG].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> <token><exception postag="D.*|SPS.*|RG.*|AQ.*|V.P.*|NC.*" postag_regexp="yes"/></token> </pattern> <disambig action="remove" postag="V.[MSIG].*"/> </rule> <rule> <antipattern> <token regexp="yes">què|que</token> <token postag="V.[MSIG].*" postag_regexp="yes"/> </antipattern> <pattern> <marker> <and> <token postag="NC.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> <token postag="V.[MSIG].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> <token regexp="yes">i|o|ni|,</token> <token postag="NC.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> <!-- <token><exception postag="D.*|SPS.*|RG.*|AQ.*|V.P.*|NC.*" postag_regexp="yes"/></token> --> </pattern> <disambig action="remove" postag="V.[MSIG].*"/> </rule> <rule> <pattern> <marker> <and> <token postag="NC.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> <token postag="_GN_.*" postag_regexp="yes"/> <token postag="V.[MSIG].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> <token regexp="yes">i|o|ni|,</token> <token postag="_GN_.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> <!-- <token><exception postag="D.*|SPS.*|RG.*|AQ.*|V.P.*|NC.*" 
postag_regexp="yes"/></token> --> </pattern> <disambig action="remove" postag="V.[MSIG].*"/> </rule> </rulegroup> <rulegroup id="AdjnoVerb_en_enumeracions" name="paraules que no són verb en enumeracions"> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="A.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> <token regexp="yes">i|o|ni|,</token> <marker> <and> <token postag="A.*" postag_regexp="yes"/> <token postag="V.[MSIG].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> </unify> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <and> <token postag="A.*" postag_regexp="yes"/> <token postag="V.[MSIG].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> <token regexp="yes">i|o|ni|,</token> <token postag="A.*" postag_regexp="yes" regexp="yes">\p{Ll}.+</token> </unify> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> </rulegroup> <rulegroup id="verb_adjectiu" name="verb + adjectiu"> <!-- El riu passa engorjat. Viatges sola. Ronda amagat. --> <rule> <pattern> <token><exception postag="D[^R]..S." postag_regexp="yes"/></token> <marker> <and> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/><exception regexp="yes">\p{Lu}.*</exception></token> <token postag="VM[IS]..S.." postag_regexp="yes"/> </and> </marker> <token postag="A...S.|V.P..S.." postag_regexp="yes"/> </pattern> <disambig action="remove" postag="NC.*"/> <example type="untouched">Allí brolla una deu càrstica.</example> </rule> <rule> <!-- hi ha cap cas? --> <pattern> <token><exception postag="D[^R]..P." postag_regexp="yes"/></token> <marker> <and> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="VM[IS]..P.." postag_regexp="yes"/> </and> </marker> <token postag="A...P.|V.P..P.." 
postag_regexp="yes"/> </pattern> <disambig action="remove" postag="NC.*"/> </rule> </rulegroup> <rule id="tant_x_com_y" name="tant x com y: no verb. Ex: tant grecs com romans"> <pattern> <token>tant</token> <token postag="A.*|NC.*" postag_regexp="yes"/> <token>com</token> <marker> <and> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> <token postag="V.[MSIG].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> </pattern> <disambig action="filter" postag="A.*|N.*|V.P.*"/> </rule> <rule id="tant_no_det" name="tant: no determinant"> <pattern> <token postag="V.*" postag_regexp="yes"/> <marker> <token regexp="yes">tant|molt</token> </marker> <token postag="NP.*|V.N.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="D.*"/> </rule> <rulegroup id="mig_x_mig_y" name="mig x mig y. Ex: mig figa mig raïm"> <rule> <pattern> <marker> <token>mig</token> </marker> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> <token regexp="yes">,|ni|i|o</token> <token>mig</token> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_allow_mig"/> </disambig> </rule> <rule> <pattern> <token>mig</token> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> <token regexp="yes">,|ni|i|o</token> <marker> <token>mig</token> </marker> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_allow_mig"/> </disambig> </rule> <rule> <pattern> <marker> <token>mig</token> </marker> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> <token>mig</token> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_allow_mig"/> </disambig> </rule> <rule> <pattern> <token>mig</token> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> <marker> <token>mig</token> </marker> <token postag="A.*|NC.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_allow_mig"/> </disambig> </rule> </rulegroup> <rule id="VerbNom_noNom" 
name="paraules que no són verb sense pronom (verb reflexiu)"> <pattern> <marker> <and> <token postag="NC.*|AQ.*" postag_regexp="yes" regexp="yes">tinya|tinyes|esperit|salina|salines|persona|persones|olives|oliva|amiga|amigues|boira|boires|digna|dignes?</token> <token postag="V.[MSI].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="VerbNomAdj" name="verb i adjectiu i nom: verb"> <pattern> <token postag="R.*|.*LOC_ADV.*" postag_regexp="yes" negate_pos="yes"><exception regexp="yes">["“«'‘-]</exception></token> <marker> <and> <token postag="A.*|V.P.*" postag_regexp="yes"><exception postag="_GN_.*|RG.*" postag_regexp="yes"/><exception regexp="yes">\p{Lu}.*</exception><exception regexp="yes">[\p{Ll}·]+(e|[aei]sses|[ae]res|era)|oferta|ofertes</exception></token> <token postag="V.[SI].*" postag_regexp="yes"><exception postag="_GV_"/><exception regexp="yes">revés|empesa|viu|desperta|nous|buida|buides|composta|compostes</exception></token> <token postag="N.*" postag_regexp="yes"><exception postag="DN.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="V.[^P].*"/> <example type="untouched">Una peça per a piano sol composta per Chopin.</example> </rule> <rule id="VerbNomAdj_valencians1" name="verb (valencià) i nom que no ha concordat"> <pattern> <token>que</token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="A.*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes" regexp="yes">.+e|.+[aei]sses|.+[ae]res|.+era<exception postag="_GV_"/></token> </and> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="VerbNomAdj_valencians2" name="verb (valencià) i nom que no ha concordat"> <!-- després de totes les comprovacions, donem prioritat al nom o a l'adjectiu sobre la forma verbal valenciana --> <pattern> <token postag="N.*|A.*" postag_regexp="yes" negate_pos="yes"><exception 
postag="N.*|A.*" postag_regexp="yes"/></token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="A.*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes" regexp="yes">.+e|.+[aei]sses|.+[ae]res|.+era<exception postag="_GV_"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <!-- <rule id="VerbNom_valencia" name="verb subjuntiu (valencià) i nom que no ha concordat: tema"> després de totes les comprovacions, donem prioritat al nom o a l'adjectiu sobre la forma verbal valenciana <pattern> <token postag="N.*|A.*" postag_regexp="yes" negate_pos="yes"><exception postag="N.*|A.*" postag_regexp="yes"/></token> <marker> <and> <token postag="N.*" postag_regexp="yes"></token> <token postag="A.*" postag_regexp="yes"></token> <token postag="V.S.*" postag_regexp="yes" regexp="yes">.+a<exception postag="_GV_" /></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"></disambig> </rule> --> <rule id="VerbAdverbi" name="verb (sense pronoms) i adverbi"> <pattern> <token><exception postag="RN"/></token> <marker> <and> <token postag="RG"/> <token postag="V.[MSI].*" postag_regexp="yes" regexp="yes">gratis<exception postag="_GV_"/></token> <!--<exception regexp="yes">rebé|encara</exception>--> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="enlaire" name="punys/mans/braços enlaire"> <pattern> <token postag="NC.*|RG|_GN_.*|UNKNOWN|SPS.*" postag_regexp="yes"/> <!-- mà|braç|cama|cap|puny|peu|ventre|panxa|terra|pols|pedra|més --> <marker> <token postag="RG">enlaire</token> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="darreres" name="darreres (adj. 
no nom)"> <pattern> <token postag="_GN_FP">darreres</token> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule id="en_ma" name="en mà"> <pattern> <marker> <token postag="NC.*" postag_regexp="yes"/> </marker> <token>en</token> <token>mà</token> </pattern> <disambig action="add"> <wd pos="_loc_enma"/> </disambig> </rule> <rule id="verbnom_andana" name="verb/nom -> nom: andana"> <pattern> <marker> <and> <token postag="VM[ISM].*" postag_regexp="yes" regexp="yes">andan(a|es)</token> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="NC.*|_GN_.."/> </rule> <rule id="dosi" name="dosi (nom no verb)"> <pattern> <!--<token postag="D.*|A.*" postag_regexp="yes"/>--> <marker> <token postag="N.*" postag_regexp="yes" regexp="yes">dosi|dosis</token> </marker> </pattern> <disambig action="remove" postag="V.[MS].*"/> </rule> <rule id="VerbNom" name="verb i nom que no ha concordat"> <!-- Això fou estrany --> <antipattern> <token postag="V.[MSI].*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes"/> </antipattern> <antipattern> <token inflected="yes">ser</token> <token>tot</token> <token postag="NC.*" postag_regexp="yes"/> </antipattern> <pattern> <token><exception postag="V.[MSING].*|_GV_|R[GN]|.*LOC_ADV.*|C.*|_PUNCT.*|SENT_START" postag_regexp="yes"/><exception regexp="yes">["“«'‘(]|\d+</exception><exception inflected="yes" regexp="yes">mot|paraula|terme|expressió|vocable|nom|tipus</exception></token> <marker> <and> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/><exception regexp="yes">força|coma|cap|noms?|nous?|deu|viu|cometa</exception></token> <token postag="V.[MSI].*" postag_regexp="yes"><exception postag="_GV_|_loc_enma" postag_regexp="yes"/><exception regexp="yes">\p{Lu}.*</exception><exception regexp="yes">[\p{Ll}·]+(e|es|[aei]sses|[ae]res|era)|seus?</exception></token> <!-- problema: els 
noms acabats en -e no tenen comprovació de concordança!! --> </and> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="VerbNom_valencians1" name="verb (valencià) i nom que no ha concordat"> <pattern> <token>que</token> <marker> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes" regexp="yes">.+e|.+[aei]sses|.+[ae]res|.+era<exception postag="_GN_.*" postag_regexp="yes"/><exception regexp="yes">\p{Lu}.*</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="V.*|_GV_"/> </rule> <rule id="VerbNom_valencians2" name="verb (valencià) i nom que no ha concordat"> <!-- després de totes les comprovacions, donem prioritat al nom sobre la forma verbal valenciana --> <pattern> <token postag="N.*" postag_regexp="yes" negate_pos="yes"><exception postag="N.*|CS" postag_regexp="yes"/></token> <!-- quan impacte --> <marker> <and> <token postag="NC.*" postag_regexp="yes"/> <token postag="VMIP1S0V" postag_regexp="yes" regexp="yes">.+e|.+[aei]sses|.+[ae]res|.+era<exception postag="_GV_"/><exception>pinte</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rulegroup id="baixa" name="baixa (adj o verb)"> <rule> <pattern> <token postag="SENT_START|_PUNCT|CC" postag_regexp="yes"/> <marker> <token postag="V.*" postag_regexp="yes">baixa<exception postag="_GN_FS"/></token> </marker> </pattern> <disambig action="remove" postag="A.*"/> </rule> <rule> <pattern> <token>ja</token> <marker> <token postag="V.*" postag_regexp="yes">baixa<exception postag="_GN_FS"/></token> </marker> </pattern> <disambig action="remove" postag="A.*"/> </rule> </rulegroup> <rulegroup id="viu" name="viu (adj o verb)"> <rule> <pattern> <token postag="_GN_FS|NC[FC][SN].*" postag_regexp="yes"/> <marker> <token postag="V.*" postag_regexp="yes">viu<exception postag="_GN_MS"/></token> </marker> <token postag="A..[FC][SN].|V.P..SF." 
postag_regexp="yes"/> </pattern> <disambig action="remove" postag="A.*"/> </rule> </rulegroup> <rule id="dura" name="dura"> <pattern> <token>encara</token> <marker> <token>dura</token> </marker> </pattern> <disambig action="remove" postag="[AN].*"/> </rule> <rule id="VerbAdjectiu" name="verb i adjectiu que no ha concordat"> <!-- fer exàmens. Excep: tan regular (adj) --> <antipattern> <token postag="V.[SI].*|_GV_" postag_regexp="yes"/> <token min="0" max="4" postag="RG|LOC_ADV" postag_regexp="yes"/> <token postag="V.*" postag_regexp="yes"><exception postag="_GV_|VMIP1S0.?|V.G.*" postag_regexp="yes"/><exception regexp="yes">viu|nous?|massissa|senzilla</exception></token> </antipattern> <antipattern> <!-- una base de dades completa --> <token postag="NCFS000"/> <token inflected="yes">de</token> <token/> <token>completa</token> </antipattern> <pattern> <token><exception postag="RG_anteposat|.*LOC_ADV.*|_GV_|SPS00|CC|UNKNOWN|V.[SI].*|_PUNCT.*|RN" postag_regexp="yes"/><exception postag="P.*" postag_regexp="yes" regexp="yes">['-].+</exception><exception inflected="yes" regexp="yes">ser|estar|semblar|parèixer|considerar</exception></token> <marker> <and> <token postag="A.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/><exception regexp="yes">\p{Lu}+[\p{Ll}·]*</exception><exception regexp="yes">[\p{Ll}·]+(e|[aei]sses|[ae]res|era|às)</exception></token> <token postag="V.*" postag_regexp="yes"><exception postag="_GV_|VMIP1S0.?|V.[GP].*" postag_regexp="yes"/><exception regexp="yes">viu|nous?|massissa|senzilla</exception></token> <!-- |baixa|baixes ?? 
--> </and> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="VerbAdjectiu2" name="verb i adjectiu que no ha concordat després de puntuació"> <pattern> <token postag="_PUNCT.*" postag_regexp="yes"/> <marker> <and> <token postag="A.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/><exception regexp="yes">\p{Lu}+[\p{Ll}·]*</exception><exception regexp="yes">[\p{Ll}·]+(e|[aei]sses|[ae]res|era|às)</exception></token> <token postag="V.*" postag_regexp="yes"><exception postag="_GV_|VMIP1S0.?|V.G.*" postag_regexp="yes"/><exception regexp="yes">viu|nous?|massissa|senzilla</exception></token> </and> </marker> <token postag="N.*|V.G.*|RG|_GN_.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="VerbAdjectiu_tens" name="verb i adjectiu que no ha concordat: tens (verb habitual)"> <!-- si tens coneguts. Excep: tan regular (adj) --> <pattern> <token><exception postag="RG_anteposat|.*LOC_ADV.*|_GV_|SPS00" postag_regexp="yes"/><exception regexp="yes">["«'‘]</exception></token> <marker> <and> <token postag="A.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="V.*" postag_regexp="yes">tens</token> </and> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="VerbAjectiu_valencians1" name="verb (valencià) i adjectiu que no ha concordat"> <pattern> <token>que</token> <marker> <and> <token postag="A.*" postag_regexp="yes"/> <token postag="V.[MSI].*" postag_regexp="yes" regexp="yes">.+e|.+[aei]sses|.+[ae]res|.+era|.+às<exception postag="_GV_"/></token> </and> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="VerbAdj_valencians2" name="verb (valencià) i adjectiu que no ha concordat"> <!-- després de totes les comprovacions, donem prioritat al nom sobre la forma verbal valenciana --> <pattern> <token><exception postag="N.*|A.*" postag_regexp="yes"/></token> <marker> <and> <token postag="A.*" 
postag_regexp="yes"/>
          <token postag="V.[MSI].*" postag_regexp="yes" regexp="yes">.+e|.+[aei]sses|.+[ae]res|.+era|.+às<exception postag="_GV_"/></token>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <rule id="encara_mes_VerbAdj" name="encara/molt més dures">
    <!-- Adverb (RG.*) + "més" + a word that has both an adjective (A.*) reading and a
         V.IP.* verb reading: only the non-verb readings are kept. -->
    <pattern>
      <token postag="RG.*" postag_regexp="yes"/>
      <token>més</token>
      <marker>
        <and>
          <token postag="A.*" postag_regexp="yes"/>
          <token postag="V.IP.*" postag_regexp="yes"/>
        </and>
      </marker>
    </pattern>
    <disambig action="filter" postag="[^V].*"/>
  </rule>
  <rule id="VerbAdj_present" name="verb (present d'indicatiu) i adj que no ha concordat: confesses">
    <!-- A word that has both an adjective reading (A.*, not tagged _GN_.*) and a V.IP2S..?
         verb reading is resolved to its verb readings; the disambig action sits further
         down in this rule. -->
    <antipattern>
      <!-- Do not apply when a V.[SI].* / _GV_ token precedes the V.IP2S..? token,
           optionally separated by up to four RG / LOC_ADV tokens. -->
      <token postag="V.[SI].*|_GV_" postag_regexp="yes"/>
      <token min="0" max="4" postag="RG|LOC_ADV" postag_regexp="yes"/>
      <token postag="V.IP2S..?" postag_regexp="yes"/>
    </antipattern>
    <pattern>
      <!-- Preceding token: anything except an opening quote/bracket character or "més". -->
      <token><exception regexp="yes">["“«'‘(]|més</exception></token>
      <marker>
        <and>
          <token postag="A.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token>
          <token postag="V.IP2S..?"
postag_regexp="yes"><exception regexp="yes">subjectes|estables|lliures|nous|paleses|concretes|complexes|dures|actives|fines|primes|baixes|justes|barates|rica|riques</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="V.*"/> </rule> <rule id="verbadj_lliure" name="verb/adj -> adj: lliure"> <pattern> <marker> <and> <token postag="A.*" postag_regexp="yes" regexp="yes">lliures?</token> <token postag="V.[SI].*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> </pattern> <disambig action="remove" postag="V.*"/> </rule> <rule id="verbnom_dubte_compte" name="verb/nom -> verb: compte, dubte"> <pattern> <marker> <and> <token postag="VM[ISM].*" postag_regexp="yes" regexp="yes">comptes?|dubtes?|rest(a|es)</token> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="_GV_"/> </and> </marker> </pattern> <disambig action="filter" postag="V.*|_GV_"/> </rule> <rulegroup id="nParticipi" name="no participi si no ha concordat"> <antipattern> <token regexp="yes">me|ma</token> <token postag="V.P..SM." 
postag_regexp="yes"/> </antipattern> <rule> <!-- paraules que habitualment no són participi si no han concordat (darrere de "de"?: base de dades, sistema de partits --> <pattern> <and> <token postag="V.P.*" postag_regexp="yes" regexp="yes">costats?|vista|partida|dada|dades|partits?|estats?|beguda|begudes<exception postag="_GN_.*|_GV_" postag_regexp="yes"/><exception scope="previous" regexp="yes">e|as|em|eu|an</exception></token> <token postag="N.*" postag_regexp="yes"/> </and> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <!-- A més, són nom si tenen un adjectiu al darrere que concorda --> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <and> <token postag="V.P.*" postag_regexp="yes" regexp="yes">partida|dada|dades|partits?|estats?|beguda|begudes</token> <token postag="N.*" postag_regexp="yes"/> </and> <token postag="A.*|V.P.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> <rule> <pattern> <marker> <token postag="N.*" postag_regexp="yes" regexp="yes">resposta|respostes</token> </marker> <token regexp="yes">que|de|d'</token> </pattern> <disambig action="remove" postag="V.P.*"/> </rule> </rulegroup> <!-- <rule id="sParticipi" name="Altrament sí que són participi"> <pattern> <marker> <and> <token postag="V.P.*" postag_regexp="yes"></token> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes" /></token> </and> </marker> <token postag="N.*" postag_regexp="yes"><exception postag="V.[IS].*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="[^N].*"></disambig> </rule> --> <!-- verb + adj/verb Havien estat ocultes. 
Mogut per: cap historiador reputat accepta aquesta teoria --> <rule id="verb_nom2" name="verb + adjectiu"> <pattern> <token postag="V.*" postag_regexp="yes"><exception postag="N.*|_GN.*" postag_regexp="yes"/><exception inflected="yes">haver</exception></token> <!-- les persones som consumidores --> <marker> <and> <token postag="V.[^GNP].*" postag_regexp="yes"/> <!-- inclòs el gerundi?? --> <token postag="A.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> <!-- s'incorporaren nou seminaristes--> </rule> <!-- Desactivat per: el conjunt porta el nom <rule id="verb_nom4c" name="verb + nom"> <pattern> <and> <token postag="V.[IS].*|_GV_" postag_regexp="yes"><exception postag="PP.*|P0.*" postag_regexp="yes"/></token> <token postag="N.*|_GN.*" postag_regexp="yes" negate_pos="yes"></token> </and> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"></token> <token postag="N.*" postag_regexp="yes"></token> </and> </marker> </pattern> <disambig action="filter" postag="[^V].*"></disambig> </rule> --> <!-- nom + nom/verb La comunitat fou. 
Canviat de lloc per: un dels membres deixa --> <rule id="verb_nom5a" name="verb + nom"> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="[AD].*|_GV_|V.[SI].*" postag_regexp="yes"/></token> <marker> <and> <token postag="V.P.*" postag_regexp="yes"/> <!--respostes per--> <token postag="N.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> </and> </marker> <token><exception postag="SPS.*" postag_regexp="yes"/><exception>que</exception></token> </pattern> <disambig action="filter" postag="V.P.*"/> </rule> <!-- <rule id="verb_nom5" name="verb + nom"> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="[AD].*|V.N.*|RG.*" postag_regexp="yes"></exception><exception inflected="yes" regexp="yes">mot|paraula|terme|expressió|vocable|nom|tipus</exception></token> La gran taula <marker> <and> <token postag="V.[MSI].*" postag_regexp="yes"><exception regexp="yes">cap|força</exception></token> <token postag="N.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes" /></token> </and> </marker> </pattern> <disambig action="filter" postag="V.*"></disambig> </rule> --> <rulegroup id="nAdjectiu" name="no adjectiu si no ha concordat"> <!-- paraules que habitualment no són adjectius si no han concordat: fer|segons|envolta--> <rule> <antipattern> <token postag="V.[SIN].*|_GV_" postag_regexp="yes"/> <token min="0" max="4" postag="RG|LOC_ADV" postag_regexp="yes"/> <token postag="A.*" postag_regexp="yes"/> </antipattern> <pattern> <token><exception postag="RG_anteposat"/></token> <marker> <and> <token postag="A.*" postag_regexp="yes" regexp="yes">dura|acceptes|manca|vius?|accepta|palesa|manifesta|ultra|vers|lluny|presta|som|sabeu|seré|fer|afecta|alterna|ciutadà|ciutadans|ciutadana|ciutadanes|jugadors?|jugadora|jugadores|cantants?<exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="A.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/> </and> </marker> </pattern> <disambig action="remove" 
postag="A.*"/>
    </rule>
    <rule>
      <!-- "dura" (with an A.* reading, not tagged _GN_.*) immediately followed by a quantity
           adverb such as "més" or "menys": the A.* readings are removed from "dura". -->
      <pattern>
        <marker>
          <and>
            <token postag="A.*" postag_regexp="yes">dura<exception postag="_GN_.*" postag_regexp="yes"/></token>
            <token postag="A.*" postag_regexp="yes" negate_pos="yes"/>
          </and>
        </marker>
        <token regexp="yes">més|menys|manco|molt|poc|moltíssim|poquíssim</token>
      </pattern>
      <disambig action="remove" postag="A.*"/>
    </rule>
    <rule>
      <!-- Listed words (matched with inflected="yes") that carry an A.* reading but are not
           tagged _GN_.*: the A.* readings are removed. The preceding token must not be
           tagged RG_anteposat and must not be "com". -->
      <pattern>
        <token><exception postag="RG_anteposat"/><exception>com</exception></token>
        <marker>
          <and>
            <!-- Original note: "dret" (presumably a candidate word for the list below; confirm). -->
            <token postag="A.*" postag_regexp="yes" regexp="yes" inflected="yes">titular|redactor|directiu|carreter|mural|promotor|director|estranger|missatger|motiu|part|restaurant|parella<exception postag="_GN_.*" postag_regexp="yes"/></token>
            <token postag="A.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/>
          </and>
        </marker>
      </pattern>
      <disambig action="remove" postag="A.*"/>
    </rule>
    <rule>
      <!-- "recull", "tria", "caça", "expressa" (not tagged _GN_.*, previous token not V.[IS].*)
           followed by a token with an [ND].* or RG reading: adjective and noun readings
           ([AN].*) are removed. -->
      <pattern>
        <marker>
          <and>
            <token regexp="yes">recull|tria|caça|expressa<exception postag="_GN_.*" postag_regexp="yes"/><exception scope="previous" postag="V.[IS].*" postag_regexp="yes"/></token>
            <token postag="A.*|SENT_END|PARA_END" postag_regexp="yes" negate_pos="yes"/>
          </and>
        </marker>
        <token postag="[ND].*|RG" postag_regexp="yes"/>
      </pattern>
      <disambig action="remove" postag="[AN].*"/>
    </rule>
  </rulegroup>
  <rule id="corrent_per_gerundi" name="corrent per (gerundi)">
    <!-- "corrent" with a VMG00000 reading (and no _GN.* tag) followed by a token matched as
         inflected "per": only the VMG00000 reading is kept. -->
    <pattern>
      <marker>
        <token postag="VMG00000">corrent<exception postag="_GN.*" postag_regexp="yes"/></token>
      </marker>
      <token inflected="yes">per</token>
    </pattern>
    <disambig action="filter" postag="VMG00000"/>
  </rule>
  <rulegroup id="Nom_AdjectiuNoConcorda" name="nom + adjectiu que no han concordat (comú)">
    <rule>
      <pattern>
        <!-- Preceding token: has an N.* reading and no V.*, A.*, complement.* or _GV_ reading,
             and is not a form of one of the listed metalinguistic nouns. -->
        <token postag="N.*" postag_regexp="yes"><exception postag="V.*|A.*|complement.*|_GV_" postag_regexp="yes"/><exception inflected="yes" regexp="yes">mot|paraula|terme|expressió|vocable|nom|tipus|denominació</exception></token>
        <marker>
          <and>
            <token postag="N.*" postag_regexp="yes"><exception
regexp="yes">\p{Lu}.+</exception></token> <token postag="V.P.*|AQ.*" postag_regexp="yes"><exception postag="_GN.*|SPS00|V.[GMIS].*|CC|RG.*" postag_regexp="yes"/></token> <!-- exc. just allà --> </and> </marker> </pattern> <disambig action="filter" postag="V.P.*|AQ.*"/> </rule> <rule> <!-- problema: poden crear de forma espontània parells electró-positró. --> <pattern> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="_GN_.*" postag_regexp="yes"/> </and> <and> <token postag="A.*" postag_regexp="yes"/> <token postag="_GN_.*" postag_regexp="yes"/> </and> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*|AQ.*" postag_regexp="yes"><exception postag="_GN.*|SPS00|V.[GMIS].*|CC|RG.*" postag_regexp="yes"/></token> <!-- exc. just allà --> </and> </marker> </pattern> <disambig action="filter" postag="V.P.*|AQ.*"/> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="N.*" postag_regexp="yes"/> <token postag="RG_anteposat"/> <token postag="A.*" postag_regexp="yes"/> </unify> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*|AQ.*" postag_regexp="yes"><exception postag="_GN.*|SPS00|V.[GMIS].*|CC|RG.*" postag_regexp="yes"/></token> <!-- exc. 
just allà --> </and> </marker> </pattern> <disambig action="filter" postag="V.P.*|AQ.*"/> </rule> </rulegroup> <!--<rule id="GN_verb" name="GN verb: el pare no hi és"> <pattern> <token postag="_GN_.*" postag_regexp="yes"/> <marker> <and> <token postag="_GN_.*" postag_regexp="yes"/> <token postag="_GV_"/> </and> </marker> <token postag="V.[SI].*|&pronom_feble;|RN" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="_GN_.*|[AN].*"></disambig> </rule> --> <rule id="GV_GN" name="un cas concret d'ambiguitat GV/GN"> <!-- "el parla gran quantitat de persones --> <pattern> <token postag="_GV_"><exception postag="_GN_.*" postag_regexp="yes"/></token> <marker> <and> <token postag="_GV_"/> <token postag="_GN_.*" postag_regexp="yes"/> </and> </marker> <token postag="_GN_.*" postag_regexp="yes"/> <and> <token postag="NC.*|PX.*" postag_regexp="yes"><exception regexp="yes">col?p|vegada|volta</exception></token> <token postag="_GN_.*" postag_regexp="yes"/> </and> </pattern> <disambig action="filter" postag="_GV_|V.*"/> </rule> <rule id="verbnom_GN" name="verb/nom + GN"> <!-- a tots els toca la seva part --> <pattern> <and> <token postag="_GV_"><exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="P.*" postag_regexp="yes"/> </and> <marker> <and> <token postag="_GV_"/> <token postag="N.*" postag_regexp="yes"/> </and> </marker> <token postag="_GN_.*" postag_regexp="yes"/> <and> <token postag="NC.*|PX.*|A.*" postag_regexp="yes"><exception regexp="yes">col?p|vegada|volta</exception></token> <token postag="_GN_.*" postag_regexp="yes"/> </and> </pattern> <disambig action="filter" postag="_GV_|V.[^M].*"/> <example type="untouched">Hauria fet <marker>falta</marker> un coet.</example> </rule> <!-- nom + nom/prep Enfrontament contra. Enfrontament sindical contra. 
Mogut per: "la gran via de" via (prep.)--> <rule id="nom_prep" name="nom + preposició"> <pattern> <token postag="N.*|A.*" postag_regexp="yes"/> <marker> <and> <token postag="N.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="SPS00"/> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule id="haver_de" name="haver de + infinitiu"> <pattern> <marker> <token postag="VA.*" postag_regexp="yes" inflected="yes">haver</token> </marker> <token regexp="yes">de|d'</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="VA.*|_GV_|_obligacio"/> </rule> <rule id="VerbAuxiliar" name="verb auxiliar i no auxiliar"> <pattern> <marker> <and> <token postag="VA.*" postag_regexp="yes"><exception postag="_GV_"/></token> <token postag="VM.*" postag_regexp="yes" inflected="yes">anar</token> </and> </marker> </pattern> <disambig action="filter" postag="VM.*"/> </rule> <rule id="VerbPrep" name="verb i preposició: preposició"> <!-- cas: sense llevat. Quan entre en... 
--> <pattern> <marker> <and> <token postag="V.*" postag_regexp="yes"><exception postag="_GV_"/><exception>salvat</exception></token> <token postag="SPS.*" postag_regexp="yes"/> </and> </marker> <token><exception postag="SPS.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="sobre" name="sobre no verb"> <pattern> <marker> <and> <token postag="V.*" postag_regexp="yes">sobre<exception postag="_GV_"/></token> <token postag="SPS.*" postag_regexp="yes"/> </and> </marker> <token postag="SPS00"/> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule id="GerAdj" name="gerundi i adj: gerundi"> <pattern> <token><exception postag="SPS00|CC|_PUNCT.*|SENT_START" postag_regexp="yes"/><exception inflected="yes" regexp="yes">ser|estar|semblar|parèixer|considerar|tan|tant</exception></token> <!-- en calent --> <marker> <and> <token postag="V.G.*" postag_regexp="yes"><exception regexp="yes">arrogant|equivalent|important|corrent|justificant</exception></token> <!-- exception: tots els verbs reflexius --> <token postag="A.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="V.G.*"/> </rule> <rule id="mal" name="mal (adv)"> <pattern> <marker> <token postag="RG.*" postag_regexp="yes">mal<exception postag="_GN.*" postag_regexp="yes"/></token> </marker> <token postag="V.P.*|A.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="RG.*"/> </rule> <rule id="Prep_NomAdv" name="prep + nom i adverbi"> <!-- fins demà, de mal vestida--> <pattern> <token postag="SPS.*" postag_regexp="yes"/> <marker> <and> <token postag="R.*" postag_regexp="yes"><exception inflected="yes" regexp="yes">llarg|tot|infinit|lli</exception><exception postag="_GN.*" postag_regexp="yes"/></token> <token postag="N.*" postag_regexp="yes"/> </and> </marker> <token postag="AQ.*|V.P.*" postag_regexp="yes"/> </pattern> <disambig action="filter" 
postag="[^N].*"/> </rule> <rule id="Prep_NomAltres" name="preposició + nom i altres: nom"> <!-- problema: de gran lirisme. A petita escala --> <pattern> <token postag="SPS.*" postag_regexp="yes"/> <marker> <and> <token postag="N.*|A.*|V.P.*" postag_regexp="yes" negate_pos="yes"><exception postag="DN.*|_GN.*|_GV_|(DI|DE|DT|PT).*|PI.*" postag_regexp="yes"/></token> <token postag="N.*|A.*|V.P.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="N.*|A.*|V.P.*|_english_ignore_"/> </rule> <rule id="PrepNom_llevat" name="preposició o nom: llevat"> <!-- potser no és prep.: cap --> <pattern> <marker> <and> <token postag="SPS.*" postag_regexp="yes">llevat</token> <token postag="N.*" postag_regexp="yes"/> </and> </marker> <token><exception regexp="yes">això|de|d'</exception></token> </pattern> <disambig action="filter" postag="[^S].*"/> </rule> <rule id="ates_el" name="atès el/atesa la"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <token postag="V.P.*" postag_regexp="yes" regexp="yes">atesa|ateses</token> </marker> <token postag="D.*" postag_regexp="yes"/> </unify> </pattern> <disambig action="remove" postag="N.*"/> </rule> <rulegroup id="PrepNom" name="preposició + nom: prep. 
Ex: contra"> <!-- potser no és prep.: cap --> <rule> <pattern> <marker> <and> <token postag="SPS.*" postag_regexp="yes"><exception scope="previous" postag="D[^N].*" postag_regexp="yes"/></token> <token postag="N.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule> <pattern> <token regexp="yes">tot|tots|totes|algun|alguns|algunes</token> <marker> <and> <token postag="SPS.*" postag_regexp="yes" regexp="yes">via|vora</token> <token postag="N.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> </and> </marker> <token postag="D.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> </rulegroup> <rule id="cantant" name="cantant"> <pattern> <marker> <token postag="NCCS000">cantant</token> </marker> <token inflected="yes">de</token> </pattern> <disambig action="remove" postag="A.*|V.G.*"/> </rule> <rule id="InfGer_Nom" name="infinitiu o gerundi / nom que no ha concordat"> <!-- ser, deixant, etc. 
excep: tan regular (adj)--> <pattern> <token><exception postag="RG.*" postag_regexp="yes"/></token> <marker> <and> <token postag="V.[NG].*" postag_regexp="yes" regexp="yes">\p{Ll}.*<exception regexp="yes">seient|justificant</exception></token> <token postag="NC.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rulegroup id="CAP2" name="cap: tractament especial (det, adj, nom, adv, verb...)"> <!-- TODO: ampliar cap cabre VMIP1S0 cap cabre VMIP3S0 cap cabre VMM02S0 cap cap DI0CS0 cap cap NCCS000 cap cap NCMS000 cap cap PI0CS000 cap cap SPS00 cap capar VMIP1S0--> <rule> <pattern> <token postag="VM.*" postag_regexp="yes" regexp="yes" inflected="yes" skip="2">anar|córrer|traslladar|moure|avançar|caminar</token> <marker> <token postag="SPS.*" postag_regexp="yes">cap</token> </marker> </pattern> <disambig action="filter" postag="SPS.*"/> </rule> <rule> <!-- cap d'aquells homes. Excep: el cap d'aquells homes--> <pattern> <marker> <token postag="SPS.*" postag_regexp="yes">cap<exception postag="_GN_MS"/></token> </marker> <token regexp="yes">de|d'</token> <token postag="D[AD].*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="PI.*"/> </rule> </rulegroup> <rule id="primer_adj" name="primer (adjectiu, no adverbi)"> <antipattern> <token skip="5">primer</token> <token regexp="yes" min="1" max="2">,|i</token> <token regexp="yes">després|posteriorment</token> </antipattern> <pattern> <token postag="SENT_START|_PUNCT.*" postag_regexp="yes"/> <token min="0" max="3" regexp="yes">\p{P}</token> <marker> <token postag="AO0MS0">primer</token> </marker> <token postag="NC.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="RG"/> </rule> <rulegroup id="FORCA2" name="força: tractament especial (det, adj, nom, adv, verb...)"> <!-- TODO: ampliar --> <rule> <pattern> <token regexp="yes" inflected="yes">guanyar|perdre</token> <marker> <token 
postag="NC.*" postag_regexp="yes">força</token> </marker> <token><exception postag="NC.*" postag_regexp="yes"/></token> </pattern> <disambig action="filter" postag="NC.*|_GN_.*"/> </rule> <rule> <pattern> <marker> <token postag="DI.*" postag_regexp="yes">força<exception postag="_GN_FS"/></token> </marker> <token postag="NC.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="DI.*|_GN_.*"/> </rule> <rule> <pattern> <token postag="V.N.*" postag_regexp="yes"/> <marker> <token postag="V.*" postag_regexp="yes">força</token> </marker> </pattern> <disambig action="filter" postag="[^V].*"/> </rule> <rule> <!-- cobra més força --> <pattern> <token postag="V.*" postag_regexp="yes"/> <token postag="RG"/> <marker> <token postag="N.*" postag_regexp="yes">força</token> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <pattern> <marker> <token postag="_GN_FS">força</token> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_.*|V.*|_GV_"/> </rule> <rule> <pattern> <marker> <token postag="_GN_FS">força<exception postag="_GV_"/></token> </marker> </pattern> <disambig action="filter" postag="N.*|_GN_.*"/> </rule> <rule> <pattern> <marker> <token postag="_GV_">força<exception postag="_GN_FS"/></token> </marker> </pattern> <disambig action="filter" postag="V.*|_GV_"/> </rule> <rule> <!-- nom+força+adj : Permet analitzar errors: era una dona força misteriós--> <pattern> <token postag="N.*" postag_regexp="yes"/> <marker> <and> <token postag="N.*" postag_regexp="yes">força</token> <token postag="RG_anteposat"/> <token postag="V.*" postag_regexp="yes"/> <token postag="DI.*" postag_regexp="yes"/> </and> </marker> <token postag="AQ.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="RG.*"/> </rule> </rulegroup> <rule id="AdvNom" name="adverbi i nom: no nom"> <!-- llavors company. 
Excepció: tant com, tant (de) mal com --> <pattern> <token><exception regexp="yes">tant|com</exception><exception postag="DN.*" postag_regexp="yes"/></token> <marker> <and> <token postag="RG.*" postag_regexp="yes"><exception regexp="yes">força|total|pla</exception></token> <token postag="N.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> <example type="untouched">Una obra per a dos piano.</example> </rule> <rule id="AdjAdv" name="adjectiu i adverbi"> <!-- correctament primer. Excep: tant (de) mal --> <antipattern> <token>conforme</token> <token>a</token> </antipattern> <antipattern> <token>l'</token> <token>ho</token> <token postag="A.*" postag_regexp="yes"/> </antipattern> <antipattern> <!-- error de concordança --> <token postag="NC.*" postag_regexp="yes"/> <token>llarg</token> </antipattern> <pattern> <token><exception regexp="yes">tant|com|tan|més</exception><exception postag="DA.*" postag_regexp="yes"/></token> <marker> <and> <token postag="RG.*" postag_regexp="yes"><exception>total</exception></token> <token postag="A.*" postag_regexp="yes"><exception postag="_GN.*|CC" postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="remove" postag="A.*"/> </rule> <rule id="PronomAltres" name="pronom i altres: altres"> <!-- en què, el gener --> <pattern> <marker> <and> <token postag="PP.*|P0.*" postag_regexp="yes"><exception postag="_GV_"/></token> <token postag="DA.*|SPS00" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^P].*"/> </rule> <rule id="GRANS" name="grans de cereals..."> <pattern> <marker> <token postag="NC.*" postag_regexp="yes">grans<exception scope="previous" postag="NC.P.*" postag_regexp="yes"/></token> </marker> <token regexp="yes">de|d'</token> <token postag="NC.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="N.*"/> <example type="untouched">Són fragments grans de 
membrana.</example> </rule> <rulegroup id="DEU" name="no és numeral si no ha concordat..."> <rule> <pattern> <marker> <and> <token postag="DN0CP0">deu</token> <token postag="V.*" postag_regexp="yes"><exception postag="_GN_.*|V.P.PM." postag_regexp="yes"/></token> </and> </marker> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> </rulegroup> <rule id="nNom2" name="no nom si no ha concordat"> <pattern> <and> <token postag="N.*" postag_regexp="yes" regexp="yes">feu|busca|busques|màgics?|màgica|màgiques|pinte|trenca|guarda|passa|salva|faig|dic|jeia|estaria|estaries|grossa|ros|suau|sobre|publicà|allò|parla|parles|deixa|deixes|torna|tornes|sabeu|seré|joves?|caus?|meritoris?|meritòri(a|es)|seca|resulta|porta|fou|grans?|surt|era|verticals?|visc<exception postag="_GN_.*" postag_regexp="yes"/></token> <token postag="[AVCP].*|SPS00" postag_regexp="yes"/> </and> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule id="el_no_article" name="el no article"> <!-- el feu cantar --> <pattern> <marker> <and> <token postag="DA.*" postag_regexp="yes"/> <token postag="_GV_"/> </and> </marker> <token min="0" postag="_QM_OPEN"/> <and> <token postag="V.[SI].*" postag_regexp="yes"/> <token postag="_GV_"><exception postag="_GN_.*|N.*" postag_regexp="yes"/></token> </and> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> <rule id="en_no_preposicio" name="en no preposició"> <!-- en porti --> <pattern> <marker> <and> <token postag="P.*" postag_regexp="yes">en</token> <token postag="_GV_"/> </and> </marker> <and> <token postag="V.[MSI].*" postag_regexp="yes"/> <token postag="_GV_"><exception postag="_GN_.*|N.*" postag_regexp="yes"/></token> </and> </pattern> <disambig action="remove"> <wd pos="SPS00"/> </disambig> </rule> <rule id="duc_verb" name="duc verb o nom"> <pattern> <token>que</token> <marker> <token postag="V.*" postag_regexp="yes">duc</token> </marker> </pattern> <disambig action="filter" postag="[^N].*"/> </rule> <rule id="EL_MES_x_POSSIBLE" 
name="el més gran possible"> <pattern> <token postag="DA.*" postag_regexp="yes"/> <token regexp="yes">més|menys</token> <token postag="AQ.*" postag_regexp="yes"/> <marker> <token postag="AQ.*" postag_regexp="yes" regexp="yes">possibles?</token> </marker> </pattern> <disambig action="filter" postag="AQ.*"/> </rule> <rule id="adjectius_que_concorden" name="adjectius que concorden, però no hi ha nom"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="V.P.*|A.*" postag_regexp="yes"><exception postag="_GN_.*|_GV_" postag_regexp="yes"/></token> <token postag="V.P.*|A.*" postag_regexp="yes"><exception postag="_GN_.*|_GV_|AQ0CN0" postag_regexp="yes"/></token> </unify> </pattern> <disambig action="unify"/> </rule> <rule id="Nom_AdjectiuNoConcorda2" name="nom + adjectiu, que no han concordat (comú)"> <!-- EXEMPLE D'UTILITAT:Dóna-hi l'últim ullada. Exception: recent (erroni com a adverbi), "recent casats" Problema: dos adjectius que concorden, però no són etiquetats amb _GN_ --> <pattern> <token><exception postag="N.*" postag_regexp="yes"/></token> <token postag="V.P.*|A.*" postag_regexp="yes"><exception postag="N.*" postag_regexp="yes"/><exception>recent</exception><exception inflected="yes" regexp="yes">poder|voler|saber</exception></token> <marker> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="V.P.*" postag_regexp="yes"><exception postag="_GN.*|SPS00|V.[GMIS].*|CC" postag_regexp="yes"/><exception inflected="yes" regexp="yes">donar|anomenar</exception></token> </and> </marker> </pattern> <disambig action="filter" postag="N.*"/> </rule> <!-- *****????????? 
mides moderades construït, El feminisme d'arrel il·lustrada reclama --> <!-- <rule id="VerbNomVerb" name="verbnom + verb"> <pattern> <marker> <and> <token postag="V.[IS].*" postag_regexp="yes"></token> <token postag="_GN.*" postag_regexp="yes"><exception postag="_GV_"/></token> </and> </marker> <and> <token postag="V.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes" negate_pos="yes"/> </and> </pattern> <disambig action="filter" postag="[^V].*"></disambig> </rule> --> <rule id="AiN" name="adjectiu i nom: adjectiu (algunes paraules?) comú"> <pattern> <and> <token postag="A.*" postag_regexp="yes" inflected="yes" regexp="yes">comú|pendent</token> <token postag="N.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/></token> </and> </pattern> <disambig action="filter" postag="A.*"/> </rule> <rule id="en_article" name="En article"> <pattern> <unify> <feature id="nombre"/> <feature id="genere"/> <marker> <and> <token postag="DA.*" postag_regexp="yes">en</token> <token postag="SPS.*" postag_regexp="yes"/> </and> </marker> <token postag="NP..SP0" postag_regexp="yes"/> </unify> </pattern> <disambig action="filter" postag="DA.*|_GN.*"/> </rule> <rule id="en_no_article" name="En no article"> <pattern> <marker> <and> <token postag="DA.*" postag_regexp="yes">en</token> <token postag="SPS.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="SPS.*"/> </rule> <rulegroup id="interjeccio" name="interjeccions"> <rule> <pattern> <token>,</token> <marker> <token postag="I"><exception postag="_GN.*|DA.*|A.*|VA.*" postag_regexp="yes"/></token> </marker> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="I"/> </rule> <rule> <pattern> <token postag="SENT_START"/> <marker> <token postag="I"><exception postag="_GN.*|DA.*|A.*|VA.*" postag_regexp="yes"/></token> </marker> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="I"/> </rule> <rule> <pattern> <token 
postag="SENT_START|CC|_PUNCT.*" postag_regexp="yes"/>
        <marker>
          <token>vaja</token>
        </marker>
        <token postag="CC|_PUNCT.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="replace" postag="I"/>
    </rule>
    <rule>
      <!-- "vaja" followed by an inflected form matching quin|com: replace action with tag I. -->
      <pattern>
        <token>vaja</token>
        <token inflected="yes" regexp="yes">quin|com</token>
      </pattern>
      <disambig action="replace" postag="I"/>
    </rule>
  </rulegroup>
  <rule id="PI_N" name="pronom indefinit i nom">
    <!-- A token read both as a common noun (NC.*) and as an indefinite pronoun (PI.*),
         where the noun reading carries no _GN.* tag and the previous token is not DA.*:
         keep only the readings whose tag does not start with N. -->
    <pattern>
      <and>
        <token postag="NC.*" postag_regexp="yes"><exception postag="_GN.*" postag_regexp="yes"/><exception scope="previous" postag="DA.*" postag_regexp="yes"/></token>
        <token postag="PI.*" postag_regexp="yes"/>
      </and>
    </pattern>
    <disambig action="filter" postag="[^N].*"/>
  </rule>
  <!-- specific words -->
  <rule id="segons5" name="segons + verb">
    <!-- "segons" with a CS reading followed by a V.[IS].* verb form: keep only CS. -->
    <pattern>
      <marker>
        <token postag="CS">segons</token>
      </marker>
      <token postag="V.[IS].*" postag_regexp="yes"/>
    </pattern>
    <disambig action="filter" postag="CS"/>
  </rule>
  <rule id="segons5b" name="segons + pronom">
    <!-- "segons" with a CS reading followed by a P0.*/PP.* pronoun that has no _GN_ tag
         and is not one of the listed pronoun forms (jo, mi, tu, ell, ...): keep only CS. -->
    <pattern>
      <marker>
        <token postag="CS">segons</token>
      </marker>
      <token postag="P0.*|PP.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes"/><exception regexp="yes">jo|mi|tu|ella?|nosaltres|vosaltres|elle?s|vost[èé]s?|vós</exception></token>
    </pattern>
    <disambig action="filter" postag="CS"/>
  </rule>
  <rule id="segons6" name="segons preposició">
    <!-- Any "segons" that carries an SPS00 reading keeps only SPS00. -->
    <pattern>
      <marker>
        <token postag="SPS00">segons</token>
      </marker>
    </pattern>
    <disambig action="filter" postag="SPS00"/>
  </rule>
  <rule id="PronomNom2" name="nom i pronom">
    <!-- jo, mi, la, te, ens. Exception: de te.
--> <pattern> <marker> <and> <token postag="PP.*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes">te</token> <token postag="_GN_.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="[^P].*"/> </rule> <rulegroup id="fa_x_temps2" name="fa tres anys, molt de temps"> <!-- segona passada de la regla: per a evitar les excepcions de Verbs |NP..SP.* PI0CS000| --> <antipattern> <token>bon</token> <token>dia</token> </antipattern> <rule> <pattern> <token><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception><exception regexp="yes">què|quant</exception></token> <marker> <token postag="V.I[PI]3S0.?" postag_regexp="yes" inflected="yes" skip="12">fer<exception postag=".*LOC_ADV.*" postag_regexp="yes"/><exception scope="next" regexp="yes">que|en</exception><exception scope="next" postag="_PUNCT.*" postag_regexp="yes">,</exception><exception postag="V.[MSI].*|_GV_|DA.*" postag_regexp="yes" scope="next"/></token> </marker> <token regexp="yes">segons?|minuts?|hor(a|es)|di(a|es)|setman(a|es)|mes|mesos|(tri|quadri|se)mestres?|anys?|lustres?|dècad(a|es)|segles?|mil·lennis?|moments?|instants?|temps|estona|estius?|primaver(a|es)|hiverns?</token> </pattern> <disambig action="add"> <wd pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token><exception postag="&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception></token> <token postag="V.I[PI]3S0.?" 
postag_regexp="yes" inflected="yes" skip="12">fer<exception scope="next" regexp="yes">que|en</exception><exception scope="next" postag="_PUNCT.*" postag_regexp="yes">,</exception><exception postag="V.[MSI].*|_GV_|DA.*" postag_regexp="yes" scope="next"/></token> <marker> <token regexp="yes">segons?|minuts?|hor(a|es)|di(a|es)|setman(a|es)|mes|mesos|(tri|quadri|se)mestres?|anys?|lustres?|dècad(a|es)|segles?|mil·lennis?|moments?|instants?|temps|estona|estius?|primaver(a|es)|hiverns?</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token><exception postag="NP..SP.*|&pronom_feble;" postag_regexp="yes" regexp="yes">[^'-].+</exception></token> <marker> <token postag="V.I[PI]3S0.?" postag_regexp="yes" inflected="yes" skip="1">fer<exception postag=".*LOC_ADV.*" postag_regexp="yes"/><exception scope="next" regexp="yes">,|que|en</exception><exception postag="V.[MSI].*|_GV_" postag_regexp="yes" scope="next"/></token> <token regexp="yes">molt|moltíssim|poc|poquet|poquíssim|barbaritat</token> </marker> <token><exception postag="AQ.*|V.P.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token>fins</token> <marker> <token postag="V.I[PI]3S0.?" 
postag_regexp="yes" inflected="yes" skip="1">fer<exception postag=".*LOC_ADV.*" postag_regexp="yes"/><exception scope="next" regexp="yes">,|que|en</exception><exception postag="V.[MSI].*|_GV_" postag_regexp="yes" scope="next"/></token> <token regexp="yes">poquet|poc|poquíssim</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> </rule> <rule> <pattern> <token>no</token> <token regexp="yes">fa|feia</token> <token>tant</token> </pattern> <disambig action="add"> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> <wd pos="LOC_ADV"/> </disambig> </rule> </rulegroup> <rule id="car" name="car (si no ha concordat com a nom o adjectiu)"> <pattern> <token><exception postag="RG.*" postag_regexp="yes"/></token> <marker> <token postag="CC">car<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="CC"/> </rule> <rule id="cert" name="cert: no determinant si no ha concordat"> <pattern> <!-- <token><exception postag="RG.*" postag_regexp="yes"/></token> --> <marker> <token postag="AQ.*" postag_regexp="yes" inflected="yes">cert<exception postag="_GN_.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="filter" postag="AQ.*"/> </rule> <!-- <rule id="tant_x_com" name="tant + __ + com"> <pattern> <marker> <token>tant</token> </marker> <token skip="-1"></token> <token>com</token> </pattern> <disambig> <match no="1" postag_regexp="yes" postag="RG"></match> </disambig> </rule> --> <rule id="elsuns_x_elsaltres" name=" (els) uns + prep + els altres"> <pattern> <token skip="1">uns</token> <marker> <token postag="SP.*" postag_regexp="yes" skip="1"/> </marker> <token>altres</token> </pattern> <disambig> <match no="1" postag_regexp="yes" postag="SP.*"/> </disambig> </rule> <!-- <rule id="lun_x_laltre" name=" un __ l'altre"> cal millorar-la <pattern> <token>un</token> <token skip="3"></token> <marker> <token>altre</token> </marker> </pattern> <disambig><match no="3" 
postag_regexp="yes" postag="P.*|_GN_MS"></match></disambig> </rule> -->
  <!-- Disabled rule, kept for reference: -->
  <!-- <rule id="buidaGN" name="elimina etiquetes GN"> <pattern> <token></token> </pattern> <disambig action="filter" postag="[^_].*"></disambig> </rule> -->
  <rule id="tant_no_determinant" name="tant no determinant">
    <!-- "tant" with a DI0MS0 reading and no _GN_MS tag, followed by a token that is neither
         NC.*/A.* nor an inflected form of "de": remove its D.* readings. -->
    <pattern>
      <marker>
        <token postag="DI0MS0">tant<exception postag="_GN_MS"/></token>
      </marker>
      <token><exception postag="NC.*|A.*" postag_regexp="yes"/><exception inflected="yes">de</exception></token>
    </pattern>
    <disambig action="remove" postag="D.*"/>
  </rule>
  <rulegroup id="CASOS_CONCRETS" name="alguns casos concrets">
    <rule id="mostres" name="mostra/mostres de">
      <!-- "mostra"/"mostres" read both as verb (V.*) and common noun (NC.*), followed by
           "de"/"d'": keep only the NC.* readings. Can this be generalized? -->
      <pattern>
        <marker>
          <and>
            <token postag="V.*" postag_regexp="yes" regexp="yes">mostres|mostra</token>
            <token postag="NC.*" postag_regexp="yes"/>
          </and>
        </marker>
        <token regexp="yes">de|d'</token>
      </pattern>
      <disambig action="filter" postag="NC.*"/>
    </rule>
  </rulegroup>
  <!-- Helper tags useful for some rules -->
  <rulegroup id="diferent_del_del" name="diferent del del">
    <rule>
      <!-- "de" between diferent(s)/distint(a|s|es) and a DA.* token: add the allow_repetition tag. -->
      <pattern>
        <token regexp="yes">diferents?|distint(s|a|es)?</token>
        <marker>
          <token>de</token>
        </marker>
        <token postag="DA.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="add">
        <wd pos="allow_repetition"/>
      </disambig>
    </rule>
    <rule>
      <!-- "de" in "a diferència de" + DA.* token: add the allow_repetition tag. -->
      <pattern>
        <token>a</token>
        <token>diferència</token>
        <marker>
          <token>de</token>
        </marker>
        <token postag="DA.*" postag_regexp="yes"/>
      </pattern>
      <disambig action="add">
        <wd pos="allow_repetition"/>
      </disambig>
    </rule>
    <rule>
      <!-- Second of two consecutive "cap" tokens, followed by one of the listed direction
           adverbs (arrere, enrere, endarrere, avant, envant, endavant): immunize it. -->
      <pattern>
        <token>cap</token>
        <marker>
          <token>cap</token>
        </marker>
        <token regexp="yes">arrere|enrere|endarrere|avant|envant|endavant</token>
      </pattern>
      <disambig action="immunize"/>
    </rule>
  </rulegroup>
  <rulegroup id="nom_en_complement" name="nom en complement">
    <rule>
      <pattern>
        <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception>a</exception></token>
        <marker>
          <token postag="N.*|PI.*|PD.*" postag_regexp="yes"><exception>molt</exception></token>
        </marker>
      </pattern>
<disambig action="add"> <wd pos="complement"/> </disambig> <example type="untouched">S'estan convertint en molt extremistes</example> </rule> <rule> <pattern> <token>com</token> <marker> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception>a</exception></token> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="D[ADI].*" postag_regexp="yes"/> <marker> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception>a</exception></token> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="PX.*" postag_regexp="yes"/> <marker> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception>a</exception></token> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="D[ADI].*" postag_regexp="yes"/> <token postag="A.*|V.P.*" postag_regexp="yes"/> <marker> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception>a</exception></token> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="A.*|V.P.*" postag_regexp="yes"/> <marker> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <!-- Durant el període medieval gremis d'artesans --> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> 
<and> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"><exception postag="DI.*" postag_regexp="yes"/></token> <token postag="complement" postag_regexp="yes"/> </and> <marker> <token postag="A.*|V.P.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <and> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"><exception postag="DI.*" postag_regexp="yes"/></token> <token postag="complement" postag_regexp="yes"/> </and> <token postag="RG_anteposat"/> <marker> <token postag="A.*|V.P.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes"><exception>a</exception></token> <marker> <token postag="PD0NS000"/> </marker> </pattern> <disambig action="add"> <wd pos="complement"/> </disambig> </rule> <!-- complement regit per la preposició 'a' --> <rule> <pattern> <token>a</token> <marker> <token postag="N.*|PI.*|PD.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <token>a</token> <token postag="D[ADI].*" postag_regexp="yes"/> <marker> <token postag="N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <token>a</token> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="DA.*" postag_regexp="yes"/> <token postag="PX.*" postag_regexp="yes"/> <marker> <token postag="N.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <token>a</token> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="D[ADI].*" postag_regexp="yes"/> <token postag="A.*|V.P.*" postag_regexp="yes"/> <marker> <token postag="N.*" postag_regexp="yes"/> </marker> 
</unify> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <token>a</token> <unify> <feature id="genere"/> <feature id="nombre"/> <token postag="A.*|V.P.*" postag_regexp="yes"/> <marker> <token postag="N.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <token>a</token> <marker> <token postag="PD0NS000"/> </marker> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="complement_a" postag_regexp="yes"/> </and> <marker> <token postag="A.*|V.P.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="genere"/> <feature id="nombre"/> <and> <token postag="N.*" postag_regexp="yes"/> <token postag="complement_a" postag_regexp="yes"/> </and> <token postag="RG_anteposat"/> <marker> <token postag="A.*|V.P.*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="complement_a"/> </disambig> </rule> <rule> <pattern> <and> <token postag="NCF.*" postag_regexp="yes"/> <token postag="complement.*" postag_regexp="yes"/> </and> <token>i</token> <marker> <token>mitja</token> </marker> </pattern> <disambig action="replace"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <and> <token postag="NCM.*" postag_regexp="yes"/> <token postag="complement.*" postag_regexp="yes"/> </and> <token>i</token> <marker> <token>mig</token> </marker> </pattern> <disambig action="replace"> <wd pos="complement"/> </disambig> </rule> <rule> <pattern> <token>cada</token> <marker> <token postag="N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="complement_cada"/> </disambig> </rule> </rulegroup> <rulegroup id="adj_ignore_concordance" 
name="adjectiu que ja acompanya un nom">
    <!-- Every rule in this group adds the ignore_concordance tag to the marked token. -->
    <rule>
      <!-- N.* token + marked A.*/PX.*/V.P.* token, unified on genere and nombre. -->
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <token postag="N.*" postag_regexp="yes"/>
          <marker>
            <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/>
          </marker>
        </unify>
      </pattern>
      <disambig action="add">
        <wd pos="ignore_concordance"/>
      </disambig>
    </rule>
    <rule>
      <!-- N.* token + A.*/PX.*/V.P.* token + marked A.*/PX.*/V.P.* token, all unified. -->
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <token postag="N.*" postag_regexp="yes"/>
          <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/>
          <marker>
            <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/>
          </marker>
        </unify>
      </pattern>
      <disambig action="add">
        <wd pos="ignore_concordance"/>
      </disambig>
    </rule>
    <rule>
      <!-- Same as above with one of "i", "o", "ni" or "," before the marked token. -->
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <token postag="N.*" postag_regexp="yes"/>
          <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/>
          <token regexp="yes">i|o|ni|,</token>
          <marker>
            <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/>
          </marker>
        </unify>
      </pattern>
      <disambig action="add">
        <wd pos="ignore_concordance"/>
      </disambig>
    </rule>
    <rule>
      <!-- N.* token + RG_anteposat token + marked A.*/PX.*/V.P.* token. -->
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <token postag="N.*" postag_regexp="yes"/>
          <token postag="RG_anteposat"/>
          <marker>
            <token postag="A.*|PX.*|V.P.*" postag_regexp="yes"/>
          </marker>
        </unify>
      </pattern>
      <disambig action="add">
        <wd pos="ignore_concordance"/>
      </disambig>
    </rule>
    <rule>
      <!-- One of the listed pronoun forms (jo, mi, tu, ell, ...) + marked inflected form of "mateix". -->
      <pattern>
        <unify>
          <feature id="genere"/>
          <feature id="nombre"/>
          <token regexp="yes">jo|mi|tu|ella?|nosaltres|vosaltres|elle?s|vost[èé]s?|vós</token>
          <marker>
            <token inflected="yes">mateix</token>
          </marker>
        </unify>
      </pattern>
      <disambig action="add">
        <wd pos="ignore_concordance"/>
      </disambig>
    </rule>
  </rulegroup>
  <rulegroup id="tot_toponim" name="tot + topònim">
    <rule>
      <!-- "tot" or "mig" directly before an NPFSG00 token: add the allow_masculine tag. -->
      <pattern>
        <marker>
          <token regexp="yes">tot|mig</token>
        </marker>
        <token postag="NPFSG00"/>
      </pattern>
      <disambig action="add">
        <wd pos="allow_masculine"/>
      </disambig>
    </rule>
  </rulegroup>
  <rulegroup id="mon_ton_son" name="mon ton son: no són determinants si no han concordat">
    <rule>
<pattern> <token postag="DP.MS.*" postag_regexp="yes"><exception postag="_GN_MS"/></token> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> <rule> <pattern> <token postag="DP.FS.*" postag_regexp="yes"><exception postag="_GN_FS"/></token> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> <rule> <pattern> <token postag="DP.MP.*" postag_regexp="yes"><exception postag="_GN_MP"/></token> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> <rule> <pattern> <token postag="DP.FP.*" postag_regexp="yes"><exception postag="_GN_FP"/></token> </pattern> <disambig action="filter" postag="[^D].*"/> </rule> </rulegroup> <rulegroup id="una_vegada" name="locució una vegada/volta/cop"> <rule> <pattern> <token>una</token> <marker> <token regexp="yes" skip="2">vegada|volta</token> </marker> <token postag="_GN_.*|V.[PSI].*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_loc_unavegada"/> </disambig> </rule> <rule> <pattern> <token>un</token> <marker> <token skip="2" regexp="yes">col?p</token> </marker> <token postag="_GN_.*|V.[PSI].*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_loc_unavegada"/> </disambig> </rule> </rulegroup> <rulegroup id="tant_x_com" name="tant + __ + com + __"> <rule> <!-- Dificultats: és tan(t) important com bonic --> <pattern> <marker> <token>tant</token> </marker> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes" skip="20"/> <token>com</token> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <pattern> <marker> <token>tant</token> </marker> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes" skip="20"/> <token>com</token> <token>no</token> <token postag="A.*|V.P.*|PX.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <!-- tant partidaris com opositors --> <pattern> <marker> <token>tant</token> </marker> <token postag="N.*" 
postag_regexp="yes" skip="20"/> <token>com</token> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <!-- tant partidaris com altres opositors --> <pattern> <marker> <token>tant</token> </marker> <token postag="N.*" postag_regexp="yes" skip="20"/> <token>com</token> <token postag="[AD].*" postag_regexp="yes"/> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" skip="1">tant?|tantes|tants</token> <token postag="N.*" postag_regexp="yes" skip="20"/> <marker> <token>com</token> </marker> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_com"/> </disambig> </rule> <rule> <pattern> <marker> <token>tant</token> </marker> <token postag="N.*" postag_regexp="yes" skip="20"/> <token>com</token> <token>no</token> <token postag="N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <pattern> <marker> <token>tant</token> </marker> <token regexp="yes" skip="20">\p{Lu}.*</token> <token>com</token> <token regexp="yes">\p{Lu}.*</token> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <!-- Tant fora com dins del Japó --> <pattern> <marker> <token>tant</token> </marker> <token min="0">a</token> <token postag="RG|.*LOC_ADV.*" postag_regexp="yes" skip="20"/> <token>com</token> <token min="0">a</token> <token postag="RG|.*LOC_ADV.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <!-- Tant jurídicament com en la realitat --> <pattern> <marker> <token>tant</token> </marker> <token postag="RG" skip="20"/> <token>com</token> <token postag="SPS00"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <!-- coneixements tant científics com de les més variades disciplines--> <pattern> 
<marker> <token>tant</token> </marker> <token postag="A.*|V.P.*" postag_regexp="yes" skip="20"/> <token>com</token> <token inflected="yes">de</token> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <pattern> <marker> <token>tant</token> </marker> <token postag="SPS00|.*LOC_PREP.*" postag_regexp="yes" skip="20"/> <token>com</token> <token postag="SPS00|.*LOC_PREP.*|RG" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="allow_tant"/> </disambig> </rule> <rule> <pattern> <token>tant</token> <token postag="DA.*" postag_regexp="yes" skip="5"/> <marker> <token>com</token> </marker> <token postag="DA.*" postag_regexp="yes" skip="5"/> </pattern> <disambig action="replace"> <wd pos="CC"/> </disambig> </rule> <rule> <pattern> <token postag="allow_tant" skip="21">tant</token> <marker> <token>com</token> </marker> </pattern> <disambig action="filter" postag="RG|allow_com"/> </rule> </rulegroup> <rulegroup id="com_més__més" name="com més __ + més +adj"> <rule> <pattern> <token>com</token> <token skip="-1" regexp="yes">més|menys</token> <token regexp="yes">més|menys</token> <marker> <token postag="AQ.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="ignore_concordance"/> </disambig> </rule> </rulegroup> <rule id="TAL" name="tal (no pronom)"> <pattern> <and> <token inflected="yes">tal</token> <token postag="_GN_.*" postag_regexp="yes"/> </and> </pattern> <disambig action="remove" postag="PD.*|RG.*"/> </rule> <rulegroup id="QUE_COMPARATIU" name="'que' com a comparatiu"> <!-- Excepcions amb "tenir, haver-hi, trobar..." ?? --> <!-- arriba un |moment|instant, tal punt no tenia cap altra missió que inculcar-li disciplina, no tenia cap altra missió que inculcar-li, cap altre objectiu... 
hi ha evidències que ingerir àcid palmític incrementa el risc hi ha evidències que considerar abans, d'acord que copiar-les de manera que situar-les /resolt La possibilitat teòrica i tècnica que viatjar en el temps ens permetés Després d'arribar a la conclusió que ser un músic i un artista era el mateix L'afer es complica pel fet que marcar o desmarcar-se d'un usuari com "amic" --> <rule> <pattern> <token regexp="yes">més|menys</token> <token postag="[AN].*|V.P.*" postag_regexp="yes"/> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"><exception>haver</exception></token> </pattern> <disambig action="add"> <wd pos="comparatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" regexp="yes" skip="5">tenir|trobar<exception scope="next" inflected="yes" regexp="yes">&exceptions_QUE_COMPARATIU;</exception></token> <marker> <token>que<exception postag="comparatiu"/></token> </marker> <token postag="V.N.*" postag_regexp="yes"><exception>haver</exception></token> </pattern> <disambig action="add"> <wd pos="no_comparatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token skip="1">hi</token> <token inflected="yes" skip="5">haver<exception scope="next" inflected="yes" regexp="yes">&exceptions_QUE_COMPARATIU;</exception></token> <marker> <token>que<exception postag="comparatiu"/></token> </marker> <token postag="V.N.*" postag_regexp="yes"><exception>haver</exception></token> </pattern> <disambig action="add"> <wd pos="no_comparatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes">haver</token> <token skip="5">-hi<exception scope="next" inflected="yes" regexp="yes">&exceptions_QUE_COMPARATIU;</exception></token> <marker> <token>que<exception postag="comparatiu"/></token> </marker> <token postag="V.N.*" postag_regexp="yes"><exception>haver</exception></token> </pattern> <disambig action="add"> <wd pos="no_comparatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" 
skip="5" regexp="yes">arribar|des</token> <token regexp="yes">moments?|instants?|punts?</token> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="relatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="1">haver</token> <token>dubte</token> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="relatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="1" regexp="yes">fer|donar</token> <token regexp="yes">efecte|impressió</token> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="relatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="1">fer</token> <token regexp="yes" inflected="yes">&unitats_temps;|&periodes_temps;</token> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="relatiu" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="5" regexp="yes">fet|possibilitat|conclusió|evidència|prova|acord</token> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="conjuncio" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="10" regexp="yes">concloure|conclusió|evidència|pressentir|pressentiment|sensació|sospitar|sospita|dir|sostenir|afirmar|aclarir|explicar|contar|pensar|creure</token> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="conjuncio" lemma="que"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" regexp="yes" skip="20">abans|més|menys|altre|mateix|igual|major|menor|tan|tant|pitjor|millor</token> <marker> <token>que<exception postag="no_comparatiu"/></token> 
</marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="comparatiu"/> </disambig> </rule> <rule> <pattern> <marker> <token>que<exception postag="no_comparatiu"/></token> </marker> <token postag="V.N.*" postag_regexp="yes" skip="15"/> <token inflected="yes" regexp="yes">més|menys|altre|mateix|igual|major|menor|tan|tant|pitjor|millor</token> </pattern> <disambig action="add"> <wd pos="comparatiu"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START" skip="-1"/> <token postag="V.N.*" postag_regexp="yes" skip="10"><exception scope="previous" postag="VA.*" postag_regexp="yes"/><exception>haver</exception></token> <marker> <token>que</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="comparatiu"/> </disambig> </rule> </rulegroup> <rule id="REPEATED_NEGATION" name="negació repetida"> <pattern> <token skip="5">no<exception scope="next" postag="_PUNCT.*" postag_regexp="yes"/></token> <marker> <token>no</token> </marker> </pattern> <disambig action="add"> <wd pos="repeated_negation"/> </disambig> </rule> <rule id="REPEATED_QUAN" name="'quan' repetit"> <pattern> <token skip="25">quan<exception scope="next" postag="_PUNCT.*" postag_regexp="yes"/></token> <marker> <token>quan</token> </marker> </pattern> <disambig action="add"> <wd pos="repeated"/> </disambig> </rule> <rulegroup id="meitat_meitat" name="meitat home meitat dona"> <rule> <pattern> <marker> <token skip="3">meitat</token> </marker> <token>meitat</token> </pattern> <disambig action="add"> <wd pos="_loc_meitat"/> </disambig> </rule> <rule> <pattern> <token skip="3">meitat</token> <marker> <token>meitat</token> </marker> </pattern> <disambig action="add"> <wd pos="_loc_meitat"/> </disambig> </rule> </rulegroup> <rulegroup id="NO_RELATIU" name="no hi ha estructura de relatiu"> <rule> <pattern> <token>d'</token> <token>acord</token> <marker> <token regexp="yes">en|amb|sobre</token> </marker> </pattern> <disambig 
action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">desacord|compte</token> <marker> <token regexp="yes">amb|sobre</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">en|per</token> <token regexp="yes">comparació|contraposició</token> <marker> <token regexp="yes">amb|de|d'|a</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">combinar|relacionar</token> <marker> <token>amb</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">en|amb</token> <token>relació</token> <marker> <token regexp="yes">amb|a</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes">corresponent|invers|dret|referent|proper|pròxim|previ|oposar|contrari|igual|similar|semblant|anàleg|idèntic|equivalent|equiparable|alternatiu|superior|inferior|paral·lel|anterior|posterior|parèixer</token> <marker> <token>a</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" regexp="yes">donar|fer</token> <token regexp="yes">origen|front</token> <marker> <token>a</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token inflected="yes" skip="1">fer</token> <token regexp="yes">cas|càrrec|esment</token> <marker> <token regexp="yes">a|de|d'</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">.*%|abans|després|compliment|complement|equivalent|part|comparació|diferents?|distint(s|a|es)?|nord|sud|oest|est|centre|doble|triple|precedent|millor|contraris?</token> <marker> <token>de</token> </marker> </pattern> 
<disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token skip="4" regexp="yes" inflected="yes">distingir|diferenciar|separar|destriar</token> <marker> <token>de</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token skip="1" inflected="yes">exemple</token> <marker> <token>de</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" skip="5">més|menys</token> <marker> <token>de</token> </marker> <token postag="DA.*" postag_regexp="yes"/> <token>que</token> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token>a</token> <token min="0">l'</token> <token regexp="yes">tenor|efecte</token> <marker> <token>de</token> </marker> <token postag="DA.*" postag_regexp="yes"/> <token>que</token> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <marker> <token>pe</token> </marker> <token>l</token> <token>que</token> <token regexp="yes">fa|feia</token> <token>a</token> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <marker> <token>excepte</token> </marker> <token postag="DA.*" postag_regexp="yes"/> <token>que</token> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">sense?</token> <token regexp="yes">perjudici|perjuí</token> <marker> <token>de</token> </marker> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">de|a|amb|pe</token> </marker> <token postag="DA0MS0"/> <token>que</token> <token>es</token> <token regexp="yes">disposa|preveu</token> <token regexp="yes">en|a</token> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="SPS00"/> </marker> <token 
min="0">a</token> <token regexp="yes">l|el</token> <token>que</token> <token inflected="yes" regexp="yes">quedar|restar</token> <token regexp="yes">de|d'</token> </pattern> <disambig action="add"> <wd pos="_no_relatiu"/> </disambig> </rule> </rulegroup> <rulegroup id="de_complement_directe" name="de complement directe: mireu de trobar"> <rule> <pattern> <token inflected="yes" regexp="yes" skip="5">mirar|intentar|permetre|decidir<exception scope="next">que</exception></token> <marker> <token regexp="yes">de|d'</token> </marker> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_complement_directe"/> </disambig> </rule> </rulegroup> <rulegroup id="INTERROGATIUS" name="pronoms interrogatius"> <rule id="qui" name="els qui"> <pattern> <token postag="D[DA].*" postag_regexp="yes"/> <marker> <and> <token postag="PT.*" postag_regexp="yes">qui</token> <token postag="PR.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="PR.*"/> </rule> <rule id="QUAN_INTERROGATIU" name="'quan' interrogatiu"> <pattern> <marker> <token>quan</token> </marker> <token postag="SENT_END|CC|_PUNCT.*" postag_regexp="yes"/> </pattern> <disambig action="filter" postag="PT.*"/> </rule> </rulegroup> <rule id="US_FEU_AMB" name="feu 2P/3S"> <pattern> <token regexp="yes">us|vos</token> <marker> <token skip="3">feu</token> </marker> <token>amb</token> </pattern> <disambig action="remove" postag="VMIS3S00"/> </rule> <rule id="verb_start" name="verb al principi de frase"> <pattern> <token postag="SENT_START"/> <token min="0" max="3" regexp="yes">\p{P}</token> <marker> <token postag="V.[IM].*" postag_regexp="yes"><exception postag_regexp="yes" postag="_GN_.*"/><exception>visca</exception></token> </marker> <token postag="_GN_.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="NC.*|A.*"/> </rule> <rulegroup id="SUBJUNTIU_IMPERATIU" name="subjuntiu/imperatiu"> <rule> <antipattern> <token>es</token> <token postag="V.S.*" 
postag_regexp="yes" skip="20"/> <token>o</token> </antipattern> <pattern> <token postag="SENT_START"/> <token postag="&pronom_feble;" postag_regexp="yes"/> <marker> <and> <token postag="V.S.*" postag_regexp="yes"/> <token postag="V.I.*" postag_regexp="yes"><exception>revistes</exception></token> </and> </marker> </pattern> <disambig action="remove" postag="V.S.*"/> </rule> <rule id="subj_imp_valencia" name="verb subjuntiu (valencià) i imperatiu (general): digues, sigues"> <pattern> <token postag="PR.*" postag_regexp="yes" skip="2"><exception scope="next" postag="&pronom_feble;|SENT_END|V.*|_GV_" postag_regexp="yes" negate_pos="yes"/></token> <marker> <and> <token postag="V.S.*" postag_regexp="yes"><exception postag="V.I.*" postag_regexp="yes"/></token> <token postag="V.M.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="V.S.*"/> </rule> <rule id="no_subj_imp" name="no + subjuntiu/imperatiu"> <pattern> <token skip="2">no<exception scope="next" postag="&pronom_feble;|SENT_END|V.*|_GV_" postag_regexp="yes" negate_pos="yes"/></token> <marker> <and> <token postag="V.S.*" postag_regexp="yes"/> <token postag="V.M.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="V.[^M].*"/> </rule> <rule> <pattern> <token postag="SENT_START"/> <marker> <and> <token postag="V.S.*" postag_regexp="yes"><exception postag="V.I.*" postag_regexp="yes"/></token> <token postag="V.M.*" postag_regexp="yes"><exception inflected="yes">heure</exception></token> </and> </marker> </pattern> <disambig action="remove" postag="V.S.*"/> </rule> <rule> <pattern> <token regexp="yes">[;,\(]</token> <marker> <and> <token postag="V.S.*" postag_regexp="yes"><exception>haguem</exception></token> <token postag="V.M.*" postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.S.*"/> </rule> <rule> <pattern> <token postag="SENT_START" skip="-1"><exception scope="next" postag="CS|PR.*" postag_regexp="yes"/></token> 
<marker> <and> <token postag="VMIP..00" postag_regexp="yes"/> <token postag="VMSP..0V" postag_regexp="yes"><exception>revistes</exception></token> </and> </marker> </pattern> <disambig action="remove" postag=".*V"/> </rule> <rule> <pattern> <token regexp="yes">que|quals?</token> <token min="0" postag="&pronom_feble;" postag_regexp="yes"/> <marker> <token postag="V.I.*" postag_regexp="yes">té</token> </marker> </pattern> <disambig action="filter" postag="V.I.*"/> </rule> </rulegroup> <rulegroup id="primera_tercera_persona" name="verb primera o tercera persona"> <rule> <pattern> <token regexp="yes">es|se|s'|hom|ella?</token> <marker> <and> <token postag="V...1S.." postag_regexp="yes"/> <token postag="V...3S.." postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="V...[^1]...|_.*"/> </rule> <rule> <pattern> <token regexp="yes">se|s'|hom|ella?</token> <token postag="&pronom_feble;|PP[12]C[SP]000" postag_regexp="yes"/> <marker> <and> <token postag="V...1S.." postag_regexp="yes"/> <token postag="V...3S.." 
postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="filter" postag="V...[^1]...|_.*"/> </rule> </rulegroup> <rulegroup id="HAC_ASPIRADA" name="hac aspirada inicial"> <rule> <pattern> <token postag="NP.*" postag_regexp="yes" regexp="yes">(?-i)Han<exception postag="_GV_"/></token> </pattern> <disambig action="add"> <wd pos="hac_aspirada"/> </disambig> </rule> <rule> <pattern> <token postag="I">ha<exception postag="_GV_"/></token> </pattern> <disambig action="add"> <wd pos="hac_aspirada"/> </disambig> </rule> </rulegroup> <!-- <rulegroup id="MOT_FORASTER" name="paraula no catalana"> <rule> <pattern> <token postag="UNKNOWN" regexp="yes">.*ñ.*|.*á.*|.+ón|.+ía|.+íes|.+ch.+</token> </pattern> <disambig action="add"><wd pos="mot_foraster"></wd></disambig> </rule> <rule> <pattern> <token>agua</token> </pattern> <disambig action="add"><wd pos="mot_foraster"></wd></disambig> </rule> </rulegroup> --> <rulegroup id="persona13" name="persona 1/3"> <rule> <pattern> <marker> <and> <token postag="VM..1S0." postag_regexp="yes" inflected="yes" skip="3">caure</token> <token postag="VM..3S0." postag_regexp="yes"/> </and> </marker> <token postag="PD.*|PI.*|_GN.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="VM..1S0."/> </rule> <rule> <pattern> <marker> <and> <token postag="VM..1S0." postag_regexp="yes" inflected="yes">venir</token> <token postag="VM..3S0." postag_regexp="yes"/> </and> </marker> <token postag="PD.*|PI.*|_GN.*" postag_regexp="yes"/> </pattern> <disambig action="remove" postag="VM..1S0."/> </rule> <rule> <pattern> <token><exception>jo</exception></token> <marker> <and> <token postag="VM..1S0." postag_regexp="yes" inflected="yes" skip="3" regexp="yes">caure|venir|anar</token> <token postag="VM..3S0." postag_regexp="yes"/> </and> </marker> <token regexp="yes" inflected="yes">bé|de gust</token> </pattern> <disambig action="remove" postag="VM..1S0."/> </rule> <rule> <pattern> <marker> <and> <token postag="VA..1S0." 
postag_regexp="yes" inflected="yes" skip="3">haver</token> <token postag="VA..3S0." postag_regexp="yes"/> </and> </marker> <token regexp="yes">caigut|vingut|anat</token> <token regexp="yes" inflected="yes">bé|de gust</token> </pattern> <disambig action="remove" postag="VA..1S0."/> </rule> <rule> <pattern> <token postag="N..[SN].*|_GN_.S|PI..[SN].*|_possible_nompropi|UNKNOWN" postag_regexp="yes"><exception regexp="yes">dia|any|mes|segle|&dies_setmana;|&mesos_any;</exception></token> <token min="0" max="3" postag="&pronom_feble;|R.*" postag_regexp="yes"><exception postag="P010S000"/></token> <marker> <and> <token postag="V.[SI].1S.." postag_regexp="yes"><exception postag="VMIP1S0V"/></token> <token postag="V.[SI].3S.." postag_regexp="yes"><exception>viu</exception></token> </and> </marker> </pattern> <disambig action="remove" postag="V.[SI].1S.."/> </rule> <rule> <pattern> <token postag="N..[SN].*|_GN_.S|PI..[SN].*|_possible_nompropi|UNKNOWN" postag_regexp="yes"><exception regexp="yes">dia|any|mes|segle|&dies_setmana;|&mesos_any;</exception></token> <token min="0" max="3" postag="&pronom_feble;|R.*" postag_regexp="yes"/> <marker> <and> <token postag="V.[SI].1S.." postag_regexp="yes" inflected="yes" regexp="yes">portar|dur<exception postag="VMIP1S0V"/></token> <token postag="V.[SI].3S.." postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[SI].1S.."/> </rule> <rule> <pattern> <token postag="N..[SN].*|_GN_.S|PI..[SN].*|_possible_nompropi|UNKNOWN" postag_regexp="yes"><exception regexp="yes">dia|any|mes|segle|&dies_setmana;|&mesos_any;</exception></token> <token min="0" max="3" postag="&pronom_feble;|R.*" postag_regexp="yes"/> <marker> <and> <token postag="V.[SI].1S.." postag_regexp="yes"><exception postag="VMIP1S0V"/></token> <token postag="V.[SI].3S.." 
postag_regexp="yes"/> </and> </marker> <token inflected="yes" regexp="yes">portar|dur</token> </pattern> <disambig action="remove" postag="V.[SI].1S.."/> </rule> <rule> <pattern> <token regexp="yes">ho|'l|'ls|la|les|'n</token> <marker> <and> <token postag="V.[SI].1S.." postag_regexp="yes" inflected="yes" regexp="yes">portar|dur<exception postag="VMIP1S0V"/></token> <token postag="V.[SI].3S.." postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[SI].1S.."/> </rule> <rule> <pattern> <token postag="V...1S.." postag_regexp="yes" skip="4"/> <token>que</token> <token>em</token> <marker> <and> <token postag="V.[SI].1S.." postag_regexp="yes" inflected="yes" regexp="yes">portar|dur<exception postag="VMIP1S0V"/></token> <token postag="V.[SI].3S.." postag_regexp="yes"/> </and> </marker> </pattern> <disambig action="remove" postag="V.[SI].1S.."/> </rule> <rule> <pattern> <token regexp="yes">ho|'l|'ls|la|les|'n|l'|els</token> <marker> <and> <token postag="V.[SI].1S.." postag_regexp="yes"><exception postag="VMIP1S0V"/></token> <token postag="V.[SI].3S.." postag_regexp="yes"/> </and> </marker> <token inflected="yes" regexp="yes">portar|dur</token> </pattern> <disambig action="remove" postag="V.[SI].1S.."/> </rule> <rule> <pattern> <token regexp="yes">algú|algun|jo|mi|ella?|vostè|vosté|vós</token> <token min="0" max="3" postag="&pronom_feble;|R.*" postag_regexp="yes"/> <and> <token postag="V.[SI].1S.." postag_regexp="yes"/> <token postag="V.[SI].3S.." 
postag_regexp="yes"/> </and> </pattern> <disambig action="remove" postag="V.[SI].1S.."/> </rule> </rulegroup> <rulegroup id="verb_reflexiu_simple" name="verb acompanyat de pronom reflexiu"> <rule> <!--<antipattern> <!-\- TODO: generalitzar -\-> <token regexp="yes">això|aço|allò|ell|ella</token> <token regexp="yes">m'|em</token> </antipattern>--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0.0.*" postag_regexp="yes"><exception regexp="yes">['-].*</exception></token> <unify-ignore> <token min="0" postag_regexp="yes" postag="&pronom_feble;"/> </unify-ignore> <marker> <token postag="V.[SI].*" postag_regexp="yes"/> </marker> </unify> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- queixeu-vos --> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <marker> <token postag="V.M.*" postag_regexp="yes"/> </marker> <token postag="P0.0.*" postag_regexp="yes" spacebefore="no"/> </unify> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- aneu-vos a queixar --> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="V.M.*" postag_regexp="yes" inflected="yes">anar</token> <token postag="P0.0.*" postag_regexp="yes" spacebefore="no" skip="2"/> </unify> <token>a</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- vas queixar-te--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="V.[SIM].*" postag_regexp="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;|&elements_perifrasis_verbals2;</token> <unify-ignore> <marker> <token postag="V.[NG].*" postag_regexp="yes"/> </marker> </unify-ignore> <token postag="P0.0.*" postag_regexp="yes" spacebefore="no"/> </unify> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- fugiren emportant-se--> <pattern> 
<unify>
        <feature id="nombre"/>
        <feature id="persona"/>
        <token postag="V.[SIM].*" postag_regexp="yes"/>
        <token min="0" postag="V.[NP].*" postag_regexp="yes"/>
        <unify-ignore>
          <marker>
            <token regexp="yes">emportant|enduent</token>
          </marker>
        </unify-ignore>
        <token postag="P0.0.*" postag_regexp="yes" spacebefore="no"/>
      </unify>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
</rulegroup>
<rulegroup id="verb_reflexiu" name="verb acompanyat de pronom reflexiu">
  <!-- Group-level antipatterns. Most of them pair a trigger word (matched by lemma) with a
       following token that matches anything except the listed exceptions. -->
  <antipattern>
    <token inflected="yes">haver</token>
    <token><exception inflected="yes" regexp="yes">de|pas</exception><exception postag="V.P.*" postag_regexp="yes"/></token>
  </antipattern>
  <antipattern>
    <token inflected="yes" regexp="yes">tornar|tendir|arribar|aplegar</token>
    <token><exception>a</exception><exception postag="RG"/></token>
  </antipattern>
  <antipattern>
    <token inflected="yes" regexp="yes">començar|venir</token>
    <token><exception>a</exception><exception postag="V.G.*|P0.*" postag_regexp="yes"/></token>
  </antipattern>
  <antipattern>
    <token inflected="yes" regexp="yes">deixar|parar|mirar|tractar</token>
    <token><exception inflected="yes">de</exception><exception postag="P0.0.*" postag_regexp="yes"/></token>
  </antipattern>
  <antipattern>
    <token regexp="yes" inflected="yes">a|de|amb</token>
    <token><exception postag_regexp="yes" postag="V.N.*"/></token>
  </antipattern>
  <!-- Lemma alternation: the verb is spelled "encantar", as in the lemma lists of the rules
       further down in this group. -->
  <antipattern>
    <token regexp="yes" inflected="yes">&elements_perifrasis_verbals2;|agradar|encantar|encisar</token>
    <token><exception postag_regexp="yes" postag="V.N.*|RG|LOC_ADV"/><exception inflected="yes" regexp="yes">de|a|per</exception></token>
  </antipattern>
  <antipattern>
    <token>prou</token>
    <token><exception regexp="yes" inflected="yes">a|de|amb</exception></token>
  </antipattern>
  <antipattern>
    <token inflected="yes">fer</token>
    <token><exception>bé</exception></token>
  </antipattern>
  <antipattern>
    <token inflected="yes">fer</token>
    <token>bé</token>
    <token><exception inflected="yes">de</exception></token>
</antipattern> <antipattern> <token inflected="yes">optar</token> <token><exception>per</exception></token> </antipattern> <antipattern> <token>per</token> <token><exception postag="V.N.*" postag_regexp="yes"/></token> </antipattern> <!--<antipattern> <token inflected="yes">en<exception scope="previous" postag="P0.*" postag_regexp="yes"/></token> <token><exception>prou</exception><exception postag="V.[SI].*" postag_regexp="yes"/></token> </antipattern>--> <antipattern> <token inflected="yes" regexp="yes">continuar|seguir|prosseguir</token> <token><exception postag="V.G.*|RG|LOC_ADV" postag_regexp="yes"/></token> </antipattern> <antipattern> <token inflected="yes">acabar</token> <token><exception postag="V.G.*|RG|LOC_ADV" postag_regexp="yes"/><exception inflected="yes">de</exception></token> </antipattern> <antipattern> <token postag="CC"/> </antipattern> <rule> <!--<antipattern> <!-\- TODO: generalitzar -\-> <token regexp="yes">això|aço|allò|ell|ella</token> <token regexp="yes">m'|em</token> </antipattern>--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0.0.*" postag_regexp="yes"><exception regexp="yes">['-].*</exception></token> <unify-ignore> <token min="0" postag_regexp="yes" postag="&pronom_feble;"/> </unify-ignore> <token postag="V.[SI].*" postag_regexp="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;</token> </unify> <token postag="V.[NP].*|SPS00|R.|PP3.*|LOC_ADV" postag_regexp="yes" min="0" max="7"><exception postag="V.[NGP].*" postag_regexp="yes" negate="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;|ser</exception></token> <marker> <token postag="V.[NGP].*" postag_regexp="yes"><exception regexp="yes" inflected="yes">&elements_perifrasis_verbals;</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="V.[MSI].*" postag_regexp="yes" inflected="yes" 
regexp="yes">&elements_perifrasis_verbals;|&elements_perifrasis_verbals2;</token>
        <unify-ignore>
          <token postag="V.[NP].*|SPS00|R.|PP3.*|LOC_ADV" postag_regexp="yes" min="0" max="6"><exception postag="V.[NGP].*" postag_regexp="yes" negate="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;|&elements_perifrasis_verbals2;</exception></token>
          <marker>
            <token postag="V.[NG].*" postag_regexp="yes"><exception regexp="yes" inflected="yes">&elements_perifrasis_verbals;|&elements_perifrasis_verbals2;</exception></token>
          </marker>
        </unify-ignore>
        <token postag="P0.0.*" postag_regexp="yes" spacebefore="no"/>
      </unify>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "has de poder-te queixar" (you must be able to complain).
         The marked infinitive receives the added _reflexiu reading. -->
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="persona"/>
        <token postag="V.[SI].*" postag_regexp="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;</token>
        <unify-ignore>
          <token postag="V.[NP].*|SPS00|LOC_ADV|R.|PP3.*" postag_regexp="yes" min="0" max="5"/>
        </unify-ignore>
        <token postag="P0.0.*" postag_regexp="yes" spacebefore="no" skip="2"><exception scope="next" postag="PP.*|V.N.*|SPS00" postag_regexp="yes" negate_pos="yes"/><exception scope="next">per</exception></token>
      </unify>
      <marker>
        <token postag="V.N.*" postag_regexp="yes"/>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "has de començar-te a queixar" (you must start complaining). -->
    <!-- The two entity lists are lemma alternations, so they must be joined with "|";
         written back to back, the last lemma of the first list would fuse with the
         first lemma of the second. -->
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="persona"/>
        <token postag="V.[SI].*" postag_regexp="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;|&elements_perifrasis_verbals2;</token>
        <unify-ignore>
          <token postag="V.[NP].*|SPS00|R.|LOC_ADV|PP3.*" postag_regexp="yes" min="0" max="5"><exception postag="V.N.*" postag_regexp="yes" inflected="yes" regexp="yes">començar|tornar|deixar</exception></token>
          <token postag="V.N.*" postag_regexp="yes" inflected="yes" regexp="yes">començar|tornar|deixar</token>
        </unify-ignore>
        <token postag="P0.0.*"
postag_regexp="yes" spacebefore="no"/>
      </unify>
      <token inflected="yes" regexp="yes">a|de</token>
      <marker>
        <token postag="V.N.*" postag_regexp="yes"/>
      </marker>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "m'agrada queixar-me" (I like to complain).
         The first- or second-person pronoun before the verb is unified in number and
         person with the pronoun attached to the marked infinitive. -->
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="persona"/>
        <token postag="P0[12]0.*" postag_regexp="yes"/>
        <unify-ignore>
          <!-- Lemma alternation; the verb is spelled "encantar", as in the next rule's list. -->
          <token postag="V.[SI].3S.." postag_regexp="yes" inflected="yes" regexp="yes" skip="4">agradar|encantar|encisar|caldre|convenir|permetre|costar</token>
          <marker>
            <token postag="V.N.*" postag_regexp="yes"/>
          </marker>
        </unify-ignore>
        <token postag="P0[12]0.*" postag_regexp="yes" spacebefore="no"/>
      </unify>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "m'ha d'agradar queixar-me" (I must like complaining). -->
    <pattern>
      <unify>
        <feature id="nombre"/>
        <feature id="persona"/>
        <token postag="P0[12]0.*" postag_regexp="yes"/>
        <unify-ignore>
          <token postag="V.[SI].3S.." postag_regexp="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;</token>
          <token postag="V.[NP].*|SPS00|R.|LOC_ADV" postag_regexp="yes" min="0" max="5"/>
          <token postag="V.[NP].*" postag_regexp="yes" inflected="yes" regexp="yes" skip="3">agradar|encisar|encantar|caldre|convenir|permetre</token>
          <marker>
            <token postag="V.N.*" postag_regexp="yes"/>
          </marker>
        </unify-ignore>
        <token postag="P0[12]0.*" postag_regexp="yes" spacebefore="no"/>
      </unify>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "li agrada queixar-se" (he/she likes to complain). -->
    <pattern>
      <token regexp="yes">li|els</token>
      <token postag="V.[SI].3S.."
postag_regexp="yes" inflected="yes" regexp="yes" skip="4">agradar|encantar|encisar|caldre|convenir|permetre</token>
      <!-- The verb token above is a lemma alternation; "encantar" is spelled as in the
           lemma list of the next rule. -->
      <marker>
        <token postag="V.N.*" postag_regexp="yes"/>
      </marker>
      <token postag="P0300000" spacebefore="no"/>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "li ha d'agradar queixar-se" (he/she must like complaining). -->
    <pattern>
      <token regexp="yes">li|els</token>
      <token postag="V.[SI].3S.." postag_regexp="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;</token>
      <token postag="V.[NP].*|SPS00|R.|LOC_ADV" postag_regexp="yes" min="0" max="5"/>
      <token postag="V.[NP].*" postag_regexp="yes" inflected="yes" regexp="yes" skip="3">agradar|encisar|encantar|caldre|convenir|permetre</token>
      <marker>
        <token postag="V.N.*" postag_regexp="yes"/>
      </marker>
      <token postag="P0300000" spacebefore="no"/>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "Els animem a queixar-se." (We encourage them to complain.) -->
    <pattern>
      <token regexp="yes" skip="1">els|la|l'|les|el</token>
      <token inflected="yes" regexp="yes" skip="4">animar|impulsar|obligar|impel·lir|induir|acusar|conduir|portar|dur|menar|guiar</token>
      <token postag="SPS00" regexp="yes" inflected="yes">a|de</token>
      <marker>
        <token postag="V.N.*" postag_regexp="yes"/>
      </marker>
      <token postag="P0300000" spacebefore="no"/>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "animant-lo a queixar-se." (encouraging him to complain.) -->
    <pattern>
      <token inflected="yes" regexp="yes">animar|impulsar|obligar|impel·lir|induir|acusar|conduir|portar|dur|menar|guiar</token>
      <token spacebefore="no" skip="4" regexp="yes">'l|-lo|'ls|-los</token>
      <token postag="SPS00" regexp="yes" inflected="yes">a|de</token>
      <marker>
        <token postag="V.N.*" postag_regexp="yes"/>
      </marker>
      <token postag="P0300000" spacebefore="no"/>
    </pattern>
    <disambig action="add">
      <wd pos="_reflexiu"/>
    </disambig>
  </rule>
  <rule>
    <!-- Example: "L'animo a continuar esforçant-se." (I encourage him/her to keep making an effort.) -->
    <pattern>
      <token regexp="yes" skip="1">els|la|l'|les|el</token>
      <token
inflected="yes" regexp="yes" skip="4">animar|impulsar|obligar|impel·lir|induir|acusar|conduir|portar|dur|menar|guiar</token> <token postag="SPS00" regexp="yes" inflected="yes">a|de</token> <token postag="V.N.*" postag_regexp="yes"/> <marker> <token postag="V.G.*" postag_regexp="yes"/> </marker> <token postag="P0300000" spacebefore="no"/> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!--Us animem a queixar-vos.--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0[12]0.*" postag_regexp="yes"/> <unify-ignore> <token min="0" postag="VA.*" postag_regexp="yes"/> <token inflected="yes" regexp="yes" skip="4">animar|impulsar|obligar|impel·lir|induir|acusar|conduir|portar|dur|menar|guiar</token> <token postag="SPS00" regexp="yes" inflected="yes" skip="1">a|de</token> <marker> <token postag="V.[NG].*" postag_regexp="yes"><exception inflected="yes" regexp="yes">continuar|seguir|prosseguir|acabar</exception></token> </marker> </unify-ignore> <token postag="P0[12]0.*" postag_regexp="yes" spacebefore="no"/> </unify> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- recomanen abstenir-se.--> <pattern> <token inflected="yes" skip="3">recomanar</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> <token postag="P0300000" spacebefore="no"/> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!--et recomano abstenir-te--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0[12]0.*" postag_regexp="yes"/> <unify-ignore> <token min="0" postag="VA.*" postag_regexp="yes"/> <token inflected="yes" skip="2">recomanar</token> <marker> <token postag="V.[NG].*" postag_regexp="yes"><exception inflected="yes" regexp="yes">continuar|seguir|prosseguir|acabar</exception></token> </marker> </unify-ignore> <token postag="P0[12]0.*" postag_regexp="yes" spacebefore="no"/> </unify> </pattern> <disambig action="add"> 
<wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- se'ns va anar--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0.0.*" postag_regexp="yes"><exception regexp="yes">[-'].*</exception></token> <unify-ignore> <token min="0" postag_regexp="yes" postag="&pronom_feble;"/> </unify-ignore> <token postag="V.[SI].*" postag_regexp="yes" inflected="yes" regexp="yes">&elements_perifrasis_verbals;</token> </unify> <token postag="V.[NP].*|SPS00|R.|PP3.*|LOC_ADV" postag_regexp="yes" min="0" max="6" inflected="yes" regexp="yes">&elements_perifrasis_verbals;<exception postag="V.[NGP].*" postag_regexp="yes" inflected="yes">anar</exception></token> <marker> <token postag="V.[NGP].*" postag_regexp="yes" inflected="yes">anar</token> </marker> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- et veus obligat a autocastigar-te--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0.0.*" postag_regexp="yes"><exception regexp="yes">['-].*</exception></token> <token postag="V.[SI].*" postag_regexp="yes" inflected="yes" regexp="yes">veure|considerar</token> <token postag="V.P.*" postag_regexp="yes"/> <unify-ignore> <token skip="1">a</token> <marker> <token postag="V.[NG].*" postag_regexp="yes"/> </marker> </unify-ignore> <token postag="P0.0.*" postag_regexp="yes" spacebefore="no"/> </unify> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- et veus obligat a queixar-te--> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0.0.*" postag_regexp="yes"><exception regexp="yes">['-].*</exception></token> <token postag="VA[SI].*" postag_regexp="yes"/> <unify-ignore> <token postag="V.[NP].*" postag_regexp="yes" inflected="yes" regexp="yes">veure|considerar</token> </unify-ignore> <token postag="V.P.*" postag_regexp="yes"/> <unify-ignore> <token skip="1">a</token> <marker> <token postag="V.[NG].*" postag_regexp="yes"/> </marker> 
</unify-ignore> <token postag="P0.0.*" postag_regexp="yes" spacebefore="no"/> </unify> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- et veig esforçar-te --> <pattern> <unify> <feature id="nombre"/> <feature id="persona"/> <token postag="P0[12]0.*" postag_regexp="yes"/> <unify-ignore> <token postag="VA.*" postag_regexp="yes" min="0"/> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes" skip="2">veure|sentir|observar</token> <marker> <token postag="V.[NG].*" postag_regexp="yes"/> </marker> </unify-ignore> <token postag="P0[12]0.*" postag_regexp="yes" spacebefore="no"/> </unify> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> <rule> <!-- el veig esforçar-se --> <pattern> <token regexp="yes">el|els|l'</token> <token postag="VA.*" postag_regexp="yes" min="0"/> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes" skip="2">veure|sentir|observar</token> <marker> <token postag="V.[NG].*" postag_regexp="yes"/> </marker> <token postag="P030.*" postag_regexp="yes" spacebefore="no"/> </pattern> <disambig action="add"> <wd pos="_reflexiu"/> </disambig> </rule> </rulegroup> <rulegroup id="reflexiu_complement" name="reflexiu amb complement"> <rule> <!--Els fan/deixen agenollar.--> <pattern> <token postag="PP3..A00|PP3CP000|P0[123].*" postag_regexp="yes"/> <token min="0" postag="VA.*" postag_regexp="yes"/> <token inflected="yes" regexp="yes">deixar|fer</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_reflexiu_complement"/> </disambig> </rule> <rule> <!--fan/deixen agenollar el cavall.--> <pattern> <token inflected="yes" regexp="yes">deixar|fer</token> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> <token postag="PD.*|PI.*|_GN.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_reflexiu_complement"/> </disambig> </rule> <rule> <!-- fes-lo agenollar--> <pattern> <token 
inflected="yes" regexp="yes">deixar|fer</token> <token postag="PP3..A00|PP3CP000|P0[123].*" postag_regexp="yes" spacebefore="no"/> <marker> <token postag="V.N.*" postag_regexp="yes"/> </marker> </pattern> <disambig action="add"> <wd pos="_reflexiu_complement"/> </disambig> </rule> </rulegroup> <rulegroup id="es_personal" name="es (no impersonal)"> <antipattern> <token regexp="yes">per|a</token> <token regexp="yes">motius?|causa|causes</token> </antipattern> <rule> <pattern> <marker> <token inflected="yes" regexp="yes">es|s'</token> </marker> <token postag="VA[SI].3P.." postag_regexp="yes"/> <token inflected="yes">baixar</token> <token inflected="yes">de</token> <token postag="D[^N].*" postag_regexp="yes"/> <token><exception postag="DN.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes" regexp="yes">es|s'</token> </marker> <token postag="VA[SI].3S.." postag_regexp="yes"/> <token inflected="yes">baixar</token> <token inflected="yes">de</token> <token postag="D[^N].*" postag_regexp="yes"/> <token><exception postag="DN.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <antipattern> <token postag="D[^N].*" postag_regexp="yes"/> <token skip="5"/> <token postag="D.*" postag_regexp="yes"/> </antipattern> <pattern> <marker> <token inflected="yes" regexp="yes">es|s'</token> </marker> <token postag="V.[SI].3P.." postag_regexp="yes" inflected="yes">baixar</token> <token inflected="yes">de</token> <token postag="D[^N].*" postag_regexp="yes"/> <token><exception postag="DN.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes" regexp="yes">es|s'</token> </marker> <token postag="V.[SI].3S.." 
postag_regexp="yes" inflected="yes">baixar</token> <token inflected="yes">de</token> <token postag="D[^N].*" postag_regexp="yes"/> <token><exception postag="DN.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes" inflected="yes">pujar</token> <token inflected="yes" regexp="yes">per|a|en</token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes" inflected="yes">anar</token> <token min="0">tot</token> <token>a</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3P.." postag_regexp="yes" inflected="yes">pujar</token> <token inflected="yes" regexp="yes">per|a|en</token> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes" regexp="yes">es|s'</token> </marker> <token postag="VA[SI].3S.." postag_regexp="yes"/> <token inflected="yes">pujar</token> <token inflected="yes" regexp="yes">per|a|en</token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes" regexp="yes">es|s'</token> </marker> <token postag="VA[SI].3P.." postag_regexp="yes"/> <token inflected="yes">pujar</token> <token inflected="yes" regexp="yes">per|a|en</token> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <token>que</token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." 
postag_regexp="yes" inflected="yes">caure</token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <token>que</token> <marker> <token inflected="yes">es</token> </marker> <token postag="VA[SI].3S.." postag_regexp="yes"/> <token inflected="yes">caure</token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START|_PUNCT.*|C.*" postag_regexp="yes"/> <token min="1" max="5" postag="N..[SN].*|_GN_.S|[PD]I..[SN].*|_possible_nompropi|UNKNOWN" postag_regexp="yes"><exception regexp="yes">dia|any|mes|segle|&dies_setmana;|&mesos_any;|&parts_dia;</exception></token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">algú|algun|jo|mi|ella?|vostè|vosté|vós</token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START|_PUNCT.*|C.*" postag_regexp="yes"/> <token min="1" max="5" postag="N..[SN].*|_GN_.S|[PD]I..[SN].*|_possible_nompropi|UNKNOWN" postag_regexp="yes"><exception regexp="yes">dia|any|mes|segle|&dies_setmana;|&mesos_any;|&parts_dia;</exception></token> <token>no</token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">algú|algun|jo|mi|ella?|vostè|vosté|vós</token> <token>no</token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." 
postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <!-- Es va --> <pattern> <token postag="SENT_START" skip="2"/> <marker> <token inflected="yes">es<exception scope="previous">on</exception></token> </marker> <token postag="VM[SI].3S.." postag_regexp="yes">va</token> <token><exception postag="UNKNOWN|V.[GIS].*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <!-- Es va anar--> <pattern> <marker> <token inflected="yes">es</token> </marker> <token>va</token> <token>anar</token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes" inflected="yes">caure</token> <token postag="[ND].*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes" inflected="yes">caure</token> <token regexp="yes">a|en</token> <token regexp="yes">trossos|terra|pedaços</token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es</token> </marker> <token postag="VA[SI].3S.." postag_regexp="yes"/> <token inflected="yes">caure</token> <token postag="[ND].*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es</token> </marker> <token postag="VA[SI].3S.." 
postag_regexp="yes"/> <token inflected="yes">caure</token> <token regexp="yes">a|en</token> <token regexp="yes">trossos|terra|pedaços</token> </pattern> <disambig action="add"> <wd pos="_es_personal_sg"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es<exception postag="_es_personal_sg"/></token> </marker> <token postag="V.[SI].3S.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_impersonal_sg"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START|_PUNCT.*|C.*" postag_regexp="yes"/> <token max="5" postag="N..[PN].*|_GN_.P|[PD]I..[PN].*|_possible_nompropi|UNKNOWN" postag_regexp="yes"><exception regexp="yes">dia|any|mes|segle|&dies_setmana;|&mesos_any;|&parts_dia;</exception></token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3P.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" skip="1">alguns|nosaltres|vosaltres|elle?s|vost[èé]s<exception scope="previous" regexp="yes">en|a</exception></token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3P.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <token postag="SENT_START|_PUNCT.*|C.*" postag_regexp="yes"/> <token max="5" postag="N..[PN].*|_GN_.P|[PD]I..[PN].*|_possible_nompropi|UNKNOWN" postag_regexp="yes"><exception regexp="yes">dia|any|mes|segle|&dies_setmana;|&mesos_any;|&parts_dia;</exception></token> <token>no</token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3P.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" skip="1">alguns|nosaltres|vosaltres|elle?s|vost[èé]s</token> <token>no</token> <marker> <token inflected="yes">es</token> </marker> <token postag="V.[SI].3P.." 
postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_personal_pl"/> </disambig> </rule> <rule> <pattern> <marker> <token inflected="yes">es<exception postag="_es_personal_pl"/></token> </marker> <token postag="V.[SI].3P.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_es_impersonal_pl"/> </disambig> </rule> </rulegroup> <rule id="endurar" name="endur/endurar"> <pattern> <and> <token postag="_reflexiu"/> <token inflected="yes">endurar</token> <token inflected="yes">endur</token> </and> </pattern> <disambig action="remove"> <wd lemma="endurar"/> </disambig> </rule> <rule id="venir_vendre" name="venir/vendre"> <pattern> <marker> <and> <token postag="_reflexiu"/> <token inflected="yes">venir</token> <token inflected="yes">vendre</token> </and> </marker> <token>a</token> <token regexp="yes">sobre|damunt</token> </pattern> <disambig action="remove"> <wd lemma="vendre"/> </disambig> </rule> <rulegroup id="femeni_inusual" name="femení inusual: amor, color..."> <rule> <pattern> <token regexp="yes">&femeni_inusual;<exception postag=".*_GN_.*|.*LOC.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_GN_MS"/> </disambig> </rule> <rule> <pattern> <token regexp="yes">(&femeni_inusual;)s<exception postag=".*_GN_.*|.*LOC.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_GN_MP"/> </disambig> </rule> </rulegroup> <rulegroup id="masculi_inusual" name="masculí inusual: policia, part, justícia..."> <rule> <pattern> <token regexp="yes" inflected="yes" postag="NC.S.*" postag_regexp="yes">&masculi_inusual;<exception postag=".*_GN_.*" postag_regexp="yes"/></token> </pattern> <disambig action="remove" postag="NCM.*"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes" postag="NC.P.*" postag_regexp="yes">&masculi_inusual;<exception postag=".*_GN_.*" postag_regexp="yes"/></token> </pattern> <disambig action="remove" postag="NCM.*"/> </rule> <rule> <pattern> <token regexp="yes" inflected="yes" 
postag="NC.S.*" postag_regexp="yes">&masculi_inusual;<exception postag=".*_GN_.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_GN_FS"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" inflected="yes" postag="NC.P.*" postag_regexp="yes">&masculi_inusual;<exception postag=".*_GN_.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="_GN_FP"/> </disambig> </rule> </rulegroup> <rulegroup id="possible_nom_propi" name="possible nom propi"> <rule> <antipattern> <token postag="SENT_START"/> <token min="1" max="4" regexp="yes">\p{P}</token> <marker> <token postag="AQ.*|DA.*|PP.*|P0.*|V.[GMSIP].*|N.*|RG|DP.*|SPS00|I" postag_regexp="yes" regexp="yes">\p{Lu}.*</token> </marker> </antipattern> <antipattern> <token postag="SENT_START"/> <marker> <token postag="AQ.*|DA.*|PP.*|P0.*|V.[GMSIP].*|N.*|RG|DP.*|SPS00|I" postag_regexp="yes" regexp="yes">\p{Lu}.*</token> </marker> </antipattern> <antipattern> <token regexp="yes">[¿¡"'«»‘“:—–\-]</token> <marker> <token postag="AQ.*|DA.*|PP.*|P0.*|V.[GMSIP].*|N.*|RG|DP.*|SPS00|I" postag_regexp="yes" regexp="yes">\p{Lu}.*</token> </marker> </antipattern> <pattern> <marker> <token postag="AQ.*|DA.*|PP.*|P0.*|V.[GMSIP].*|N.*|RG|DP.*|SPS00|I" postag_regexp="yes" regexp="yes">\p{Lu}.*</token> </marker> </pattern> <disambig action="add"> <wd pos="_possible_nompropi"/> </disambig> </rule> <rule> <antipattern> <token postag="SENT_START"/> <token spacebefore="no">-</token> </antipattern> <pattern> <token spacebefore="no">-</token> <marker> <token spacebefore="no" postag="AQ.*|DA.*|PP.*|P0.*|V.[GMSIP].*|N.*|RG|DP.*|SPS00|I" postag_regexp="yes" regexp="yes">\p{Lu}.*</token> </marker> </pattern> <disambig action="add"> <wd pos="_possible_nompropi"/> </disambig> </rule> <rule> <!-- TODO: why do we need this rule? Is there a SENT_START tag in the wrong place? 
--> <pattern> <token regexp="yes">[ld]'</token> <marker> <token postag="AQ.*|DA.*|PP.*|P0.*|V.[GMSIP].*|N.*|RG|DP.*|SPS00|I" postag_regexp="yes" regexp="yes">\p{Lu}.*</token> </marker> </pattern> <disambig action="add"> <wd pos="_possible_nompropi"/> </disambig> </rule> </rulegroup> <rule id="calen_foc" name="calen foc"> <pattern> <marker> <token>calen</token> </marker> <token>foc</token> </pattern> <disambig action="remove"> <wd lemma="caldre" pos="VMIP3P00"/> </disambig> </rule> <rulegroup id="marca_passat" name="marca de passat (ahir, l'any passat...)"> <rule> <antipattern> <token regexp="yes">com|de</token> <token postag="D.*" postag_regexp="yes" min="0"/> <token regexp="yes" inflected="yes">&dies_setmana;|&mesos_any;|&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;</token> </antipattern> <pattern> <token regexp="yes" inflected="yes">&dies_setmana;|&mesos_any;|&unitats_temps;|&periodes_temps;|&estacions;|&parts_dia;</token> <marker> <token regexp="yes">(prop)?passa(t|ts|da|des)</token> </marker> </pattern> <disambig action="add"> <wd pos="_marca_passat"/> </disambig> </rule> <rule> <pattern> <marker> <token regexp="yes">(despús-|abans-d')?ahir|antany|anit<exception scope="previous" regexp="yes">de|d'</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="_marca_passat"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="LOC_ADV" regexp="yes">fa|feia</token> </marker> </pattern> <disambig action="add"> <wd pos="_marca_passat"/> </disambig> </rule> <rule> <pattern> <token>en</token> <token regexp="yes">el|la</token> <marker> <token regexp="yes">passat|prehistòria</token> </marker> </pattern> <disambig action="add"> <wd pos="_marca_passat"/> </disambig> </rule> </rulegroup> <rulegroup id="lo_admissible" name="Tirant lo Blanc"> <rule> <pattern case_sensitive="yes"> <token>Tirant</token> <marker> <token>lo</token> </marker> <token regexp="yes">Blanch?</token> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern 
case_sensitive="yes"> <token>Déu</token> <marker> <token>lo</token> </marker> <token>guard</token> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern case_sensitive="yes"> <marker> <token>Lo</token> </marker> <token skip="1">Rat</token> <token>Penat</token> </pattern> <disambig action="immunize"/> </rule> </rulegroup> <rulegroup id="DEU_VOS_GUARD" name="Déu vos guard"> <rule> <pattern> <token skip="2">Déu</token> <marker> <token regexp="yes">(re)?guard</token> </marker> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern> <marker> <token>valga</token> </marker> <token regexp="yes">'ns|'m</token> <token>Déu</token> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern> <token>rock</token> <marker> <token regexp="yes">['’]</token> <token>n</token> <token regexp="yes">['’]</token> </marker> <token>roll</token> </pattern> <disambig action="immunize"/> </rule> <rule> <pattern> <token>rock</token> <marker> <token regexp="yes">['’]n</token> <token regexp="yes">['’]</token> </marker> <token>roll</token> </pattern> <disambig action="immunize"/> </rule> </rulegroup> <rulegroup id="QUES" name="quès"> <rule> <pattern> <token regexp="yes">els|ls</token> <marker> <token>quès</token> </marker> <token postag="CC" skip="5"/> <token regexp="yes">perquès|coms|quans</token> </pattern> <disambig action="add"> <wd lemma="què" pos="NCMP000"/> </disambig> </rule> <rule> <pattern> <token regexp="yes" skip="3">perquès|coms|quans</token> <token skip="1" postag="CC"/> <token regexp="yes">els|ls</token> <marker> <token>quès</token> </marker> </pattern> <disambig action="add"> <wd lemma="què" pos="NCMP000"/> </disambig> </rule> </rulegroup> <rulegroup id="allowed_repetitions" name="repeticions permeses"> <!-- girar el cap cap a l’altra persona --> <rule> <pattern> <token spacebefore="no">/</token> <marker> <token case_sensitive="yes" spacebefore="no">a</token> </marker> <token>a</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> 
</disambig> </rule>
<!-- Rules of the "allowed_repetitions" group: each one adds the _allow_repeat tag to the marked token(s) of a repetition that is legitimate in context (or immunizes them). -->
<!-- "seguit seguit": both copies are marked, so both receive the tag. -->
<rule> <pattern> <marker> <token>seguit</token> <token>seguit</token> </marker> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- "de A a": an upper-case "A" (case-sensitive) between "de" and "a". -->
<rule> <pattern> <token>de</token> <marker> <token case_sensitive="yes">A</token> </marker> <token>a</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- "de (any token) a A": the upper-case "A" that follows "a". -->
<rule> <pattern> <token>de</token> <token/> <token>a</token> <marker> <token case_sensitive="yes">A</token> </marker> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- A token made of two or more punctuation characters. -->
<rule> <pattern> <marker> <token regexp="yes">\p{P}\p{P}+</token> </marker> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- ".es es" / ".ES es": a dot plus "es"/"ES" written without spaces, followed by the word "es"; the marked tokens are immunized. -->
<rule> <pattern> <marker> <token spacebefore="no">.</token> <token spacebefore="no" regexp="yes" case_sensitive="yes">es|ES</token> </marker> <token>es</token> </pattern> <disambig action="immunize"/> </rule>
<!-- "si no no" + up to two weak pronouns + a verb whose tag matches V.[SI].* -->
<rule> <pattern> <token>si</token> <marker> <token>no</token> </marker> <token>no</token> <token postag="&pronom_feble;" postag_regexp="yes" min="0" max="2"/> <token postag="V.[SI].*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- "cada un un" / "cada una una": the last token refers back to token 1 (0-based). -->
<rule> <pattern> <token>cada</token> <marker> <token regexp="yes">una?</token> </marker> <token><match no="1"/></token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- "a la pa pa", "a la vi vi"...: the last token refers back to token 2 (0-based). -->
<rule> <pattern> <token>a</token> <token regexp="yes">l|la</token> <marker> <token regexp="yes">pa|vi|peix|pul</token> </marker> <token><match no="2"/></token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- "sapiens sapiens": the last token refers back to token 0. -->
<rule> <pattern> <marker> <token>sapiens</token> </marker> <token><match no="0"/></token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule>
<!-- "somni de Joan Joan": back-references inside a pattern are 0-based in this group (somni=0, de=1, Joan=2), so the repeated word must refer to token 2. The previous value 3 pointed at the referring token itself and therefore did not require a repetition of "Joan". -->
<rule> <pattern> <token>somni</token> <token>de</token> <marker> <token>Joan</token> </marker> <token><match no="2"/></token> </pattern>
<disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- One of the listed words followed by a token that refers back to token 0; the first copy is tagged _allow_repeat. --> <rule> <pattern> <marker> <token regexp="yes">parlant|r[eo]dolant|adés|així|ai|Bío</token> </marker> <token><match no="0"/></token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- "de totes totes": the first "totes" is tagged. --> <rule> <pattern> <token>de</token> <marker> <token>totes</token> </marker> <token>totes</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- "damunt damunt": the first copy is tagged; a preceding "per" token is commented out, so it is not required. --> <rule> <pattern> <!--<token>per</token>--> <marker> <token>damunt</token> </marker> <token>damunt</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- "de de Gaulle": the second "de" is tagged. --> <rule> <pattern> <token>de</token> <marker> <token>de</token> </marker> <token>Gaulle</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- Lower-case "de" followed by capitalised "De" (case-sensitive pattern). --> <rule> <pattern case_sensitive="yes"> <token>de</token> <marker> <token>De</token> </marker> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- "en en" followed by a word starting with an upper-case letter: the second "en" is tagged. --> <rule> <pattern> <token>en</token> <marker> <token>en</token> </marker> <token regexp="yes">\p{Lu}.+</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- "els els" followed by a token whose tag matches V.[IS].*: the first "els" is tagged. --> <rule> <pattern> <marker> <token>els</token> </marker> <token>els</token> <token postag="V.[IS].*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- Upper-case "I" followed by lower-case "i" (case-sensitive); the stricter third token is commented out. --> <rule> <pattern case_sensitive="yes"> <marker> <token>I</token> </marker> <token>i</token> <!-- <token regexp="yes">[A-Z]|(?=.)M{0,4}(CM|CD|D?C{0,3})(XC|XL|L?X{0,3})(IX|IV|V?I{0,3})</token> --> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- Mirror case: lower-case "i" followed by upper-case "I". --> <rule> <pattern case_sensitive="yes"> <!-- <token regexp="yes">[A-Z]|(?=.)M{0,4}(CM|CD|D?C{0,3})(XC|XL|L?X{0,3})(IX|IV|V?I{0,3})</token> --> <marker> <token>i</token> </marker> <token>I</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- <rule> Maximilià I i Joan II.
<pattern case_sensitive="yes"> <token postag="NP..SP." postag_regexp="yes"/> <token regexp="yes">segle|\p{Lu}.+</token> <token>I</token> <marker> <token>i</token> </marker> </pattern> <disambig action="immunize"/> </rule> --> <!-- "de la a a la": the first "a" is tagged. --> <rule> <pattern> <token>de</token> <token>la</token> <marker> <token>a</token> </marker> <token>a</token> <token>la</token> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- "Torres Torres" (case-sensitive): the second copy is tagged. --> <rule> <pattern case_sensitive="yes"> <token>Torres</token> <marker> <token>Torres</token> </marker> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> <!-- "Rin Tin Tin" (case-sensitive): the second "Tin" is tagged. --> <rule> <pattern case_sensitive="yes"> <token>Rin</token> <token>Tin</token> <marker> <token>Tin</token> </marker> </pattern> <disambig action="add"> <wd pos="_allow_repeat"/> </disambig> </rule> </rulegroup> <!-- Temporal adverbial phrases ("some years later", "days before"...): every rule below adds the LOC_ADV_TEMP tag to its marked tokens, one wd element per marked token. --> <rulegroup id="LOC_ADV_TEMPS" name="locacions adverbials de temps, sense filtrar"> <!-- A determiner (tag D[IN].*) not yet tagged LOC_ADV_TEMP and not followed by punctuation, then within the skip windows a time unit or period and "després/abans/enrere..."; only the determiner is marked. --> <rule id="uns__despres" name="uns ... després"> <pattern> <marker> <token postag="D[IN].*" postag_regexp="yes" skip="3"><exception postag="LOC_ADV_TEMP"/><exception scope="next" postag="_PUNCT.*" postag_regexp="yes"/></token> </marker> <token regexp="yes" inflected="yes" skip="2">&unitats_temps;|&periodes_temps;</token> <token regexp="yes">després|abans|(en|ar|endar)(rer[ea])<exception scope="previous" postag="C.*" postag_regexp="yes"/></token> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule> <!-- Same as the previous rule, but the phrase ends with "més" + "tard/avant/endavant/enrere...". --> <rule id="uns__mestard" name="uns ... més tard"> <pattern> <marker> <token postag="D[IN].*" postag_regexp="yes" skip="3"><exception postag="LOC_ADV_TEMP"/><exception scope="next" postag="_PUNCT.*" postag_regexp="yes"/></token> </marker> <token regexp="yes" inflected="yes" skip="2">&unitats_temps;|&periodes_temps;</token> <token>més</token> <token regexp="yes">tard|avant|endavant|(en|ar|endar)(rer[ea])</token> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule> <rule id="anys_despres" name="anys/dies/hores/minuts...
després"> <pattern> <token><exception postag="D[IN].*" postag_regexp="yes"/></token> <marker> <token regexp="yes" inflected="yes" postag="NC.P.*|[PD]I.MS.*" postag_regexp="yes">&unitats_temps;|&periodes_temps;</token> <token regexp="yes">després|abans|enrere|arrere|endarrere</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule> <!-- "més tard" and variants, when the previous token is neither a D[IN] determiner nor a time unit or period. --> <rule id="mes_tard" name="més tard"> <pattern> <token><exception postag="D[IN].*" postag_regexp="yes"/><exception regexp="yes" inflected="yes">&unitats_temps;|&periodes_temps;</exception></token> <marker> <token>més</token> <token regexp="yes">tard|avant|endavant|(en|ar|endar)(rer[ea])</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule> <!-- "prou/bastant/molt més tard": all three tokens are marked. --> <rule id="prou_mes_tard" name="prou més tard"> <pattern> <marker> <token regexp="yes">prou|bastant|molt</token> <token>més</token> <token regexp="yes">tard|avant|endavant|(en|ar|endar)(rer[ea])</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule> <!-- Time unit or period + "més tard" and variants; the preceding token must carry an N.* tag and no D[IN] tag. --> <rule id="anys_mes_tard" name="anys/dies/hores/minuts... més tard"> <pattern> <token postag="N.*" postag_regexp="yes"><exception postag="D[IN].*" postag_regexp="yes"/></token> <marker> <token regexp="yes" inflected="yes">&unitats_temps;|&periodes_temps;</token> <token>més</token> <token regexp="yes">tard|avant|endavant|(en|ar|endar)(rer[ea])</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule> <rule id="uns_anys_mes_tard" name="uns anys/dies/hores/minuts...
més tard"> <pattern> <token><exception postag="D[IN].*" postag_regexp="yes"/></token> <marker> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D[IN].*" postag_regexp="yes"/> <token regexp="yes" inflected="yes">&unitats_temps;|&periodes_temps;</token> </unify> <token>més</token> <token regexp="yes">tard|avant|endavant|(en|ar|endar)(rer[ea])</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule>
<!-- Determiner + time unit (unified in number and gender) + "després/abans/enrere...". The display name now describes this pattern instead of repeating the "més tard" name of the sibling rule. -->
<rule id="uns_anys_despres" name="uns anys/dies/hores/minuts... després"> <pattern> <token><exception postag="D[IN].*" postag_regexp="yes"/></token> <marker> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D[IN].*" postag_regexp="yes"/> <token regexp="yes" inflected="yes">&unitats_temps;|&periodes_temps;</token> </unify> <token regexp="yes">després|abans|(en|ar|endar)(rer[ea])</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule>
<!-- Two determiners + time unit (unified) + "més tard" and variants; five marked tokens, five tags. -->
<rule id="uns_quants_anys_mes_tard" name="uns quants anys/dies/hores/minuts... més tard"> <pattern> <token><exception postag="D[IN].*" postag_regexp="yes"/></token> <marker> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D[IN].*" postag_regexp="yes"/> <token postag="D[IN].*" postag_regexp="yes"/> <token regexp="yes" inflected="yes">&unitats_temps;|&periodes_temps;</token> </unify> <token>més</token> <token regexp="yes">tard|avant|endavant|(en|ar|endar)(rer[ea])</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule>
<!-- Two determiners + time unit (unified) + "després/abans/enrere..."; four marked tokens, four tags. -->
<rule id="uns_quants_anys_despres" name="uns quants anys/dies/hores/minuts... després"> <pattern> <token><exception postag="D[IN].*" postag_regexp="yes"/></token> <marker> <unify> <feature id="nombre"/> <feature id="genere"/> <token postag="D[IN].*" postag_regexp="yes"/> <token postag="D[IN].*" postag_regexp="yes"/> <token regexp="yes" inflected="yes">&unitats_temps;|&periodes_temps;</token> </unify> <token regexp="yes">després|abans|(en|ar|endar)(rer[ea])</token> </marker> </pattern> <disambig action="add"> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> <wd pos="LOC_ADV_TEMP"/> </disambig> </rule>
<!-- Tags URL tokens with IS_URL so that they are excluded from the list of unknown words. The dot after "www" is escaped: unescaped, it matched any character, so every token merely starting with "www" was treated as a URL. -->
<rule id="URL" name="url"> <pattern> <token regexp="yes">(https?|ftp)://.*|www\..*</token> </pattern> <disambig action="add"> <wd pos="IS_URL" lemma="IS_URL"/> </disambig> </rule>
</rulegroup>
<!-- Bible book names and abbreviations (case-sensitive) followed by a token that starts with a digit and continues with digits, commas, dots or hyphens: the book token is tagged _abrev_biblia. -->
<rule id="llibres_biblia" name="abreviatures de llibres de la Bíblia"> <pattern case_sensitive="yes"> <marker> <token regexp="yes">Jo|Gn|Ex|Lv|Nm|Dt|Jos|Jt|Rt|1Sa|2Sa|1Re|2Re|1Cr|2Cr|Esd|Ne|Est|Jb|Sl|Pr|Coh|Ct|Is|Jr|Lm|Ez|Dn|Os|Jl|Am|Ab|Jon|Mi|Na|Ha|So|Ag|Za|Ml|Mt|Mc|Lc|Jn|Ac|Rm|1Co|2Co|Ga|Ef|Fl|Col|1Te|2Te|1Tm|2Tm|Tt|Flm|He|Jm|1Pe|2Pe|1Jn|2Jn|3Jn|Jud|Ap|Estgr|Jdt|Tb|1Ma|2Ma|Sv|Sir|Ba|EpJr|Dngr|Dngr3|Dngr13|Dngr14|Man|3Esr|4Esr|Sl151|Lao|SIH|Abdies|Ageu|Amós|Apocalipsi|Apòstols|Baruc|Cohèlet|Colossencs|Corintis|Cròniques|Càntic|Daniel|Deuteronomi|Efesis|Escrits|Esdres|Ester|Ezequiel|Fets|Filipencs|Filèmon|grec|Gàlates|Gènesi|Habacuc|Hebreus|Isaïes|Jaume|Jeremies|Joan|Job|Joel|Jonàs|Josuè|Judes|Judit|Jutges|Lamentacions|Levític|Lluc|Macabeus|Malaquies|Marc|Mateu|Miquees|Nahum|Nehemies|Nombres|Osees|Pentateuc|Pere|Proverbis|Reis|Romans|Rut|Salms|Samuel|Saviesa|Siràcida|Sofonies|Tessalonicencs|Timoteu|Titus|Tobit|Zecaries|Èxode</token> </marker> <token regexp="yes">[0-9][0-9,.-]*</token> </pattern> <disambig action="add"> <wd pos="_abrev_biblia" lemma="_abrev_biblia"/> </disambig> </rule>
<rulegroup id="carreteres" name="carreteres"> <rule> <pattern case_sensitive="yes"> <marker>
<token>AP</token> </marker> <token spacebefore="no">-</token> <token spacebefore="no" regexp="yes">\d</token> </pattern> <disambig action="add"> <wd pos="NCFS000" lemma="_carretera"/> </disambig> </rule>
<!-- Road identifier "N" + hyphen + three digits, written without spaces (case-sensitive): the prefix gets the NCFS000 tag with lemma _carretera. -->
<rule> <pattern case_sensitive="yes"> <marker> <token>N</token> </marker> <token spacebefore="no">-</token> <token spacebefore="no" regexp="yes">\d\d\d</token> </pattern> <disambig action="add"> <wd pos="NCFS000" lemma="_carretera"/> </disambig> </rule>
<!-- Road identifier "C" + hyphen + two digits, same tagging. -->
<rule> <pattern case_sensitive="yes"> <marker> <token>C</token> </marker> <token spacebefore="no">-</token> <token spacebefore="no" regexp="yes">\d\d</token> </pattern> <disambig action="add"> <wd pos="NCFS000" lemma="_carretera"/> </disambig> </rule>
</rulegroup>
<!-- Noun or adjective pairs after one of the expressio_DOS_NOMS words: the first member of the pair is tagged ignore_concordance. -->
<rulegroup id="expressio_guionet" name="expressió amb guionet">
<!-- Pair joined without spaces by a hyphen, a slash or an angle bracket. The two angle brackets are written as character references: a raw less-than sign inside element text is not well-formed XML. The regular expression seen by the rule engine is unchanged. -->
<rule> <pattern> <token regexp="yes" inflected="yes" skip="2">&expressio_DOS_NOMS;</token> <marker> <token postag="N.*|A.*" postag_regexp="yes"/> </marker> <token spacebefore="no" regexp="yes">-|/|&gt;|&lt;</token> <token postag="N.*|A.*" postag_regexp="yes" spacebefore="no"/> </pattern> <disambig action="add"> <wd pos="ignore_concordance"/> </disambig> </rule>
<!-- Pair joined by the conjunction "i". -->
<rule> <pattern> <token regexp="yes" inflected="yes">&expressio_DOS_NOMS;</token> <marker> <token postag="N.*|A.*" postag_regexp="yes"/> </marker> <token>i</token> <token postag="N.*|A.*" postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="ignore_concordance"/> </disambig> </rule>
</rulegroup>
<!-- "NUMBER i seg.": the readings of "seg" are replaced by lemma "següent" with tag Y. -->
<rule id="seg" name="abreviatura: seg"> <pattern> <token regexp="yes">\d+</token> <token>i</token> <marker> <token>seg</token> </marker> <token>.</token> </pattern> <disambig action="replace"> <wd lemma="següent" pos="Y"/> </disambig> </rule>
<!-- "s" followed by one of the listed adjectives (llarga, sonora, sorda...): the readings of "s" are replaced by the noun "essa" (NCFS000). -->
<rule id="s_essa" name="essa"> <pattern> <marker> <token>s</token> </marker> <token regexp="yes">llarga|curta|sonora|sorda|impura|marcada|líquida</token> </pattern> <disambig action="replace"> <wd lemma="essa" pos="NCFS000"/> </disambig> </rule>
<rule id="OFERTA" name="oferta (ofertar)"> <pattern>
<and> <token postag="VM[^P].*" postag_regexp="yes" regexp="yes">ofert|oferta|ofertes</token> <token postag="V.P.*|NC.*" postag_regexp="yes"/> </and> </pattern> <!-- Both conditions inside the "and" element apply to the same token: when ofert/oferta/ofertes carries a VM[^P].* reading together with a V.P.* or NC.* reading, the VM[^P].* readings are removed. --> <disambig action="remove" postag="VM[^P].*"/> </rule> <!-- "què" directly after a token tagged SPS00: only its PR.* readings are kept (filter). The antipattern blocks the rule when a "?" token follows the "què" anywhere later in the sentence (skip="-1"). --> <rule id="PR_PT" name="PR/PT (què)"> <antipattern> <token postag="PR.*" postag_regexp="yes" skip="-1">què</token> <token>?</token> </antipattern> <pattern> <token postag="SPS00"/> <marker> <token postag="PR.*" postag_regexp="yes">què</token> </marker> </pattern> <disambig action="filter" postag="PR.*"/> </rule> <!-- A determiner tagged DA..S. gets an extra _data_concreta reading when it is followed by "endemà", by a time word / month / weekday / season / four-digit number, or by "<number> de <month>". Only the determiner is inside the marker. --> <rulegroup id="data_concreta" name="data concreta"> <rule> <pattern> <marker> <token postag="DA..S." postag_regexp="yes"/> </marker> <token>endemà</token> </pattern> <disambig action="add"> <wd pos="_data_concreta"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="DA..S." postag_regexp="yes"/> </marker> <token regexp="yes">dia|setmana|mes|any|&mesos_any;|&dies_setmana;|primavera|estiu|tardor|hivern|\d\d\d\d</token> <!--<token regexp="yes">de|d'|que|\d+|vinent|pròxima?|propera?|següent|provinent</token>--> </pattern> <disambig action="add"> <wd pos="_data_concreta"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="DA..S." postag_regexp="yes"/> </marker> <token regexp="yes">\d+</token> <token inflected="yes">de</token> <token regexp="yes">&mesos_any;</token> </pattern> <disambig action="add"> <wd pos="_data_concreta"/> </disambig> </rule> <rule> <pattern> <marker> <token postag="DA..S." 
postag_regexp="yes"/> </marker> <token postag="numeral|DN.*" postag_regexp="yes"/> <token inflected="yes">de</token> <token regexp="yes">&mesos_any;</token> </pattern> <disambig action="add"> <wd pos="_data_concreta"/> </disambig> </rule> </rulegroup> <!-- One rule per inflected form of "pringat": each adds an AQ0... reading with lemma "pringat", except when the previous token is a form of "haver" (exception with scope="previous"). --> <rulegroup id="pringat" name="pringat"> <rule> <pattern> <marker> <token>pringat<exception scope="previous" inflected="yes">haver</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AQ0MS0" lemma="pringat"/> </disambig> </rule> <rule> <pattern> <marker> <token>pringats<exception scope="previous" inflected="yes">haver</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AQ0MP0" lemma="pringat"/> </disambig> </rule> <rule> <pattern> <marker> <token>pringada<exception scope="previous" inflected="yes">haver</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AQ0FS0" lemma="pringat"/> </disambig> </rule> <rule> <pattern> <marker> <token>pringades<exception scope="previous" inflected="yes">haver</exception></token> </marker> </pattern> <disambig action="add"> <wd pos="AQ0FP0" lemma="pringat"/> </disambig> </rule> </rulegroup> <!-- Unit symbols after a number: a percent-like sign, or an optional prefix plus a unit symbol plus an optional exponent (matched case-sensitively), gets an added Y reading. Tokens that have an NP.* reading are excluded. The two antipatterns suppress the rule for a number followed by aC/dC and for a _C_TEMPS token followed by a|aC|dC|el|es. --> <rulegroup id="UNITATS_SI" name="Sistema Internacional d'Unitats"> <rule> <antipattern> <token regexp="yes">[\d\.,  ]*\d</token> <token regexp="yes">aC|dC</token> </antipattern> <antipattern> <token postag="_C_TEMPS"/> <token regexp="yes">a|aC|dC|el|es</token> </antipattern> <pattern> <token regexp="yes">[\d\.,  ]*\d</token> <marker> <token regexp="yes" case_sensitive="yes">[%‰‱]|(da|h|k|M|G|T|P|E|Z|Y|d|c|m|µ|n|p|f|a|z|y)?(m|g|s|A|K|cd|mol|Hz|N|Pa|J|W|Wh|C|V|Ω|S|F|T|Wb|H|rad|sr|lm|lx|Bq|Gy|Sv|kat|l|L)[²³23]?<exception postag="NP.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="Y"/> </disambig> </rule> <!-- Second unit of a "number unit / unit" sequence: only the unit after the slash is marked. --> <rule> <pattern> <token regexp="yes">[\d\.,  ]*\d</token> <token regexp="yes" 
case_sensitive="yes">[%‰‱]|(da|h|k|M|G|T|P|E|Z|Y|d|c|m|µ|n|p|f|a|z|y)?(m|g|s|A|K|cd|mol|Hz|N|Pa|J|W|Wh|C|V|Ω|S|F|T|Wb|H|rad|sr|lm|lx|Bq|Gy|Sv|kat|l|L)[²³23]?<exception postag="NP.*" postag_regexp="yes"/></token> <token>/</token> <marker> <token regexp="yes" case_sensitive="yes">[%‰‱]|(da|h|k|M|G|T|P|E|Z|Y|d|c|m|µ|n|p|f|a|z|y)?(m|g|s|A|K|cd|mol|Hz|N|Pa|J|W|Wh|C|V|Ω|S|F|T|Wb|H|rad|sr|lm|lx|Bq|Gy|Sv|kat|l|L)[²³23]?<exception postag="NP.*" postag_regexp="yes"/></token> </marker> </pattern> <disambig action="add"> <wd pos="Y"/> </disambig> </rule> </rulegroup> <!-- The single letters "s" and "g" after a determiner tagged D..FS. have their readings replaced by NCFS000. --> <rule id="noms_lletres" name="algunes lletres"> <pattern> <token postag="D..FS." postag_regexp="yes"/> <marker> <token regexp="yes">s|g</token> </marker> </pattern> <disambig action="replace"> <wd pos="NCFS000"/> </disambig> </rule> <!-- Isolated letters tagged NPCN000: "-m" after a token ending in a digit (replace), and a single uppercase letter in several contexts (add). --> <rulegroup id="lletres_majuscules" name="lletres soltes majúscules"> <rule> <pattern> <token regexp="yes">.*\d</token> <marker> <token>-m</token> </marker> </pattern> <disambig action="replace"> <wd pos="NPCN000"/> </disambig> </rule> <!-- Single uppercase letter without a Y reading whose previous token is neither the sentence start nor one of the listed punctuation marks. The antipattern skips "A" followed by an all-uppercase token. --> <rule> <antipattern> <token>A</token> <token regexp="yes">\p{Lu}+</token> </antipattern> <pattern> <token><exception postag="SENT_START"/><exception regexp="yes">[¿?¡!"'‘“«»—–:\-]</exception></token> <marker> <token regexp="yes">\p{Lu}</token> </marker> </pattern> <disambig action="add"> <wd pos="NPCN000"/> </disambig> </rule> <rule> <!-- Example: "A és igual a B" ("A is equal to B"): sentence-initial uppercase letter followed by a token tagged VS..3S.. --> <pattern> <token postag="SENT_START"/> <!--<token min="0" regexp="yes">[¿?¡!"'‘“«»—–:\-]</token>--> <marker> <token regexp="yes">\p{Lu}</token> </marker> <token postag="VS..3S.." postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="NPCN000"/> </disambig> </rule> <rule> <!-- Example: "A és igual a B" ("A is equal to B"), here with one punctuation token between the sentence start and the letter. --> <pattern> <token postag="SENT_START"/> <token regexp="yes">[¿?¡!"'‘“«»—–:\-]</token> <marker> <token regexp="yes">\p{Lu}</token> </marker> <token postag="VS..3S.." 
postag_regexp="yes"/> </pattern> <disambig action="add"> <wd pos="NPCN000"/> </disambig> </rule> </rulegroup> <!-- The letters m, n, x, y, z are exempt from spell checking right after a form of "ordre" or "dimensió". --> <rulegroup id="lletres_minuscules" name="lletres soltes minúscules"> <rule> <pattern> <token regexp="yes" inflected="yes">ordre|dimensió</token> <marker> <token regexp="yes">m|n|x|y|z</token> </marker> </pattern> <disambig action="ignore_spelling"/> </rule> </rulegroup> <!-- Plural painter names (e.g. "picassos") after a token tagged D.* get an added NCMP000 reading with lemma "np". --> <rule id="plurals" name="alguns plurals"> <pattern> <token postag="D.*" postag_regexp="yes"/> <marker> <token regexp="yes">(picasso|miró|dalí|rembrandt|botticelli)s</token> </marker> </pattern> <disambig action="add"> <wd lemma="np" pos="NCMP000"/> </disambig> </rule> <!-- Words spelled out letter by letter with spaces. Each rule matches four consecutive single-letter tokens and immunizes one end of the window: the first rule the first letter, the second rule the fourth. NOTE(review): in a run of exactly four letters the second and third are matched by neither marker; confirm this is intended. --> <rulegroup id="lletres_separades" name="lletres separades"> <rule> <!-- Example: "c o n c l u s i ó" (marker on the first letter of the window) --> <pattern> <marker> <token regexp="yes">\p{L}</token> </marker> <token regexp="yes" spacebefore="yes">\p{L}</token> <token regexp="yes" spacebefore="yes">\p{L}</token> <token regexp="yes" spacebefore="yes">\p{L}</token> </pattern> <disambig action="immunize"/> </rule> <rule> <!-- Example: "c o n c l u s i ó" (marker on the last letter of the window) --> <pattern> <token regexp="yes">\p{L}</token> <token regexp="yes" spacebefore="yes">\p{L}</token> <token regexp="yes" spacebefore="yes">\p{L}</token> <marker> <token regexp="yes" spacebefore="yes">\p{L}</token> </marker> </pattern> <disambig action="immunize"/> </rule> </rulegroup> <!-- A hyphen directly followed (no space) by one of the listed suffixes is immunized, hyphen included. --> <rulegroup id="sufixos_prefixos" name="sufixos i prefixos"> <rule> <pattern> <marker> <token>-</token> <token regexp="yes" spacebefore="no">ista|isme|ir|ar|er|re</token> </marker> </pattern> <disambig action="immunize"/> </rule> </rulegroup> <!-- Numeric and alphanumeric tokens that are exempt from spell checking (ignore_spelling) or immunized. The first rules cover dates built from day digits, an abbreviated month (mesos_any_abrev entity) and year digits, written as one token or separated by "-". --> <rulegroup name="Ignore spelling numbers " id="IGNORE_NUMBERS"> <rule> <pattern> <marker> <token regexp="yes">\d\d?(&mesos_any_abrev;)\d\d(\d\d)?</token> </marker> </pattern> <disambig action="ignore_spelling"/> </rule> <rule> <pattern> <marker> <token regexp="yes">\d\d?</token> <token>-</token> <token regexp="yes">&mesos_any_abrev;</token> <token>-</token> <token regexp="yes">\d\d(\d\d)?</token> </marker> </pattern> <disambig 
action="immunize"/>
    </rule>
    <!-- Date written as day / abbreviated month / year with slashes. -->
    <rule>
      <pattern>
        <marker>
          <token regexp="yes">\d\d?</token>
          <token>/</token>
          <token regexp="yes">&mesos_any_abrev;</token>
          <token>/</token>
          <token regexp="yes">\d\d(\d\d)?</token>
        </marker>
      </pattern>
      <disambig action="immunize"/>
    </rule>
    <!-- Digits followed by one or two "x", or "x" followed by digits. -->
    <rule>
      <pattern>
        <token regexp="yes">\d+xx?|x\d+</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Day number 0-31 followed by one uppercase letter from GFMAJSOND. -->
    <rule name="dates">
      <pattern>
        <token regexp="yes" case_sensitive="yes">(\d|[12]\d|3[01])[GFMAJSOND]</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <rule>
      <!-- minus sign -->
      <pattern>
        <token regexp="yes">−?[\d .,]+%?</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <rule>
      <!-- style rules can be suggested for these abbreviations -->
      <pattern>
        <token regexp="yes">([012][0-9][\.,])?[0-6]?[0-9]</token>
        <token regexp="yes" case_sensitive="yes">pm|am|PM|AM|GMT|CEST|UTC|EST</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Two numbers joined by "x" or a fraction slash in a single token. -->
    <rule>
      <pattern>
        <token regexp="yes">[\d ,\.]+[x⁄][\d ,\.]+</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Uppercase/digit codes joined by a hyphen without spaces. The
         antipattern excludes pairs made only of uppercase letters, so at
         least one side must contain a digit. -->
    <rule>
      <antipattern case_sensitive="yes">
        <token regexp="yes">[A-Z]+</token>
        <token spacebefore="no">-</token>
        <!-- regexp="yes" was missing here, so this token was compared with the
             literal text "[A-Z]+" and the antipattern could never match. -->
        <token spacebefore="no" regexp="yes">[A-Z]+</token>
      </antipattern>
      <pattern case_sensitive="yes">
        <token regexp="yes">[A-Z0-9]+</token>
        <token spacebefore="no">-</token>
        <token spacebefore="no" regexp="yes">[A-Z0-9]+</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Uppercase letters followed by digits, except CO2 and COVID19. -->
    <rule>
      <pattern>
        <token regexp="yes" case_sensitive="yes">[A-Z]+\d+<exception regexp="yes">CO2|COVID19</exception></token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Sentence-initial "Al-Àndalus", optionally preceded by up to four punctuation tokens. -->
    <rule>
      <pattern case_sensitive="yes">
        <token postag="SENT_START"/>
        <token min="0" max="4" regexp="yes">\p{P}</token>
        <token>Al</token>
        <token>-</token>
        <token>Àndalus</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Compact time: hours "h" minutes "min"/"m", optionally seconds "s". -->
    <rule>
      <pattern>
        <token regexp="yes">([01]?\d|2[0-3])h[0-5]?\d(min|m)([0-5]?\ds)?</token>
      </pattern>
      <disambig action="ignore_spelling"/>
</rule>
    <!-- Compact time: hours "h" minutes. -->
    <rule>
      <pattern>
        <token regexp="yes">([01]?\d|2[0-3])h[0-5]?\d</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Compact time: minutes "min"/"m" seconds "s". -->
    <rule>
      <pattern>
        <token regexp="yes">[0-5]?\d(min|m)[0-5]?\ds</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Three or more digits followed by uppercase letters. -->
    <rule>
      <pattern case_sensitive="yes">
        <token regexp="yes">\d\d\d\d*[A-Z]+</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- "sub-" followed by a one- or two-digit number, no spaces. -->
    <rule>
      <pattern>
        <token>sub</token>
        <token spacebefore="no">-</token>
        <token spacebefore="no" regexp="yes">\d?\d</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- One uppercase letter, hyphen, number. -->
    <rule>
      <pattern>
        <token regexp="yes" case_sensitive="yes">[A-Z]</token>
        <token>-</token>
        <token regexp="yes">\d+</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Number, hyphen, one uppercase letter. -->
    <rule>
      <pattern>
        <token regexp="yes">\d+</token>
        <token>-</token>
        <token regexp="yes" case_sensitive="yes">[A-Z]</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Decimal number followed by one lowercase letter.
         Fixed: the fractional part was written "d+" (literal letter d) instead of "\d+". -->
    <rule>
      <pattern>
        <token regexp="yes" case_sensitive="yes">\d+\.\d+[a-z]</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Dimensions such as 10x15cm or 2,5x3,5m.
         Fixed: "[\.,d]" listed the literal letter d instead of the digit class "\d". -->
    <rule>
      <pattern>
        <token regexp="yes" case_sensitive="yes">\d+[\.,\d]*x\d+[\.,\d]*(cm|mm|m)</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- Digits followed by px, p, v or r. -->
    <rule>
      <pattern>
        <token regexp="yes" case_sensitive="yes">\d+(px|p|v|r)</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <!-- wrong units -->
    <!-- Fixed: "[\.,d]" required exactly one of ".", "," or the letter d between
         the digits and the unit, so plain "100Km" never matched. It now accepts
         any run of digits and decimal separators, like the dimension rule above. -->
    <rule>
      <pattern case_sensitive="yes">
        <token regexp="yes" case_sensitive="yes">\d+[\.,\d]*(sg|mt|K[mgplWB]|Kbps|Kcal|Kbit|k|K)</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
  </rulegroup>

  <!-- Colloquial infinitive forms before a clitic: the truncated form gets an
       added VMN0000 reading with the standard lemma. -->
  <rulegroup id="verbs_colloquials" name="formes col·loquials d'alguns verbs">
    <rule>
      <pattern>
        <marker>
          <token>coneixe</token>
        </marker>
        <token regexp="yes">'l|'ls|'ns|-us</token>
      </pattern>
      <disambig action="add">
        <wd lemma="conèixer" pos="VMN0000"/>
      </disambig>
    </rule>
    <rule>
      <pattern>
        <marker>
          <token>digue</token>
        </marker>
        <token regexp="yes">'ls|'ns</token>
      </pattern>
      <disambig action="add">
        <wd lemma="dir"
pos="VMN0000"/> </disambig> </rule> </rulegroup> <!-- "M" followed by a pound, euro or dollar sign in one token gets an added NCMN000 reading. NOTE(review): the lemma is "euros" for all three currency signs; confirm this is intended. --> <rule id="monedes" name="monedes"> <pattern> <token regexp="yes">M[£€$]</token> </pattern> <disambig action="add"> <wd lemma="euros" pos="NCMN000"/> </disambig> </rule> <!-- "info" is exempt from spell checking after "més" or "+". --> <rule id="mes_info" name="més info"> <pattern> <token regexp="yes">més|\+</token> <marker> <token>info</token> </marker> </pattern> <disambig action="ignore_spelling"/> </rule> <!-- "Carmen" gets an added NPFSSP0 reading when a word from the context_OPERA entity occurs anywhere later (first rule) or anywhere earlier (second rule) in the sentence; skip="-1" allows any number of tokens in between. --> <rulegroup id="CARMEN" name="Carmen"> <rule> <pattern> <marker> <token skip="-1">Carmen</token> </marker> <token regexp="yes" inflected="yes">&context_OPERA;</token> </pattern> <disambig action="add"> <wd lemma="Carmen" pos="NPFSSP0"/> </disambig> </rule> <rule> <pattern> <token skip="-1" regexp="yes" inflected="yes">&context_OPERA;</token> <marker> <token>Carmen</token> </marker> </pattern> <disambig action="add"> <wd lemma="Carmen" pos="NPFSSP0"/> </disambig> </rule> </rulegroup> <!-- "made in" followed by one of the listed place names (the place name is matched case-sensitively): all three tokens are exempt from spell checking. --> <rule id="MADE_IN" name="made in"> <pattern> <marker> <token>made</token> <token>in</token> <token regexp="yes" case_sensitive="yes">USA|China|Europe|Taiwan|Spain|France|Germany|Italy</token> </marker> </pattern> <disambig action="ignore_spelling"/> </rule> <!-- A prefix in parentheses attached to the following word with no spaces, e.g. "(des)" + word: the prefix and the closing parenthesis are immunized. --> <rule id="prefix_entre_parentesis" name="prefix entre parèntesis"> <pattern> <token>(</token> <marker> <token regexp="yes" spacebefore="no">des|dis|in|mal|anti|pro|tele</token> <token spacebefore="no">)</token> </marker> <token spacebefore="no"/> </pattern> <disambig action="immunize"/> </rule> <!-- "verb i re+verb": the second token must be "re" followed by the text of a token matched earlier, referenced with the match element. The first rule exempts it from spell checking; the second handles a preceding weak pronoun (pronom_feble entity) that is repeated before the "re" form, and immunizes both. --> <rulegroup id="passeja_i_repasseja" name="passeja i repasseja"> <rule> <pattern> <token postag="V.*" postag_regexp="yes"/> <token>i</token> <marker> <token>re<match no="0"/></token> </marker> </pattern> <disambig action="ignore_spelling"/> </rule> <rule> <pattern> <token postag="&pronom_feble;" postag_regexp="yes"/> <token postag="V.*" postag_regexp="yes"/> <token>i</token> <marker> <token><match no="0"/></token> <token>re<match no="1"/></token> </marker> </pattern> <disambig action="immunize"/> </rule> </rulegroup> <rule id="IGNORE_SPELLING_CASTELLS" 
name="ignorar nomenclatura de castells">
    <!-- https://www.esadir.cat/entrades/fitxa/node/Concursos_castellers -->
    <!-- Human-tower notation in one token: digit, "d" or "de", a one- or
         two-digit number (optional leading 1), and an optional suffix. -->
    <pattern>
      <marker>
        <token regexp="yes">\dde?1?\d(1|f|fa|fm|fmp|ps|sf|sm)?</token>
      </marker>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>

  <!-- Uppercase letter, then "a", "o" or "i", then uppercase letter
       (e.g. "A a Z"): all three tokens are immunized. Case-sensitive. -->
  <rule id="ignore_uppercase_letters" name="A a Z">
    <pattern case_sensitive="yes">
      <token regexp="yes">[A-Z]</token>
      <token regexp="yes">[aoi]</token>
      <token regexp="yes">[A-Z]</token>
    </pattern>
    <disambig action="immunize"/>
  </rule>

  <!-- "pp" after a number, attached or as a separate token.
       Name fixed: it read "punts penrcentuals" with an unclosed parenthesis. -->
  <rulegroup id="ignore_pp" name="ignorar pp (punts percentuals)">
    <rule>
      <pattern>
        <token regexp="yes">[\d \.,]+\dpp</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <rule>
      <pattern>
        <token regexp="yes">[\d \.,]+\d</token>
        <marker>
          <token>pp</token>
        </marker>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
  </rulegroup>

  <!-- "le" before one of the listed foreign words is exempt from spell checking. -->
  <rule id="IGNORE_SPELLING_LE" name="ignorar le">
    <pattern>
      <marker>
        <token>le</token>
      </marker>
      <token regexp="yes">nozze|jour|courrier|monde|journal</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>

  <!-- A single character between an opening and a closing quotation mark
       (tokens tagged _QM_OPEN / _QM_CLOSE), with no space after the opening mark. -->
  <rule id="IGNORE_LETTER_QUOTES" name="ignore letters between quotes">
    <pattern>
      <token postag="_QM_OPEN"/>
      <marker>
        <token regexp="yes" spacebefore="no">.</token>
      </marker>
      <token postag="_QM_CLOSE"/>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>

  <!-- A single character between an opening and a closing brace, bracket or
       parenthesis. Name fixed: it was a copy of the quotes rule's name. -->
  <rule id="IGNORE_LETTER_PARENTHESIS" name="ignore letters between parentheses">
    <pattern>
      <token regexp="yes">[\{\[\(]</token>
      <marker>
        <token regexp="yes" spacebefore="no">.</token>
      </marker>
      <token regexp="yes">[\}\]\)]</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>

  <!-- Onomatopoeias with repeated letters ("mmm", "aaah"), matched case-sensitively. -->
  <rulegroup id="onomatopeies" name="algunes onomatopeies">
    <rule>
      <pattern>
        <token case_sensitive="yes" regexp="yes">[Mm]mm+</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
    <rule>
      <pattern>
        <token case_sensitive="yes" regexp="yes">A?a+h+</token>
      </pattern>
      <disambig action="ignore_spelling"/>
    </rule>
  </rulegroup>

  <rule name="Ignore spelling of punctuation characters"
id="IGNORE_SPELLING_OF_PUNCTUATION"> <!-- Tokens made only of underscore, tilde or degree characters are exempt from spell checking. --> <pattern> <token regexp="yes">[_~°]+</token> </pattern> <disambig action="ignore_spelling"/> </rule> <!-- A single letter d, l, m, n, s or t directly before an apostrophe-like character is exempt from spell checking; only the letter is inside the marker. --> <rule id="IGNORE_SPELLING_APOSTROPHES" name="ignora l'ortografia en algunes apostrofacions"> <pattern> <marker> <token regexp="yes">[dlmnst]</token> </marker> <token regexp="yes">['`´‘’]</token> </pattern> <disambig action="ignore_spelling"/> </rule> <!-- CHUNKER --> <!-- Verbal periphrases: every token of a matched sequence receives the chunk tag GV (one wd element per pattern token). Covered sequences: haver + de/d' + V.N.*; haver + V.P.* (unless that token also has an N or A reading); anar tagged VA.* + V.N.*; continuar/seguir/estar/anar/prosseguir/acabar + V.G.*; poder/voler/desitjar/deure/saber + V.N.*; tornar/començar/anar + a + V.N.*. --> <rulegroup id="PERIFRASIS_VERBALS" name="perífrasis verbals"> <rule> <pattern> <token inflected="yes">haver</token> <token regexp="yes">de|d'</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="addchunk"> <wd pos="GV"/> <wd pos="GV"/> <wd pos="GV"/> </disambig> </rule> <rule> <pattern> <token inflected="yes">haver</token> <token postag="V.P.*" postag_regexp="yes"><exception postag="[NA].*" postag_regexp="yes"/></token> </pattern> <disambig action="addchunk"> <wd pos="GV"/> <wd pos="GV"/> </disambig> </rule> <rule> <pattern> <token postag="VA.*" postag_regexp="yes" inflected="yes">anar</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="addchunk"> <wd pos="GV"/> <wd pos="GV"/> </disambig> </rule> <rule> <pattern> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">continuar|seguir|estar|anar|prosseguir|acabar</token> <token postag="V.G.*" postag_regexp="yes"/> </pattern> <disambig action="addchunk"> <wd pos="GV"/> <wd pos="GV"/> </disambig> </rule> <rule> <pattern> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">poder|voler|desitjar|deure|saber</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="addchunk"> <wd pos="GV"/> <wd pos="GV"/> </disambig> </rule> <rule> <pattern> <token postag="V.*" postag_regexp="yes" inflected="yes" regexp="yes">tornar|començar|anar</token> <token>a</token> <token postag="V.N.*" postag_regexp="yes"/> </pattern> <disambig action="addchunk"> <wd pos="GV"/> <wd pos="GV"/> <wd pos="GV"/> </disambig> </rule> </rulegroup> 
<!-- Mathematical notation: single lowercase letters used as variables next to
     operators or with superscript/subscript characters are immunized or
     exempt from spell checking. -->
<rulegroup id="MATEMATIQUES" name="notació matemàtica">
  <!-- A character in the range ∀ to ⋿ followed by a lowercase letter: both tokens immunized. -->
  <rule>
    <pattern>
      <token regexp="yes">[∀-⋿]</token>
      <token regexp="yes">[a-z]</token>
    </pattern>
    <disambig action="immunize"/>
  </rule>
  <!-- Lowercase letter followed by =, >, < or +.
       "<" must be written as an entity in XML text; ">" is escaped too for symmetry. -->
  <rule>
    <pattern>
      <token regexp="yes">[a-z]</token>
      <token regexp="yes">[=&gt;&lt;\+]</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
  <!-- =, > or < followed by a lowercase letter. -->
  <rule>
    <pattern>
      <token regexp="yes">[=&gt;&lt;]</token>
      <token regexp="yes">[a-z]</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
  <!-- Lowercase letter with an attached superscript/subscript character (one token). -->
  <rule>
    <pattern>
      <token regexp="yes">[a-z][⁰ⁱ²³⁴⁵⁶⁷⁸⁹⁺⁻⁼⁽⁾ⁿ₀₁₂₃₄₅₆₇₈₉₊₋₌₍₎ₐₑₒₓₔₕₖₗₘₙₚₛₜ]</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
  <!-- Lowercase letter followed by a superscript/subscript character as a separate token. -->
  <rule>
    <pattern>
      <token regexp="yes">[a-z]</token>
      <token regexp="yes">[⁰ⁱ²³⁴⁵⁶⁷⁸⁹⁺⁻⁼⁽⁾ⁿ₀₁₂₃₄₅₆₇₈₉₊₋₌₍₎ₐₑₒₓₔₕₖₗₘₙₚₛₜ]</token>
    </pattern>
    <disambig action="ignore_spelling"/>
  </rule>
</rulegroup>
</rules>
© 2015 - 2025 Weber Informatics LLC | Privacy Policy