|
39 | 39 | 'nisso': {'form': 'em isso', 'lemma': 'em este'},
|
40 | 40 | 'nisto': {'form': 'em isto', 'lemma': 'em este',
|
41 | 41 | 'upos': 'ADP PRON', 'main': 1, 'shape': 'subtree'},
|
42 |
| - 'no': {'form': 'em o', 'lemma': 'em o'}, |
43 |
| - 'nos': {'form': 'em os', 'lemma': 'em o'}, |
| 42 | + 'no': {'form': 'em o', 'lemma': 'em o'}, # PRON cases are excluded below |
| 43 | + 'nos': {'form': 'em os', 'lemma': 'em o'}, # PRON cases are excluded below |
44 | 44 | 'num': {'form': 'em um', 'lemma': 'em um'},
|
45 | 45 | 'numa': {'form': 'em uma', 'lemma': 'em um'},
|
46 | 46 | 'numas': {'form': 'em umas', 'lemma': 'em um'},
|
@@ -79,6 +79,11 @@ class AddMwt(udapi.block.ud.addmwt.AddMwt):
|
79 | 79 |
|
80 | 80 | def multiword_analysis(self, node):
|
81 | 81 | """Return a dict with MWT info or None if `node` does not represent a multiword token."""
|
| 82 | + |
| 83 | + # "no" can be either a contraction of "em o", or a pronoun |
| 84 | + if node.form.lower() in ('no', 'nos') and node.upos == 'PRON': |
| 85 | + return |
| 86 | + |
82 | 87 | analysis = MWTS.get(node.form.lower(), None)
|
83 | 88 |
|
84 | 89 | # If the input is e.g.:
|
|
0 commit comments