|
6 | 6 | | is specific to the training corpus and can be defined in the respective
|
7 | 7 | | language data's #[+a("/usage/adding-languages#tag-map") #[code tag_map.py]].
|
8 | 8 |
|
9 |
| -+accordion("Universal part-of-speech tags") |
| 9 | ++accordion("Universal Part-of-speech Tags") |
10 | 10 | p
|
11 | 11 | | spaCy also maps all language-specific part-of-speech tags to a small,
|
12 | 12 | | fixed set of word type tags following the
|
|
17 | 17 | | #[+api("token#attributes") #[code Token.pos_]] attributes.
|
18 | 18 |
|
19 | 19 | +table(["POS", "Description", "Examples"])
|
20 |
| - +univ-pos-row("ADJ", "adjective", "big, old, green, incomprehensible, first") |
21 |
| - +univ-pos-row("ADP", "adposition", "in, to, during") |
22 |
| - +univ-pos-row("ADV", "adverb", "very, tomorrow, down, where, there") |
23 |
| - +univ-pos-row("AUX", "auxiliary", "is, has (done), will (do), should (do)") |
24 |
| - +univ-pos-row("CONJ", "conjunction", "and, or, but") |
25 |
| - +univ-pos-row("CCONJ", "coordinating conjunction", "and, or, but") |
26 |
| - +univ-pos-row("DET", "determiner", "a, an, the") |
27 |
| - +univ-pos-row("INTJ", "interjection", "psst, ouch, bravo, hello") |
28 |
| - +univ-pos-row("NOUN", "noun", "girl, cat, tree, air, beauty") |
29 |
| - +univ-pos-row("NUM", "numeral", "1, 2017, one, seventy-seven, IV, MMXIV") |
30 |
| - +univ-pos-row("PART", "particle", "'s, not, ") |
31 |
| - +univ-pos-row("PRON", "pronoun", "I, you, he, she, myself, themselves, somebody") |
32 |
| - +univ-pos-row("PROPN", "proper noun", "Mary, John, Londin, NATO, HBO") |
33 |
| - +univ-pos-row("PUNCT", "punctuation", "., (, ), ?") |
34 |
| - +univ-pos-row("SCONJ", "subordinating conjunction", "if, while, that") |
35 |
| - +univ-pos-row("SYM", "symbol", "$, %, §, ©, +, −, ×, ÷, =, :), 😝") |
36 |
| - +univ-pos-row("VERB", "verb", "run, runs, running, eat, ate, eating") |
37 |
| - +univ-pos-row("X", "other", "sfpksdpsxmsa") |
38 |
| - +univ-pos-row("SPACE", "space", "") |
| 20 | + +ud-row("ADJ", "adjective", "big, old, green, incomprehensible, first") |
| 21 | + +ud-row("ADP", "adposition", "in, to, during") |
| 22 | + +ud-row("ADV", "adverb", "very, tomorrow, down, where, there") |
| 23 | + +ud-row("AUX", "auxiliary", "is, has (done), will (do), should (do)") |
| 24 | + +ud-row("CONJ", "conjunction", "and, or, but") |
| 25 | + +ud-row("CCONJ", "coordinating conjunction", "and, or, but") |
| 26 | + +ud-row("DET", "determiner", "a, an, the") |
| 27 | + +ud-row("INTJ", "interjection", "psst, ouch, bravo, hello") |
| 28 | + +ud-row("NOUN", "noun", "girl, cat, tree, air, beauty") |
| 29 | + +ud-row("NUM", "numeral", "1, 2017, one, seventy-seven, IV, MMXIV") |
| 30 | + +ud-row("PART", "particle", "'s, not") |
| 31 | + +ud-row("PRON", "pronoun", "I, you, he, she, myself, themselves, somebody") |
| 32 | + +ud-row("PROPN", "proper noun", "Mary, John, London, NATO, HBO") |
| 33 | + +ud-row("PUNCT", "punctuation", "., (, ), ?") |
| 34 | + +ud-row("SCONJ", "subordinating conjunction", "if, while, that") |
| 35 | + +ud-row("SYM", "symbol", "$, %, §, ©, +, −, ×, ÷, =, :), 😝") |
| 36 | + +ud-row("VERB", "verb", "run, runs, running, eat, ate, eating") |
| 37 | + +ud-row("X", "other", "sfpksdpsxmsa") |
| 38 | + +ud-row("SPACE", "space", "") |
39 | 39 |
|
40 | 40 | +accordion("English", "pos-en")
|
41 | 41 | p
|
|
0 commit comments