|
20 | 20 | from pattern.it import parse as parse_it
|
21 | 21 | from pattern.nl import parse as parse_nl
|
22 | 22 |
|
23 |
| -print parse_de("die schwarze Katzen", chunks=False) # die/DT schwarze/JJ Katzen/NNS |
24 |
| -print parse_es("los gatos negros" , chunks=False) # los/DT gatos/NNS negros/JJ |
25 |
| -print parse_fr("les chats noirs" , chunks=False) # les/DT chats/NNS noirs/JJ |
26 |
| -print parse_it("i gatti neri" , chunks=False) # i/DT gatti/NNS neri/JJ |
27 |
| -print parse_nl("de zwarte katten" , chunks=False) # de/DT zwarte/JJ katten/NNS |
| 23 | +print parse_de("die schwarzen Katzen", chunks=False) # die/DT schwarzen/JJ Katzen/NNS |
| 24 | +print parse_es("los gatos negros" , chunks=False) # los/DT gatos/NNS negros/JJ |
| 25 | +print parse_fr("les chats noirs" , chunks=False) # les/DT chats/NNS noirs/JJ |
| 26 | +print parse_it("i gatti neri" , chunks=False) # i/DT gatti/NNS neri/JJ |
| 27 | +print parse_nl("de zwarte katten" , chunks=False) # de/DT zwarte/JJ katten/NNS |
28 | 28 | print
|
29 | 29 |
|
30 | 30 | # In some cases, this means the original tagset is mapped to Penn Treebank:
|
|
34 | 34 | from pattern.es import PAROLE
|
35 | 35 | from pattern.nl import WOTAN
|
36 | 36 |
|
37 |
| -print parse_de("die schwarze Katzen", chunks=False, tagset=STTS) |
38 |
| -print parse_es("los gatos negros" , chunks=False, tagset=PAROLE) |
39 |
| -print parse_nl("de zwarte katten" , chunks=False, tagset=WOTAN) |
| 37 | +print parse_de("die schwarzen Katzen", chunks=False, tagset=STTS) |
| 38 | +print parse_es("los gatos negros" , chunks=False, tagset=PAROLE) |
| 39 | +print parse_nl("de zwarte katten" , chunks=False, tagset=WOTAN) |
40 | 40 | print
|
41 | 41 |
|
42 | 42 | # Not all languages are equally suited to Penn Treebank,
|
|
73 | 73 |
|
74 | 74 | from pattern.text import parse
|
75 | 75 |
|
76 |
| -print parse("die schwarze Katzen", chunks=False, language="de", tagset=UNIVERSAL) |
77 |
| -print parse("the black cats" , chunks=False, language="en", tagset=UNIVERSAL) |
78 |
| -print parse("los gatos negros" , chunks=False, language="es", tagset=UNIVERSAL) |
79 |
| -print parse("les chats noirs" , chunks=False, language="fr", tagset=UNIVERSAL) |
80 |
| -print parse("i gatti neri" , chunks=False, language="it", tagset=UNIVERSAL) |
81 |
| -print parse("de zwarte katten" , chunks=False, language="nl", tagset=UNIVERSAL) |
| 76 | +print parse("die schwarzen Katzen", chunks=False, language="de", tagset=UNIVERSAL) |
| 77 | +print parse("the black cats" , chunks=False, language="en", tagset=UNIVERSAL) |
| 78 | +print parse("los gatos negros" , chunks=False, language="es", tagset=UNIVERSAL) |
| 79 | +print parse("les chats noirs" , chunks=False, language="fr", tagset=UNIVERSAL) |
| 80 | +print parse("i gatti neri" , chunks=False, language="it", tagset=UNIVERSAL) |
| 81 | +print parse("de zwarte katten" , chunks=False, language="nl", tagset=UNIVERSAL) |
82 | 82 | print
|
83 | 83 |
|
84 | 84 | # This comes at the expense of (in this example) losing information about plural nouns (NNS => NN).
|
|
0 commit comments