You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
39 lines
1.1 KiB
Python
39 lines
1.1 KiB
Python
from __future__ import print_function
|
|
from __future__ import unicode_literals
|
|
|
|
from builtins import str, bytes, dict, int
|
|
|
|
import os
|
|
import sys
|
|
sys.path.insert(0, os.path.join(os.path.dirname(__file__), "..", ".."))
|
|
|
|
from pattern.en import parse, Text
|
|
|
|
# The easiest way to analyze the output of the parser is to create a Text.
|
|
# A Text is a "parse tree" of linked Python objects.
|
|
# A Text is essentially a list of Sentence objects.
|
|
# Each Sentence is a list of Word objects.
|
|
# Each Word can be part of a Chunk object, accessible with Word.chunk.
|
|
s = "I eat pizza with a silver fork."
|
|
s = parse(s)
|
|
s = Text(s)
|
|
|
|
# You can also use the parsetree() function,
|
|
# which is the equivalent of Text(parse()).
|
|
|
|
print(s[0].words) # A list of all the words in the first sentence.
|
|
print(s[0].chunks) # A list of all the chunks in the first sentence.
|
|
print(s[0].chunks[-1].words)
|
|
print("")
|
|
|
|
for sentence in s:
|
|
for word in sentence:
|
|
print(word.string,
|
|
word.type,
|
|
word.chunk,
|
|
word.pnp)
|
|
|
|
# A Text can be exported as an XML-string (among other).
|
|
print("")
|
|
print(s.xml)
|