1 # This Python file uses the following encoding: utf-8
3 Created on May 30, 2011
8 from mjacob
.nltk
.grammar
.TreeAdjoiningGrammar
import TreeAdjoiningGrammar
9 from mjacob
.nltk
.parse
.tag
.earley
.rules
import TAG_EARLEY_STRATEGY
10 from mjacob
.nltk
.parse
.tag
.TagChartParser
import TagChartParser
14 raw_data
= nltk
.data
.load('grammars/large_grammars/atis_sentences.txt', format
='raw')
15 sentences
= [x
[0] for x
in nltk
.parse
.util
.extract_test_sentences(raw_data
)][:1]
18 grammar
= TreeAdjoiningGrammar(cfg
=nltk
.data
.load('grammars/large_grammars/atis.cfg'))
20 grammar
= TreeAdjoiningGrammar("../integration/tag_chart/degenerate_1/grammar.yaml")
22 grammar
= TreeAdjoiningGrammar("../integration/tag_chart/cross_serial_2/grammar.yaml")
24 parser
= TagChartParser(grammar
)
27 chart
= parser
.chart_parse(sentences
[0])
29 chart
= parser
.chart_parse(['John'])
31 chart
= parser
.chart_parse("Jan Piet Marie de kinderen zag helpen leren zwemmen".split(' '))
35 print(chart
.parses(grammar
.start().symbol(), TAG_EARLEY_STRATEGY
))