Note - Natural Language Processing with Python (Chapter9)

最新推荐文章于 2024-09-07 21:01:55 发布

_Meilinger_

最新推荐文章于 2024-09-07 21:01:55 发布

阅读量121

点赞数

分类专栏：碎片笔记 | 文章标签：nlp 自然语言处理 python

本文链接：https://blog.csdn.net/qq_36332660/article/details/109891290

版权

碎片笔记专栏收录该内容

49 篇文章 3 订阅

订阅专栏

import nltk
from nltk import load_parser


# Example 9.1
# Lexical entries are plain dicts. The verb's AGT/PAT roles start out as the
# placeholders 'sbj'/'obj' and are overwritten further down.
kim = {'CAT': 'NP', 'ORTH': 'Kim', 'REF': 'k'}
chase = {
    'CAT': 'V', 'ORTH': 'chased', 'REL': 'chase',
    'AGT': 'sbj', 'PAT': 'obj',
}
lee = {'CAT': 'NP', 'ORTH': 'Lee', 'REF': 'l'}
sent = "Kim chased Lee"
tokens = sent.split()


def lex2fs(word):
    """Return the lexical entry whose 'ORTH' equals *word*, or None if none matches."""
    matches = (entry for entry in (kim, lee, chase) if entry['ORTH'] == word)
    return next(matches, None)


subj, verb, obj = (lex2fs(token) for token in tokens)
# Fill the verb's role slots with the referents of its subject and object.
verb.update(AGT=subj['REF'], PAT=obj['REF'])
for feature in ('ORTH', 'REL', 'AGT', 'PAT'):
    print("%-5s => %s" % (feature, verb[feature]))


# Lexical entry for the verb 'surprised'; its role features are named
# SRC and EXP rather than the AGT and PAT used for 'chased'.
surprise = {
    'CAT': 'V',
    'ORTH': 'surprised',
    'REL': 'surprise',
    'SRC': 'sbj',
    'EXP': 'obj',
}


# Show the feat0 grammar resource, then load the same resource as an object
# and print that as well.
feat0_path = 'grammars/book_grammars/feat0.fcfg'
nltk.data.show_cfg(feat0_path)

grammar = nltk.data.load(feat0_path)
print(grammar)


# Example 9.2
# Build the parser for the feat0 grammar (trace=2 requests tracing output
# from the parser), then parse one sentence and print every tree found.
cp = load_parser('grammars/book_grammars/feat0.fcfg', trace=2)
tokens = 'Kim likes children'.split()
trees = cp.parse(tokens)
for tree in trees:
    print(tree)


# 9.2 Processing Feature Structures
# A flat feature structure built from keyword arguments.
fs1 = nltk.FeatStruct(TENSE='past', NUM='sg')
print(fs1)

# Features are read and assigned with dict-style indexing.
fs1 = nltk.FeatStruct(PER=3, NUM='pl', GND='fem')
print(fs1['GND'])
fs1['CASE'] = 'acc'

# fs1 becomes the AGR value of fs2: show the whole structure, then the
# nested AGR value, then a single feature inside it.
fs2 = nltk.FeatStruct(POS='N', AGR=fs1)
for shown in (fs2, fs2['AGR'], fs2['AGR']['PER']):
    print(shown)

# A nested structure written in bracketed string notation.
print(nltk.FeatStruct("[POS='N', AGR=[PER=3, NUM='pl', GND='fem']]"))

# Feature names are arbitrary; values here are strings and an integer.
print(nltk.FeatStruct(NAME='Lee', TELNO='01 27 86 42 96', AGE=33))

# Shared values in string notation: (1) tags a value and ->(1) points
# back to that tagged value.
print(nltk.FeatStruct("""[NAME='Lee', ADDRESS=(1)[NUMBER=74, STREET='rue Pascal'],
SPOUSE=[NAME='Kim', ADDRESS->(1)]]"""))

print(nltk.FeatStruct("[A='a', B=(1)[C='c'], D->(1), E->(1)]"))


# Subsumption and Unification
# Unify two structures with disjoint features, in both argument orders.
fs1 = nltk.FeatStruct(NUMBER=74, STREET='rue Pascal')
fs2 = nltk.FeatStruct(CITY='Paris')
for left, right in ((fs1, fs2), (fs2, fs1)):
    print(left.unify(right))


# Both structures give feature A a different atomic value; the result of
# unify() is printed as-is (NLTK documents None for a failed unification).
fs0 = nltk.FeatStruct(A='a')
fs1 = nltk.FeatStruct(A='b')
fs2 = fs0.unify(fs1)
print(fs2)


# The structure carrying the extra information: the spouse's address has a CITY.
fs1 = nltk.FeatStruct("[SPOUSE = [ADDRESS = [CITY = Paris]]]")

# fs0 writes the address out twice, as two separate ADDRESS values.
fs0 = nltk.FeatStruct("""[
NAME=Lee,
ADDRESS=[NUMBER=74,STREET='rue Pascal'],
SPOUSE= [NAME=Kim,ADDRESS=[NUMBER=74,STREET='rue Pascal']]
]""")
print(fs0)

print(fs1.unify(fs0))

# fs2 tags the address with (1) and has the spouse point back to it with ->(1),
# so both ADDRESS features refer to one shared value.
fs2 = nltk.FeatStruct("""[
NAME=Lee,
ADDRESS=(1)[NUMBER=74, STREET='rue Pascal'],
SPOUSE=[NAME=Kim, ADDRESS->(1)]
]""")
print(fs1.unify(fs2))


# ADDRESS1 and ADDRESS2 are both set to the same variable ?x.
fs2 = nltk.FeatStruct("[ADDRESS1=?x, ADDRESS2=?x]")
print(fs2)

# Unify with a structure that supplies a concrete value for ADDRESS1.
fs1 = nltk.FeatStruct("[ADDRESS1=[NUMBER=74, STREET='rue Pascal']]")
print(fs2.unify(fs1))


# 9.3 Extending a Feature based Grammar
# Show the feat1 grammar, build a parser from it, and print every tree
# found for one question.
feat1_path = 'grammars/book_grammars/feat1.fcfg'
nltk.data.show_cfg(feat1_path)
cp = load_parser(feat1_path)

tokens = 'who do you claim that you like'.split()
trees = cp.parse(tokens)
for tree in trees:
    print(tree)


# Example 9.3
# Parse two more sentences with the parser `cp` built earlier in the script,
# printing every tree found for each.
for sentence in ('you claim that you like cats', 'rarely do you sing'):
    tokens = sentence.split()
    for tree in cp.parse(tokens):
        print(tree)


german_path = 'grammars/book_grammars/german.fcfg'
nltk.data.show_cfg(german_path)


# Example 9.4
# Each sentence is parsed with a freshly loaded parser: the first with the
# default options, the second with trace=2 to request tracing output.
# NOTE(review): 'den Katze' looks deliberately ungrammatical, so that the
# trace shows where parsing fails; confirm against the grammar.
for sentence, parser_options in (
    ('ich folge den Katzen', {}),
    ('ich folge den Katze', {'trace': 2}),
):
    tokens = sentence.split()
    cp = load_parser(german_path, **parser_options)
    for tree in cp.parse(tokens):
        print(tree)

_Meilinger_

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
打赏
0
评论
Note - Natural Language Processing with Python (Chapter9)

import nltk
from nltk import load_parser
# Example 9.1
kim = {'CAT': 'NP', 'ORTH': 'Kim', 'REF': 'k'}
chase = {'CAT': 'V', 'ORTH': 'chased', 'REL': 'chase'}
chase['AGT'] = 'sbj'
chase['PAT'] = 'obj'
lee = {'CAT': 'NP', 'ORTH': 'Lee', 'REF': 'l'}
sent = ...
复制链接

扫一扫