赞
踩
import nltk
from nltk import word_tokenize
s='I was watching TV'
print(nltk.pos_tag(word_tokenize(s)))
from nltk.tag.stanford import StanfordPOSTagger
import nltk
stan_tagger=StanfordPOSTagger('models/english-bidirectional-distdim.tagger','standford-postagger.jar')
tokens=nltk.word_tokenize(s)
print(stan_tagger.tag(tokens))
from nltk.corpus import brown
import nltk
tags=[tag for (word,tag) in brown.tagged_words(categories='news')]
print(nltk.FreqDist(tags))
brown_tagged_sents=brown.tagged_sents(categories='news')
default_tagger=nltk.DefaultTagger('NN')
print(default_tagger.evaluate(brown_tagged_sents))
from nltk.corpus import brown import nltk tags=[tag for (word,tag) in brown.tagged_words(categories='news')] print(nltk.FreqDist(tags)) brown_tagged_sents=brown.tagged_sents(categories='news') default_tagger=nltk.DefaultTagger('NN') # print(default_tagger.evaluate(brown_tagged_sents)) from nltk.tag import UnigramTagger,DefaultTagger,BigramTagger,TrigramTagger train_data=brown_tagged_sents[:int(len(brown_tagged_sents)*0.9)] test_data=brown_tagged_sents[int(len(brown_tagged_sents)*0.9):] unigram_tagger=UnigramTagger(train_data,backoff=default_tagger) print(unigram_tagger.evaluate(test_data)) bigram_tagger=BigramTagger(train_data,backoff=unigram_tagger) print(bigram_tagger.evaluate(test_data)) trigram_tagger=TrigramTagger(train_data,backoff=bigram_tagger) print(trigram_tagger.evaluate(test_data))
赞
踩
Copyright © 2003-2013 www.wpsshop.cn 版权所有,并保留所有权利。