Home - hpscript/nlp GitHub Wiki
英語
$ pip3 install nltk
import nltk

# Fetch the data packages requested by this example before tokenizing/tagging.
# NOTE(review): recent NLTK releases may look for differently named resources
# (e.g. 'punkt_tab') -- confirm against the installed NLTK version.
nltk.download('punkt')
nltk.download('averaged_perceptron_tagger')

# Sample English sentence to analyse.
sentence = "The Brooklyn Nets appeared to be well on their way to taking a 3-0 series lead over the Boston Celtics Friday night, as they erupted out of the TD Garden gates on a 19-4 run in the first four minutes of action."

# Split the sentence into tokens, tag the tokens, and print the tagged result.
tokens = nltk.word_tokenize(sentence)
tagged_tokens = nltk.pos_tag(tokens)
print(tagged_tokens)
中国語
$ pip3 install jieba
import jieba.posseg as pseg

# Segment the Chinese text with jieba's posseg module.
fen_cixing = pseg.cut("学习辉煌党史重温峥嵘岁月发扬延安精神奋斗新的征程")

# Each item produced by pseg.cut unpacks into a word and its flag
# (presumably the part-of-speech tag, given the posseg module name).
# The loop body must be indented; without it Python raises IndentationError.
for word, flag in fen_cixing:
    print(word, flag)
mecab
https://zenn.dev/yukiko_bass/scraps/0f91d67da6d444
Vagrantfile
# Vagrant machine definition using configuration version "2".
Vagrant.configure("2") do |machine|
  # Base box the VM is built from.
  machine.vm.box = "ubuntu/xenial64"

  # VirtualBox-specific settings.
  machine.vm.provider :virtualbox do |vbox|
    # Forwarded to `VBoxManage modifyvm <id> --memory 4096`
    # (memory size; the unit is MB per the VirtualBox docs).
    vbox.customize ["modifyvm", :id, "--memory", 4096]
  end
end