feature_names
# ['beats', 'best', 'both', 'brazil', 'germany', 'is', 'love', 'sweden']
# 创建数据帧
pd.DataFrame...]
# ['Hi I Love This Song', '10000 Agree LoveIT', 'Right']
移除停用词
# 加载库
from nltk.corpus import stopwords
# ...
# 首次使用时需要先下载停用词集合
import nltk
nltk.download('stopwords')
'''
[nltk_data] Downloading package stopwords...
'''
# 创建单词标记
tokenized_words = ['i', 'am', 'humbled', 'by', 'this', 'traditional', 'meeting']
词干提取通过识别和删除词缀……
# 展示词性
text_tagged
# [('Chris', 'NNP'), ('loved', 'VBD'), ('outdoor', 'RP'), ('running', 'VBG')]
输出是一个元组列表