问题描述
我制作了不同的模型来预测评论是正面的还是负面的(情绪)。现在我想测试不同的模型或只有一种气味的单一模型(例如“食物是美味”)。我该怎么做?
我的代码如下:
# Train model with vectorizer and classifier
# Random Forest
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.ensemble import RandomForestClassifier
from sklearn.linear_model import LogisticRegression
from sklearn.svm import LinearSVC
from sklearn.neighbors import KNeighborsClassifier
from sklearn.metrics import classification_report
from sklearn.pipeline import Pipeline
from sklearn.metrics import confusion_matrix,classification_report
RandomForestClassifier = RandomForestClassifier()
LogisticRegression = LogisticRegression(solver = "lbfgs")
LinearSVC = LinearSVC()
KNeighborsClassifier = KNeighborsClassifier(n_neighbors=5)
clf_list = [RandomForestClassifier,LogisticRegression,LinearSVC,KNeighborsClassifier]
# Model training
from sklearn.model_selection import train_test_split
Independent_var = reviews_english['Review Gast']
Dependent_var = reviews_english['sentiment'] # positive or negative
IV_train,IV_test,DV_train,DV_test = train_test_split(Independent_var,Dependent_var,test_size = 0.2,random_state = 500 )
print('IV_train :',len(IV_train))
print('IV_test :',len(IV_test))
print('DV_train :',len(DV_train))
print('DV_test :',len(DV_test))
tvec_1 = TfidfVectorizer (lowercase=True,stop_words=STOPWORDS,ngram_range=(1,2))
#tvec_1 = TfidfVectorizer (binary=True,norm=False,use_idf = False,smooth_idf=False,lowercase=True,stop_words='english',min_df=1,max_df=1.0,max_features=None,1))
for n,clf in enumerate(clf_list):
model_tvec1 = Pipeline([('vectorizer',tvec_1),('classifier',clf)])
# Model learning
model_tvec1.fit(IV_train,DV_train)
# Model prediction on training and test data
pred_train_tvec1 = model_tvec.predict(IV_train)
pred_test_tvec1 = model_tvec.predict(IV_test)
# Performances
report_training_tvec1 = classification_report(DV_train,pred_train_tvec1)
report_test_tvec1 = classification_report(DV_test,pred_test_tvec1)
print("*************************" " Training report",clf,"*********************")
print(report_training)
print("*************************" " Test report","*********************")
print(report_test)
解决方法
暂无找到可以解决该程序问题的有效方法,小编努力寻找整理中!
如果你已经找到好的解决方法,欢迎将解决方案带上本链接一起发送给小编。
小编邮箱:dio#foxmail.com (将#修改为@)