Commit 886190a8 by Vik Paruchuri

Test cv script

parent a3b5a6be
...@@ -9,6 +9,7 @@ sys.path.append(one_up_path) ...@@ -9,6 +9,7 @@ sys.path.append(one_up_path)
import util_functions import util_functions
import essay_set import essay_set
import feature_extractor import feature_extractor
import numpy
from sklearn.ensemble import GradientBoostingClassifier from sklearn.ensemble import GradientBoostingClassifier
...@@ -30,8 +31,8 @@ for i in xrange(1,len(lines)): ...@@ -30,8 +31,8 @@ for i in xrange(1,len(lines)):
scores.append(int(score)) scores.append(int(score))
texts.append(text) texts.append(text)
eset.add_essay(text,int(score)) eset.add_essay(text,int(score))
if score==0: #if int(score)==0:
eset.generate_additional_essays(text,int(score)) # eset.generate_additional_essays(text,int(score))
extractor=feature_extractor.FeatureExtractor() extractor=feature_extractor.FeatureExtractor()
extractor.initialize_dictionaries(eset) extractor.initialize_dictionaries(eset)
...@@ -43,9 +44,13 @@ clf=GradientBoostingClassifier(n_estimators=100, learn_rate=.05, ...@@ -43,9 +44,13 @@ clf=GradientBoostingClassifier(n_estimators=100, learn_rate=.05,
cv_preds=util_functions.gen_cv_preds(clf,train_feats,scores) cv_preds=util_functions.gen_cv_preds(clf,train_feats,scores)
kappa=util_functions.quadratic_weighted_kappa(cv_preds,scores) err=numpy.mean(numpy.abs(cv_preds-scores))
print err
outfile=open("cvout.tsv",'w+') kappa=util_functions.quadratic_weighted_kappa(list(cv_preds),scores)
print kappa
outfile=open("full_cvout.tsv",'w+')
outfile.write("cv_pred" + "\t" + "actual") outfile.write("cv_pred" + "\t" + "actual")
for i in xrange(0,len(cv_preds)): for i in xrange(0,len(cv_preds)):
outfile.write("{0}\t{1}".format(cv_preds[i],scores[i])) outfile.write("{0}\t{1}".format(cv_preds[i],scores[i]))
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment