Skip to content

Commit ce1850b

Browse files
author
Priyansh Gupta
committed
Adding Base Project
1 parent b46b42d commit ce1850b

File tree

6 files changed: 19 additions (+19) and 36 deletions (-36).

BNIEFinal.txt

-9.99 KB
Binary file not shown.

BNPJFinal.txt

-9.99 KB
Binary file not shown.

BNSNFinal.txt

-9.99 KB
Binary file not shown.

BNTFFinal.txt

-9.99 KB
Binary file not shown.

pyGen.py

Lines changed: 8 additions & 26 deletions
Original file line number | Diff line number | Diff line change
@@ -8,8 +8,6 @@
88
from sklearn.feature_extraction.text import CountVectorizer
99
from sklearn.feature_extraction.text import TfidfVectorizer
1010
from sklearn.naive_bayes import GaussianNB
11-
from sklearn.naive_bayes import MultinomialNB
12-
from sklearn.metrics import accuracy_score
1311
from sklearn import svm
1412
csvFile=open('newfrequency300.csv', 'rt')
1513
csvReader=csv.reader(csvFile)
@@ -28,21 +26,17 @@
2826
x=vectorizer.fit_transform(corpus).toarray()
2927
result=np.append(x,y,axis=1)
3028
X=pandas.DataFrame(result)
31-
#model=GaussianNB()
32-
model=MultinomialNB()
29+
model=GaussianNB()
3330
train = X.sample(frac=0.8, random_state=1)
3431
test=X.drop(train.index)
3532
y_train=train[301]
3633
y_test=test[301]
37-
print('Training model for Judging/Perception')
3834
print(train.shape)
3935
print(test.shape)
4036
xtrain=train.drop(301,axis=1)
4137
xtest=test.drop(301,axis=1)
4238
model.fit(xtrain,y_train)
43-
print(model)
44-
print('Accuracy : %f' % accuracy_score(y_true=xtrain[0][:66403],y_pred=xtest[0][:]))
45-
pickle.dump(model, open('BNPJFinal.txt', 'wb'))
39+
pickle.dump(model, open('BNPJFinal.sav', 'wb'))
4640
del result
4741

4842
y=[]
@@ -58,21 +52,17 @@
5852
x=vectorizer.fit_transform(corpus).toarray()
5953
result=np.append(x,y,axis=1)
6054
X=pandas.DataFrame(result)
61-
#model=GaussianNB()
62-
model=MultinomialNB()
55+
model=GaussianNB()
6356
train = X.sample(frac=0.8, random_state=1)
6457
test=X.drop(train.index)
6558
y_train=train[301]
6659
y_test=test[301]
67-
print('Training model for Introversion/Extraversion')
6860
print(train.shape)
6961
print(test.shape)
7062
xtrain=train.drop(301,axis=1)
7163
xtest=test.drop(301,axis=1)
7264
model.fit(xtrain,y_train)
73-
print(model)
74-
print('Accuracy : %f' % accuracy_score(y_true=xtrain[0][:85570],y_pred=xtest[0][:]))
75-
pickle.dump(model, open('BNIEFinal.txt', 'wb'))
65+
pickle.dump(model, open('BNIEFinal.sav', 'wb'))
7666
del result
7767

7868
y=[]
@@ -88,21 +78,17 @@
8878
x=vectorizer.fit_transform(corpus).toarray()
8979
result=np.append(x,y,axis=1)
9080
X=pandas.DataFrame(result)
91-
#model=GaussianNB()
92-
model=MultinomialNB()
81+
model=GaussianNB()
9382
train = X.sample(frac=0.8, random_state=1)
9483
test=X.drop(train.index)
9584
y_train=train[301]
9685
y_test=test[301]
97-
print('Training model for Thinking/Feeling')
9886
print(train.shape)
9987
print(test.shape)
10088
xtrain=train.drop(301,axis=1)
10189
xtest=test.drop(301,axis=1)
10290
model.fit(xtrain,y_train)
103-
print(model)
104-
print('Accuracy : %f' % accuracy_score(y_true=xtrain[0][:64000],y_pred=xtest[0][:]))
105-
pickle.dump(model, open('BNTFFinal.txt', 'wb'))
91+
pickle.dump(model, open('BNTFFinal.sav', 'wb'))
10692
del result
10793

10894
y=[]
@@ -118,18 +104,14 @@
118104
x=vectorizer.fit_transform(corpus).toarray()
119105
result=np.append(x,y,axis=1)
120106
X=pandas.DataFrame(result)
121-
#model=GaussianNB()
122-
model=MultinomialNB()
107+
model=GaussianNB()
123108
train = X.sample(frac=0.8, random_state=1)
124109
test=X.drop(train.index)
125110
y_train=train[301]
126111
y_test=test[301]
127-
print('Training model for Sensing/iNtuition')
128112
print(train.shape)
129113
print(test.shape)
130114
xtrain=train.drop(301,axis=1)
131115
xtest=test.drop(301,axis=1)
132116
model.fit(xtrain,y_train)
133-
print(model)
134-
print('Accuracy : %f' % accuracy_score(y_true=xtrain[0][:47135],y_pred=xtest[0][:]))
135-
pickle.dump(model, open('BNSNFinal.txt', 'wb'))
117+
pickle.dump(model, open('BNSNFinal.sav', 'wb'))

pyPredict.py

Lines changed: 11 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,4 @@
1+
# -*- coding: utf-8 -*-
12
from nltk.corpus import stopwords
23
from nltk.tokenize import word_tokenize
34
from nltk.stem import *
@@ -18,10 +19,10 @@
1819
from sklearn.feature_extraction.text import TfidfVectorizer
1920
from collections import Counter
2021

21-
ckey='M9cjHbuSsAFkUZWPrbhY2Q0kL'
22-
csecret='aYpMuByAZWZoouhqHEjs3BqUNhwF9NfoEHodGk8nBUdOpBJCgR'
23-
atoken='994417184322433025-TAGgZ6on9CY8Sn6jyfjJ4giFx8h2jIh'
24-
asecret='tUItYxsghg0m4kw6QqmiKLVkQzLeNN2r6ZzLSFrvQSARQ'
22+
ckey='...'
23+
csecret='...'
24+
atoken='...'
25+
asecret='...'
2526
auth=tweepy.OAuthHandler(ckey, csecret)
2627
auth.set_access_token(atoken, asecret)
2728
api=tweepy.API(auth)
@@ -125,7 +126,7 @@ def getTweets(user):
125126
with open('user.csv','rt') as f:
126127
csvReader=csv.reader(f)
127128
tweetList=[rows[0] for rows in csvReader]
128-
#os.remove('user.csv')
129+
os.remove('user.csv')
129130
with open('newfrequency300.csv','rt') as f:
130131
csvReader=csv.reader(f)
131132
mydict={rows[1]: int(rows[0]) for rows in csvReader}
@@ -135,10 +136,10 @@ def getTweets(user):
135136
df=pd.DataFrame(x)
136137

137138

138-
model_IE = pickle.load(open("BNIEFinal.txt", 'rb'))
139-
model_SN = pickle.load(open("BNSNFinal.txt", 'rb'))
140-
model_TF = pickle.load(open('BNTFFinal.txt', 'rb'))
141-
model_PJ = pickle.load(open('BNPJFinal.txt', 'rb'))
139+
model_IE = pickle.load(open("BNIEFinal.sav", 'rb'))
140+
model_SN = pickle.load(open("BNSNFinal.sav", 'rb'))
141+
model_TF = pickle.load(open('BNTFFinal.sav', 'rb'))
142+
model_PJ = pickle.load(open('BNPJFinal.sav', 'rb'))
142143

143144
answer=[]
144145
IE=model_IE.predict(df)
@@ -179,4 +180,4 @@ def getTweets(user):
179180
else:
180181
answer.append("J")
181182
mbti="".join(answer)
182-
print(mbti)
183+
print(mbti)

0 commit comments

Comments (0)