Skip to content

Commit c71dbe8

Browse files
authored
Update Bag_of_words.py
1 parent 748dd39 commit c71dbe8

File tree

1 file changed

+6
-6
lines changed

1 file changed

+6
-6
lines changed

Bag_of_words.py

+6-6
Original file line numberDiff line numberDiff line change
@@ -8,8 +8,8 @@
88
vocabulary = vocab()
99

1010
# Defining the list of paths where all the training data files are stored.
11-
filePaths = (list(paths.list_files("enron1/train/ham")) + list(paths.list_files("enron4/train/ham")) + list(paths.list_files("hw1/train/ham"))
12-
+ list(paths.list_files("enron1/train/spam")) + list(paths.list_files("enron4/train/spam")) + list(paths.list_files("hw1/train/spam")))
11+
filePaths = (list(paths.list_files("Datasets/enron1/train/ham")) + list(paths.list_files("Datasets/enron4/train/ham")) + list(paths.list_files("Datasets/hw1/train/ham"))
12+
+ list(paths.list_files("Datasets/enron1/train/spam")) + list(paths.list_files("Datasets/enron4/train/spam")) + list(paths.list_files("Datasets/hw1/train/spam")))
1313

1414
# Reading all training data files and preparing the corresponding features*example matrix for the bag_of_words model using the CountVectorizer() method.
1515
vec = CountVectorizer()
@@ -56,8 +56,8 @@ def BOW_test(filePaths):
5656
# Defining a ham function to create a features*example matrix of ham training data.
5757
def ham():
5858
# Defining the list of paths where all the ham training data files are stored.
59-
filePaths = (list(paths.list_files("enron1/train/ham")) + list(
60-
paths.list_files("enron4/train/ham")) + list(paths.list_files("hw1/train/ham")))
59+
filePaths = (list(paths.list_files("Datasets/enron1/train/ham")) + list(
60+
paths.list_files("Datasets/enron4/train/ham")) + list(paths.list_files("Datasets/hw1/train/ham")))
6161

6262
data = []
6363

@@ -79,8 +79,8 @@ def ham():
7979
# Defining a spam function to create a features*example matrix of spam training data.
8080
def spam():
8181
# Defining the list of paths where all the spam training data files are stored.
82-
filePaths = (list(paths.list_files("enron1/train/spam")) + list(
83-
paths.list_files("enron4/train/spam")) + list(paths.list_files("hw1/train/spam")))
82+
filePaths = (list(paths.list_files("Datasets/enron1/train/spam")) + list(
83+
paths.list_files("Datasets/enron4/train/spam")) + list(paths.list_files("Datasets/hw1/train/spam")))
8484

8585
data = []
8686

0 commit comments

Comments
 (0)