8
8
vocabulary = vocab ()
9
9
10
10
# Defining the list of paths where all the training data files are stored.
11
- filePaths = (list (paths .list_files ("enron1/train/ham" )) + list (paths .list_files ("enron4/train/ham" )) + list (paths .list_files ("hw1/train/ham" ))
12
- + list (paths .list_files ("enron1/train/spam" )) + list (paths .list_files ("enron4/train/spam" )) + list (paths .list_files ("hw1/train/spam" )))
11
+ filePaths = (list (paths .list_files ("Datasets/ enron1/train/ham" )) + list (paths .list_files ("Datasets/ enron4/train/ham" )) + list (paths .list_files ("Datasets/ hw1/train/ham" ))
12
+ + list (paths .list_files ("Datasets/ enron1/train/spam" )) + list (paths .list_files ("Datasets/ enron4/train/spam" )) + list (paths .list_files ("Datasets/ hw1/train/spam" )))
13
13
14
14
# Reading all training data files and preparing the corresponding features*example matrix for the bag_of_words model using the CountVectorizer() method.
15
15
vec = CountVectorizer ()
@@ -56,8 +56,8 @@ def BOW_test(filePaths):
56
56
# Defining a ham function to create a features*example matrix of ham training data.
57
57
def ham ():
58
58
# Defining the list of paths where all the ham training data files are stored.
59
- filePaths = (list (paths .list_files ("enron1/train/ham" )) + list (
60
- paths .list_files ("enron4/train/ham" )) + list (paths .list_files ("hw1/train/ham" )))
59
+ filePaths = (list (paths .list_files ("Datasets/ enron1/train/ham" )) + list (
60
+ paths .list_files ("Datasets/ enron4/train/ham" )) + list (paths .list_files ("Datasets/ hw1/train/ham" )))
61
61
62
62
data = []
63
63
@@ -79,8 +79,8 @@ def ham():
79
79
# Defining a spam function to create a features*example matrix of spam training data.
80
80
def spam ():
81
81
# Defining the list of paths where all the spam training data files are stored.
82
- filePaths = (list (paths .list_files ("enron1/train/spam" )) + list (
83
- paths .list_files ("enron4/train/spam" )) + list (paths .list_files ("hw1/train/spam" )))
82
+ filePaths = (list (paths .list_files ("Datasets/ enron1/train/spam" )) + list (
83
+ paths .list_files ("Datasets/ enron4/train/spam" )) + list (paths .list_files ("Datasets/ hw1/train/spam" )))
84
84
85
85
data = []
86
86
0 commit comments