# Read the train and test CSV files with pandas.
test_filename = "test.csv"
train_filename = "train.csv"
train_news = pd.read_csv(train_filename)
test_news = pd.read_csv(test_filename)

# We will start with a simple bag-of-words technique:
# create the feature vectors (document-term matrix) from the "Statement" column.
countV = CountVectorizer()
train_count = countV.fit_transform(train_news["Statement"])

# Print the training document-term matrix.
# The matrix is reported to have size (10240, 12196) by the call below.
# After Change
# Fit the vectorizer on the raw values of the "Statement" column exposed by
# DataPrep.train_news, producing the training document-term matrix, then
# print both the vectorizer and the resulting matrix.
train_count = countV.fit_transform(DataPrep.train_news["Statement"].values)
print(countV)
print(train_count)

# Print the training document-term matrix.
# The matrix is reported to have size (10240, 12196) by the call below.
def get_countVectorizer_stats():