changed tokenize.py to score.py

kevin-wittmer · Apr 18, 2016 · 97f7602 · 97f7602
1 parent 98b8392
commit 97f7602
Showing 1 changed file with 18 additions and 0 deletions.
diff --git a/score.py b/score.py
@@ -0,0 +1,18 @@
+import csv
+
+# Split one tweet's text into a list of words; despite the name, no stemming is applied
+def stemmify(tweet_string):
+	word_list = tweet_string.split()  # no-argument split() breaks on runs of whitespace
+	return word_list
+
+# Open the csv file of tweets; DictReader yields one dict per row, keyed by the header row
+csvfile = open('clean_data/collection3.csv')
+csvreader = csv.DictReader(csvfile)
+
+# Split the 'text' field of each row into a list of words and print the list
+for tweet in csvreader:
+	stemmed_words = stemmify(tweet['text'])
+	print stemmed_words  # Python 2 print statement
+
+# Close the csv file (NOTE(review): skipped if the loop above raises; a with-block would guarantee it)
+csvfile.close()