bo-graduation/nltk-book/chapter1.py

import nltk

# Read the whole corpus into memory. The context manager closes the handle as
# soon as the text is loaded; the module-level name `file` is kept so existing
# references still resolve (to the now-closed file object).
with open('faceapp.txt', 'r') as file:
    raw = file.read()

# Tokenize the raw text with NLTK and wrap the tokens in an nltk.Text object,
# which is what concordance() is called on at the end of the script.
tokens = nltk.word_tokenize(raw)
faceapp = nltk.Text(tokens)


# my stopwords are common words I don't want to count, like "a", "an", "the".
# Each whitespace-stripped line of stopwords.txt becomes one entry of the set.
with open('stopwords.txt') as stopwords_file:
    stopwords = set(line.strip() for line in stopwords_file)

# dictionary mapping each cleaned word to the number of times it occurs
wordcount = {}

# Substrings stripped from every word, applied in this order.
# NOTE(review): the two "â€…" entries look like mis-decoded curly quotes;
# confirm they match how faceapp.txt is actually decoded before changing them.
_PUNCTUATION = (".", ",", ":", "\"", "!", "â€œ", "â€˜", "*", "(", ")")

# splitting words from punctuation so "book" and "book!" count as the same word
for word in raw.lower().split():
    for mark in _PUNCTUATION:
        word = word.replace(mark, "")

    # A token made only of punctuation collapses to "" and is not a word;
    # stopwords are deliberately left out of the tally.
    if word and word not in stopwords:
        wordcount[word] = wordcount.get(word, 0) + 1


# Show the occurrences of the token 'a' in the corpus, each with its
# surrounding context.
faceapp.concordance('a')
first script 5 years ago			`import nltk`

second script 5 years ago			`file=open('faceapp.txt','r')`
			`raw=file.read()`
first script 5 years ago			`tokens = nltk.word_tokenize(raw)`
			`faceapp = nltk.Text(tokens)`

second script 5 years ago
			`# my stopwords are common words I don't want to count, like "a", "an", "the".`
			`stopwords = set(line.strip() for line in open('stopwords.txt'))`

			`# dictionary`
			`wordcount = {}`

			`# splitting words from punctuation so "book" and "book!" count as the same word`
			`for word in raw.lower().split():`
			`word = word.replace(".","")`
			`word = word.replace(",","")`
			`word = word.replace(":","")`
			`word = word.replace("\"","")`
			`word = word.replace("!","")`
			`word = word.replace("â€œ","")`
			`word = word.replace("â€˜","")`
			`word = word.replace("*","")`
			`word = word.replace("(","")`
			`word = word.replace(")","")`


			`faceapp.concordance('a')`