Various scripts for playing around with natural language processing/generation

generate_random.py 327B

1234567891011121314151617
  1. import nltk
  2. import random
  3. TEXT = nltk.corpus.genesis.words('english-kjv.txt')
  4. def main():
  5. bigrams = nltk.bigrams(TEXT)
  6. cfdist = nltk.ConditionalFreqDist(bigrams)
  7. word = random.choice(bigrams)[0]
  8. for i in range(15):
  9. print word,
  10. word = cfdist[word].max()
  11. if __name__ == '__main__':
  12. main()