Difference between revisions of "Guinea Pig"
From Cohen Courses
Jump to navigation | Jump to search
(Created page with "= Quick Start = == Running wordcount.py == Set up a directory that contains the file <code>gp.py</code> and a second script called <code>wordcount.py</code> which contains t...")
|||
Line 6: | Line 6: | ||
second script called <code>wordcount.py</code> which contains this | second script called <code>wordcount.py</code> which contains this | ||
code: | code: | ||
+ | |||
+ | # always start like this | ||
+ | from gp import * | ||
+ | import sys | ||
+ | |||
+ | # supporting routines can go here | ||
+ | def tokens(line): | ||
+ | for tok in line.split(): | ||
+ | yield tok.lower() | ||
+ | |||
+ | #always subclass Planner | ||
+ | class WordCount(Planner): | ||
+ | |||
+ | wc = ReadLines('corpus.txt') | FlattenBy(by=tokens) | Group(by=lambda x:x, reducingWith=ReduceToCount()) | ||
+ | |||
+ | # always end like this | ||
+ | if __name__ == "__main__": | ||
+ | WordCount().main(sys.argv) |
Revision as of 15:13, 9 May 2014
Quick Start
Running wordcount.py
Set up a directory that contains the file gp.py and a second script called wordcount.py, which contains this code:
# always start like this
from gp import *
import sys
# supporting routines can go here
def tokens(line):
    """Yield each whitespace-separated token of `line`, lowercased.

    `line.split()` with no arguments splits on runs of any whitespace and
    drops leading/trailing whitespace, so an empty or blank line yields
    nothing.
    """
    for tok in line.split():
        yield tok.lower()
#always subclass Planner
class WordCount(Planner):
    # `wc` is a class-level attribute built by chaining three gp operations
    # with `|`: ReadLines over 'corpus.txt', FlattenBy using the `tokens`
    # helper, and Group keyed on the item itself with ReduceToCount().
    # NOTE(review): presumably this yields a per-token occurrence count;
    # confirm against the gp.py documentation.
    wc = ReadLines('corpus.txt') | FlattenBy(by=tokens) | Group(by=lambda x:x, reducingWith=ReduceToCount())
# always end like this
# Run the planner only when this file is executed as a script (not when it
# is imported), handing it the raw command-line arguments.
if __name__ == "__main__":
    WordCount().main(sys.argv)