" ", , , - , %%file, :
%%file wordcount.py
from mrjob.job import MRJob
class MRWordFrequencyCount(MRJob):
    """mrjob job that counts characters, words and lines of its input.

    The mapper emits three partial counts per input line, keyed by
    "chars", "words" and "lines"; the reducer sums the partial counts
    it receives for each key.
    """

    def mapper(self, _, line):
        """Emit the partial counts contributed by a single input line.

        Args:
            _: Input key; ignored.
            line: One line of input text.

        Yields:
            ("chars", len(line)), ("words", number of whitespace-separated
            tokens in the line) and ("lines", 1).
        """
        yield "chars", len(line)
        yield "words", len(line.split())
        yield "lines", 1

    def reducer(self, key, values):
        """Add up every partial count emitted for ``key``.

        Args:
            key: One of the keys produced by ``mapper``.
            values: Iterable of the integer counts emitted for that key.

        Yields:
            A single (key, total) pair.
        """
        yield key, sum(values)


if __name__ == '__main__':
    # Standard mrjob entry point: without it, executing this file as a
    # script (``python wordcount.py input.txt``) would define the class
    # and exit without running anything.
    MRWordFrequencyCount.run()
mrjob :
# Run the word-count job from inside the notebook and print its results.
import wordcount

try:
    # Python 3.4+: reload() lives in importlib.
    from importlib import reload
except ImportError:
    # Python 2: reload() is a builtin, nothing to import.
    pass

# Re-import the module so that edits written to wordcount.py since the
# first import are picked up by the already-running interpreter.
reload(wordcount)

mr_job = wordcount.MRWordFrequencyCount(args=['example.txt'])
with mr_job.make_runner() as runner:
    runner.run()
    # NOTE(review): newer mrjob releases replace stream_output() /
    # parse_output_line() with cat_output() / parse_output() -- confirm
    # against the installed mrjob version.
    for line in runner.stream_output():
        key, value = mr_job.parse_output_line(line)
        # Single-argument print() behaves the same on Python 2 and 3.
        print("%s %s" % (key, value))
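Note that the job class MRWordFrequencyCount is written to the file wordcount.py and imported from the wordcount module - it is not defined in the notebook itself. Also, because Python caches imported modules, changes made to wordcount.py from iPython are not picked up automatically by a repeated import. Calling reload() solves this.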
: https://groups.google.com/d/msg/mrjob/CfdAgcEaC-I/8XfJPXCjTvQJ
()
mrjob, .
! python mrjob.py shakespeare.txt
: http://jupyter.cs.brynmawr.edu/hub/dblank/public/Jupyter%20Magics.ipynb