#!/usr/bin/python
import sys
def map_words(lines):
    """Yield a ``(word, 1)`` pair for every whitespace-separated word.

    ``lines`` is any iterable of strings (for example ``sys.stdin``).
    Blank or whitespace-only lines produce no pairs.
    """
    for line in lines:
        # str.split() with no arguments already ignores leading and
        # trailing whitespace, so no separate strip() is needed.
        for word in line.split():
            yield word, 1


def run_mapper():
    """Read text from stdin and print one ``"<word> 1"`` line per word."""
    for word, count in map_words(sys.stdin):
        # Parenthesised single-argument form prints identically on
        # Python 2 and Python 3.
        print('%s %s' % (word, count))


if __name__ == '__main__':
    run_mapper()
# reducer.py
#!/usr/bin/python
from operator import itemgetter
import sys
def reduce_counts(lines):
    """Sum the counts per word and return them sorted by word.

    ``lines`` is any iterable of strings (for example ``sys.stdin``), each
    expected to look like ``"<word> <count>"`` with a single space between
    the word and its integer count.

    Lines that have no separator, or whose count is not an integer, are
    skipped rather than aborting the whole run.

    Returns a list of ``(word, total)`` tuples ordered by word.
    """
    word2count = {}
    for line in lines:
        line = line.strip()
        try:
            # Both the unpacking (too few fields) and int() raise
            # ValueError on a malformed record, so guard them together.
            word, count = line.split(' ', 1)
            count = int(count)
        except ValueError:
            continue
        word2count[word] = word2count.get(word, 0) + count
    return sorted(word2count.items(), key=itemgetter(0))


def run_reducer():
    """Read ``"<word> <count>"`` lines from stdin and print the totals."""
    for word, count in reduce_counts(sys.stdin):
        # Parenthesised single-argument form prints identically on
        # Python 2 and Python 3.
        print('%s %s' % (word, count))


if __name__ == '__main__':
    run_reducer()