python统计文本文件的字数

s

本文为转载,原始出处已无法找到。

还有这个也不错:https://code.google.com/p/pyzh/


统计文本文件中的单词数:程序从当前目录下的 file.txt 读取文本。

# -*- coding: GBK -*-
import string
import sys
# NOTE(review): reload() is a Python 2 builtin and nothing visible in this
# script depends on the reloaded module. Presumably a leftover of the
# sys.setdefaultencoding() idiom -- confirm before removing.
reload(sys)

def compareItems(item1, item2):
    """Compare two ``(word, count)`` pairs for a frequency listing.

    Pairs with a higher count sort first; pairs with equal counts are
    ordered by ascending word.

    The tuples are unpacked inside the body rather than in the signature,
    because tuple parameters were removed in Python 3, and ``cmp()`` is
    replaced by an equivalent expression for the same reason. Callers still
    pass two positional 2-tuples.

    Args:
        item1: first ``(word, count)`` pair.
        item2: second ``(word, count)`` pair.

    Returns:
        -1 if ``item1`` sorts before ``item2``, 1 if after, 0 if equal.
    """
    w1, c1 = item1
    w2, c2 = item2
    if c1 != c2:
        # Larger counts come first, hence the inverted sign.
        return -1 if c1 > c2 else 1
    # Equivalent to cmp(w1, w2): yields -1, 0 or 1.
    return (w1 > w2) - (w1 < w2)

def main():
    """Print the most frequent words of ``file.txt`` in the current directory.

    The text is lower-cased, every punctuation character in the list below
    is replaced by a space, and the result is split on whitespace. The user
    is then asked how many entries to show. The total word count and the
    number of distinct words are printed, followed by the requested entries
    ordered by descending count, with ties broken by ascending word.

    Exits through ``sys.exit`` when the file cannot be read or when the
    value typed at the prompt is not an integer.
    """
    fname = "file.txt"

    try:
        # The context manager closes the handle even if read() fails.
        with open(fname, 'r') as handle:
            text = handle.read().lower()
    except (IOError, OSError, UnicodeError):
        print("\nfile.txt is not exist!!! or There is a R/W error! ")
        sys.exit()

    # The apostrophe is deliberately absent from this list, as in the
    # original script, so contractions stay a single word.
    for ch in '!"#$%&()*+,-./:;<=>?@[\\]^_`{|}~':
        text = text.replace(ch, ' ')
    words = text.split()

    counts = {}
    for w in words:
        counts[w] = counts.get(w, 0) + 1

    # On Python 2, input() evaluates whatever the user types as code; read
    # the raw line instead and convert it explicitly.
    try:
        read_line = raw_input
    except NameError:
        # Python 3: input() already returns the raw string.
        read_line = input
    try:
        n = int(read_line("\n输入要统计的top单词数:"))
    except ValueError:
        sys.exit("\nThe number of top words must be an integer.")

    # Highest count first, then alphabetical; a key function works on both
    # Python 2 and Python 3, unlike list.sort(cmpfunc).
    items = sorted(counts.items(), key=lambda item: (-item[1], item[0]))

    unique = len(items)
    print("\n单词总计:" + str(len(words)))
    print("单词净个数(已去重):" + str(unique))
    print("\n")
    # Clamp the request to the available range; a negative request shows
    # nothing.
    for item in items[:max(0, min(n, unique))]:
        print("%-10s%5d" % item)

# Run the word count only when this file is executed as a script.
if __name__ == "__main__":
    main()





s


你可能感兴趣的:(python统计文本文件的字数)