用 Python 统计英语小说的词汇频率

mac2025-06-01  32

"""Count the most frequent words in an English novel stored as a text file."""

# pandas and numpy are imported by the original post but are not used below.
import pandas as pd
import numpy as np
import re
from collections import Counter

# One or more "word" characters (letters, digits, underscore).
WORD_PATTERN = re.compile(r'\w+')


def most_common_words(text, top_n=10):
    """Return the ``top_n`` most frequent words in ``text``.

    The text is lower-cased first, so counting is case-insensitive. Words
    are maximal runs matching ``\\w+``; punctuation such as an apostrophe
    therefore splits a token ("it's" is counted as "it" and "s").

    Args:
        text: The text to analyse.
        top_n: How many of the most frequent words to return.

    Returns:
        A list of ``(word, count)`` tuples, most frequent first.
    """
    tokens = WORD_PATTERN.findall(text.lower())
    return Counter(tokens).most_common(top_n)


if __name__ == "__main__":
    # The novel is read with the gbk codec, as in the original post.
    with open("/home/baba/txt/1.txt", 'r', encoding='gbk') as f:
        common_words = most_common_words(f.read())
    print(common_words)
    # Output reported in the original post:
    # [('the', 7845), ('i', 7255), ('and', 6625), ('to', 5226), ('a', 4468),
    #  ('of', 4366), ('you', 2993), ('in', 2767), ('was', 2525), ('it', 2413)]

 

 

最新回复(0)