Python 读取文件并统计单词出现次数

发布时间: 2023-08-23 16:34:29 | 作者: steve.z
#
#   py_count_words.py
#   py_learn
#
#   Created by Z. Steve on 2023/8/23 10:30.
#
import re
from collections import Counter


def count_words(text):
    """Tally how often each word occurs in *text*, ignoring case.

    The text is lower-cased first, then every maximal run of ``\\w``
    characters bounded by word boundaries is treated as one word.

    Args:
        text: The string to analyse.

    Returns:
        A ``collections.Counter`` mapping each lower-cased word to its
        number of occurrences, keyed in order of first appearance.
    """
    lowered = text.lower()
    # Feed the matches straight into Counter instead of building a list first.
    return Counter(hit.group() for hit in re.finditer(r'\b\w+\b', lowered))


def read_file(
    path='/Users/stevexiaohuzhao/PycharmProjects/py_learn/words.txt',
):
    """Return the entire contents of a UTF-8 text file as one string.

    Args:
        path: Location of the file to read. The default is the absolute
            path this script was originally hard-wired to, so calling
            ``read_file()`` with no arguments behaves as before.

    Returns:
        The decoded text of the file.

    Raises:
        OSError: If the file cannot be opened or read (for example
            ``FileNotFoundError`` when *path* does not exist).
        UnicodeDecodeError: If the file content is not valid UTF-8.
    """
    # The context manager closes the handle even when read() raises, which
    # the manual open()/close() pairing did not guarantee.
    with open(path, mode='r', encoding='utf-8') as fs:
        return fs.read()


# Load the input text and tally its words; both results remain available as
# module-level names.
article = read_file()
word_count = count_words(article)

# Print one "word: count" line per distinct word, in the counter's own
# iteration order.
for word in word_count:
    count = word_count[word]
    print(f"{word}: {count}")