| import os |
| import chardet |
| from tkinter import filedialog |
| from concurrent.futures import ThreadPoolExecutor |
| |
| |
def get_all_chardet(filename, max_bytes=1048576):
    """Detect and print the character encoding of a single file.

    Reads at most ``max_bytes`` bytes of ``filename`` in binary mode, passes
    them to ``chardet.detect`` and prints the reported encoding. A message is
    printed instead when the file cannot be read, is empty, or when chardet
    reports no encoding.

    Args:
        filename: Path of the file to inspect.
        max_bytes: Maximum number of bytes sampled from the start of the file.

    Returns:
        None. All results are reported on stdout.
    """
    try:
        with open(filename, mode='rb') as f:
            sample = f.read(max_bytes)
    except Exception as e:
        # Deliberately broad: this function is submitted to a thread pool
        # whose futures are discarded, so an uncaught exception would vanish.
        print(f"无法读取文件 {filename},错误信息:{e}")
        return

    if not sample:
        print(f"文件 {filename} 内容为空")
        return

    # Look the encoding up by key rather than by position in the result dict,
    # so the output does not depend on the order of chardet's result keys.
    encoding = chardet.detect(sample)['encoding']
    if not encoding:
        print(f"文件 {filename} 的编码检测失败")
        return
    print(f"{filename} 编码为: {encoding}")
| |
| |
def all_chardet_files(Folderpath):
    """Print the detected encoding of every file below ``Folderpath``.

    The directory tree is traversed with ``os.walk`` and each file path is
    submitted to ``get_all_chardet`` on a thread pool. Leaving the ``with``
    block waits for the submitted tasks to finish.

    Args:
        Folderpath: Root directory to scan recursively.
    """
    # Lazy generator: the walk itself still happens inside the ``with`` block.
    paths = (
        os.path.join(root, name)
        for root, _subdirs, names in os.walk(Folderpath)
        for name in names
    )
    with ThreadPoolExecutor() as pool:
        for path in paths:
            pool.submit(get_all_chardet, path)
| |
| |
def by_filetype(Folderpath):
    """Print the detected encoding of files with a user-chosen extension.

    Prompts for a file extension, then walks ``Folderpath`` and submits every
    file whose extension (as returned by ``os.path.splitext``) equals it to
    ``get_all_chardet`` on a thread pool.

    The entered extension is stripped of surrounding whitespace and given a
    leading dot when one is missing, so ``xml`` and ``.xml`` are equivalent.
    An empty entry is left empty and therefore selects files that have no
    extension. Matching stays case-sensitive.

    Args:
        Folderpath: Root directory to scan recursively.
    """
    filetype = input('输入指定文件类型,例如.xml: ').strip()
    # splitext() yields extensions with their leading dot; accept input
    # typed without it instead of silently matching nothing.
    if filetype and not filetype.startswith('.'):
        filetype = '.' + filetype

    with ThreadPoolExecutor() as executor:
        for dirpath, _dirnames, filenames in os.walk(Folderpath):
            for filename in filenames:
                if os.path.splitext(filename)[1] == filetype:
                    full_path = os.path.join(dirpath, filename)
                    executor.submit(get_all_chardet, full_path)
| |
| |
def get_specified_chardet(filename, b, max_bytes=1048576):
    """Print ``filename`` if its detected encoding equals ``b``.

    Reads at most ``max_bytes`` bytes of the file in binary mode and runs
    ``chardet.detect`` on them. The detected name and ``b`` are compared
    case-insensitively (and ``b`` is stripped of surrounding whitespace), so
    ``UTF-8`` matches a detected ``utf-8``. Nothing is printed for files with
    a different encoding.

    Args:
        filename: Path of the file to inspect.
        b: Name of the encoding to look for.
        max_bytes: Maximum number of bytes sampled from the start of the file.

    Returns:
        None. All results are reported on stdout.
    """
    try:
        with open(filename, mode='rb') as f:
            sample = f.read(max_bytes)
    except Exception as e:
        # Deliberately broad: this function is submitted to a thread pool
        # whose futures are discarded, so an uncaught exception would vanish.
        print(f"无法读取文件 {filename},错误信息:{e}")
        return

    if not sample:
        print(f"文件 {filename} 内容为空")
        return

    # Read the encoding by key instead of by position in the result dict.
    detected = chardet.detect(sample)['encoding']
    # Normalise only real strings; ``detected`` is None when detection fails.
    found = detected.lower() if isinstance(detected, str) else detected
    wanted = b.strip().lower() if isinstance(b, str) else b
    if found == wanted:
        print(f"文件 {filename} 编码为指定的 {b}")
| |
| |
def specified_chardet_files(Folderpath):
    """List the files below ``Folderpath`` that have a user-chosen encoding.

    Prompts for an encoding name, prints a heading, then walks the tree and
    submits each file together with that name to ``get_specified_chardet``
    on a thread pool.

    Args:
        Folderpath: Root directory to scan recursively.
    """
    target = input("请输入需要检测的编码: ")
    print(f"编码是 {target} 的文件如下:")
    with ThreadPoolExecutor() as pool:
        for root, _subdirs, names in os.walk(Folderpath):
            for name in names:
                pool.submit(
                    get_specified_chardet,
                    os.path.join(root, name),
                    target,
                )
| |
| |
def get_no_specified_chardet(filename, b, max_bytes=1048576):
    """Print ``filename`` if its detected encoding differs from ``b``.

    Reads at most ``max_bytes`` bytes of the file in binary mode and runs
    ``chardet.detect`` on them. The detected name and ``b`` are compared
    case-insensitively (and ``b`` is stripped of surrounding whitespace), so
    a detected ``utf-8`` is not reported as different from ``UTF-8``. A file
    whose encoding could not be detected is reported as not being ``b``.

    Args:
        filename: Path of the file to inspect.
        b: Name of the encoding that files are expected to have.
        max_bytes: Maximum number of bytes sampled from the start of the file.

    Returns:
        None. All results are reported on stdout.
    """
    try:
        with open(filename, mode='rb') as f:
            sample = f.read(max_bytes)
    except Exception as e:
        # Deliberately broad: this function is submitted to a thread pool
        # whose futures are discarded, so an uncaught exception would vanish.
        print(f"无法读取文件 {filename},错误信息:{e}")
        return

    if not sample:
        print(f"文件 {filename} 内容为空")
        return

    # Read the encoding by key instead of by position in the result dict.
    detected = chardet.detect(sample)['encoding']
    # Normalise only real strings; ``detected`` is None when detection fails.
    found = detected.lower() if isinstance(detected, str) else detected
    wanted = b.strip().lower() if isinstance(b, str) else b
    if found != wanted:
        print(f"文件 {filename} 编码不是 {b}")
| |
| |
def no_specified_chardet_files(Folderpath):
    """List the files below ``Folderpath`` that lack a user-chosen encoding.

    Prompts for an encoding name, prints a heading, then walks the tree and
    submits each file together with that name to
    ``get_no_specified_chardet`` on a thread pool.

    Args:
        Folderpath: Root directory to scan recursively.
    """
    expected = input("请输入需要检测的编码: ")
    print(f"编码不是 {expected} 的文件如下:")
    with ThreadPoolExecutor() as pool:
        for root, _subdirs, names in os.walk(Folderpath):
            for candidate in (os.path.join(root, name) for name in names):
                pool.submit(get_no_specified_chardet, candidate, expected)
| |
| |
def case():
    """Show the menu once and run the scan the user selects.

    Prints the four available modes, reads the choice from stdin and calls
    the matching scan function with the module-level ``Folderpath`` (assigned
    by the script entry point). Input that is not one of the listed option
    numbers is reported with a message instead of raising ``ValueError`` or
    being ignored silently.
    """
    print("utf-8 GB2312 ascii 等")
    print("1. 输出所有文件的编码")
    print("2. 输出指定类型文件的编码")
    print("3. 输出指定编码的文件")
    print("4. 输出非指定编码的文件")

    actions = {
        1: all_chardet_files,
        2: by_filetype,
        3: specified_chardet_files,
        4: no_specified_chardet_files,
    }
    choice = input("请输入选项:").strip()
    try:
        action = actions[int(choice)]
    except (ValueError, KeyError):
        # ValueError: not a number; KeyError: a number that is not on the menu.
        print(f"无效的选项: {choice}")
        return
    action(Folderpath)
| |
if __name__ == '__main__':
    # Script entry point: choose a directory, then run menu actions until the
    # user answers anything other than "y".
    print("输入需要检测的路径")
    # Kept as a module-level name because case() reads it as a global.
    Folderpath = filedialog.askdirectory()
    if not Folderpath:
        # The dialog was cancelled; there is nothing to scan.
        print("未选择路径,程序退出")
        raise SystemExit(0)
    print("检测的路径是 " + Folderpath)
    case()
    # Ask again after every run; the original read the answer only once, so
    # answering "y" looped forever.
    while input("是否继续?y or exit").strip().lower() == 'y':
        case()
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· 阿里最新开源QwQ-32B,效果媲美deepseek-r1满血版,部署成本又又又降低了!
· AI编程工具终极对决:字节Trae VS Cursor,谁才是开发者新宠?
· 开源Multi-agent AI智能体框架aevatar.ai,欢迎大家贡献代码
· Manus重磅发布:全球首款通用AI代理技术深度解析与实战指南
· 被坑几百块钱后,我竟然真的恢复了删除的微信聊天记录!