-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathTranslateAllCNtoTW.py
132 lines (109 loc) · 5.55 KB
/
TranslateAllCNtoTW.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
import logging
import os
import re
import shutil
import tempfile
import zipfile
from functools import lru_cache

import requests
# Root folder to translate; the two log files are also written here.
FOLDER_PATH = r'C:\Users\user\Desktop\example_folder'

# Shared HTTP session and request headers used by translate_text().
session = requests.Session()
header = {"Content-type": "application/json", "Accept": "application/json"}

# Two loggers: 'translate' records text before/after conversion,
# 'process' records which files and archives are being handled.
translate_logger = logging.getLogger('translate')
translate_logger.setLevel(logging.INFO)
process_logger = logging.getLogger('process')
process_logger.setLevel(logging.INFO)

# File handlers. mode='w' starts each log file fresh on every run.
# os.path.join avoids the doubled path separator that string concatenation
# with r'\\translate.log' produced.
translate_handler = logging.FileHandler(
    os.path.join(FOLDER_PATH, 'translate.log'), mode='w', encoding='utf-8')
process_handler = logging.FileHandler(
    os.path.join(FOLDER_PATH, 'process.log'), mode='w', encoding='utf-8')

# Log line format for the file handlers.
formatter = logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')
translate_handler.setFormatter(formatter)
process_handler.setFormatter(formatter)

# Console handler shared by both loggers (no formatter is attached to it).
console = logging.StreamHandler()

# Attach the handlers to the loggers.
translate_logger.addHandler(translate_handler)
translate_logger.addHandler(console)
process_logger.addHandler(process_handler)
process_logger.addHandler(console)
@lru_cache(maxsize=512)  # keep at most 512 distinct results in memory
def translate_text(text, timeout=30):
    """Convert Chinese text with the zhconvert API using the "Taiwan" converter.

    Args:
        text: The text to convert.
        timeout: Seconds to wait for the API before ``requests`` raises a
            timeout error, so a stalled connection cannot hang the whole run.

    Returns:
        The converted text, or "" when ``text`` is empty or the API answers
        with a status code other than 200.
    """
    if not text:
        # Nothing to convert; skip the network round-trip.
        return ""

    url = "https://api.zhconvert.org/convert"
    params = {"converter": "Taiwan", "text": text}
    # NOTE(review): the text travels in the query string of a GET request;
    # very long inputs may exceed URL length limits -- confirm whether the
    # API should be called with POST for large files.
    response = session.get(url, headers=header, params=params, timeout=timeout)
    if response.status_code == 200:
        return response.json()["data"]["text"]
    return ""
def translate_file(file_path):
    """Translate a UTF-8 text file in place.

    The whole file content is sent through ``translate_text`` and the result
    is written back to the same path. The file is left untouched when it is
    empty or when the translation comes back empty.

    Args:
        file_path: Path of the text file to translate.
    """
    # Read the file content.
    with open(file_path, 'r', encoding='utf-8') as f:
        content = f.read()

    if not content:
        # Empty file: nothing to translate or rewrite.
        return

    # Translate the full content, logging the text before and after.
    translate_logger.info('translate before: %s', content)
    translated_text = translate_text(content)
    translate_logger.info('translate after: %s', translated_text)

    if not translated_text:
        # translate_text returns "" when the API call fails; writing that
        # back would wipe the file, so keep the original instead.
        translate_logger.warning(
            'translation returned no text, file left unchanged: %s', file_path)
        return

    # Write the translated content back to the original file.
    with open(file_path, 'w', encoding='utf-8') as f:
        f.write(translated_text)
def _zip_contains_txt(zip_path):
    """Return True if any member name in the archive ends with .txt."""
    with zipfile.ZipFile(zip_path, 'r') as archive:
        return any(
            os.path.splitext(member)[1].lower() == '.txt'
            for member in archive.namelist()
        )


def _translate_zip(zip_path):
    """Extract an archive to a scratch folder, translate it, rebuild the zip."""
    parent = os.path.dirname(zip_path)
    stem = os.path.splitext(os.path.basename(zip_path))[0]
    # A fresh, uniquely named scratch folder next to the archive, so an
    # existing folder named like the archive is never merged into or deleted.
    work_dir = tempfile.mkdtemp(prefix=stem + '_', dir=parent)
    # Build the new archive beside the old one and swap it in at the end, so
    # a failure part-way through leaves the original archive intact.
    rebuilt_path = zip_path + '.tmp'
    try:
        process_logger.info('Extracting {}...'.format(zip_path))
        with zipfile.ZipFile(zip_path, 'r') as archive:
            archive.extractall(work_dir)

        # Recurse so nested folders and nested archives are handled too.
        process_logger.info('Translating folder: {}'.format(work_dir))
        translate_folder(work_dir)

        process_logger.info('Recompressing {}...'.format(work_dir))
        # ZIP_DEFLATED: the zipfile default (ZIP_STORED) stores members
        # uncompressed.
        with zipfile.ZipFile(rebuilt_path, 'w', zipfile.ZIP_DEFLATED) as archive:
            for cur_root, _dirs, cur_files in os.walk(work_dir):
                for name in cur_files:
                    member_path = os.path.join(cur_root, name)
                    archive.write(
                        member_path, os.path.relpath(member_path, work_dir))
        os.replace(rebuilt_path, zip_path)
    finally:
        # Always remove the scratch folder and any half-written archive.
        shutil.rmtree(work_dir, ignore_errors=True)
        if os.path.exists(rebuilt_path):
            os.remove(rebuilt_path)
    process_logger.info('Recompressed: {}'.format(zip_path))


def translate_folder(folder_path):
    """Translate every .txt file under a folder, including those inside zips.

    First pass: each ``.txt`` file found by walking ``folder_path`` is
    translated in place with ``translate_file``. Second pass: each ``.zip``
    file that lists at least one ``.txt`` member is extracted, translated
    recursively with this same function, and rebuilt in place.

    Args:
        folder_path: Root folder to process.
    """
    # Pass 1: translate the plain text files.
    for root, _dirs, files in os.walk(folder_path):
        for file in files:
            if os.path.splitext(file)[1].lower() != '.txt':
                continue
            file_path = os.path.join(root, file)
            process_logger.info('Translating file: {}'.format(file_path))
            translate_file(file_path)
            process_logger.info('Translated: {}'.format(file_path))

    # Pass 2: look for zip archives that contain text files.
    for root, _dirs, files in os.walk(folder_path):
        for file in files:
            if os.path.splitext(file)[1].lower() != '.zip':
                continue
            file_path = os.path.join(root, file)
            try:
                has_txt_file = _zip_contains_txt(file_path)
            except zipfile.BadZipFile:
                # One unreadable archive should not abort the whole run.
                process_logger.warning(
                    'Skipping unreadable zip file: {}'.format(file_path))
                continue
            if has_txt_file:
                _translate_zip(file_path)
            else:
                process_logger.info(
                    'Skipping zip file without .txt files: {}'.format(file_path))
# Script entry point: translate everything under the configured folder.
if __name__ == '__main__':
    translate_folder(FOLDER_PATH)