-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathPhoneticGenerator.py
77 lines (59 loc) · 2.62 KB
/
PhoneticGenerator.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
import re
from pinyin import PinYin
class PhoneticGenerator:
"""处理 iPhone 联系人 VC 格式的转换,提取拼音并添加到字段中"""
def __init__(self, filename='contacts.vcf'):
"""
初始化 PhoneticConvert 对象
:param filename: VCF 文件的路径,默认为 'contacts.vcf'
"""
self.filename = filename
self.py_engine = PinYin()
self.py_engine.load_word()
def convert(self):
"""将 VCF 文件中的联系人姓名转换为拼音,并添加到 X-PHONETIC 字段"""
contact_lines = self._read_file()
updated_contact = []
for line in contact_lines:
updated_contact.append(line)
last_name = self._extract_name_part(line, part='last')
if last_name:
phonetic_last_name = self._convert_to_phonetic(last_name)
updated_contact.append(f"X-PHONETIC-LAST-NAME:{phonetic_last_name}\n")
first_name = self._extract_name_part(line, part='first')
if first_name:
phonetic_first_name = self._convert_to_phonetic(first_name)
updated_contact.append(f"X-PHONETIC-FIRST-NAME:{phonetic_first_name}\n")
self._write_file(updated_contact)
def _read_file(self):
"""读取 VCF 文件并返回文件中的每一行"""
with open(self.filename, 'r', encoding='utf-8') as f:
return f.readlines()
def _write_file(self, updated_contact):
"""将更新后的联系人信息写回到 VCF 文件"""
with open(self.filename, 'w', encoding='utf-8') as fout:
fout.writelines(updated_contact)
def _extract_name_part(self, line, part='last'):
"""
从联系人信息中提取姓或名
:param line: VCF 文件中的一行
:param part: 提取部分,'last' 为姓,'first' 为名
:return: 姓或名,如果未找到则返回 None
"""
if part == 'last':
match = re.findall(r"N:([^;]+);", line) # 匹配姓
else:
match = re.findall(r"N:[^;]*;([^;]+);", line) # 匹配名
return match[0] if match else None
def _convert_to_phonetic(self, name):
"""
将汉字转换为拼音,并将拼音的每个字母首字母大写
:param name: 姓或名
:return: 转换后的拼音字符串
"""
pinyin_list = self.py_engine.hanzi2pinyin(name)
return ''.join([item.capitalize() for item in pinyin_list if item])
if __name__ == '__main__':
filename = 'contacts.vcf'
generator = PhoneticGenerator(filename)
generator.convert()