Skip to content

Commit 402f69a

Browse files
committed
Merge branch 'develop'
2 parents 0b2447a + 5c337c2 commit 402f69a

8 files changed

Lines changed: 80 additions & 27 deletions

File tree

.travis.yml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
language: python
22
python:
3-
- 3.4
3+
- 3.5
44

55
sudo: false
66

@@ -9,6 +9,7 @@ env:
99
- TOX_ENV=py27
1010
- TOX_ENV=py33
1111
- TOX_ENV=py34
12+
- TOX_ENV=py35
1213
- TOX_ENV=pypy
1314
- TOX_ENV=py2_snownlp
1415
- TOX_ENV=py2_jieba

CHANGELOG.rst

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,14 @@ Changelog
22
---------
33

44

5+
0.9.0 (2015-09-20)
6+
++++++++++++++++++++
7+
8+
* **不兼容** 将拼音词典库里的国际音标字母替换为 ASCII 字母. Thanks `@MingStar`_ :
9+
* ``ɑ -> a``
10+
* ``ɡ -> g``
11+
12+
513
0.8.5 (2015-08-23)
614
++++++++++++++++++++
715

README.rst

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -170,9 +170,11 @@ Related Projects
170170

171171
* `hotoo/pinyin`__: 汉语拼音转换工具 Node.js/JavaScript 版。
172172
* `mozillazg/go-pinyin`__: 汉语拼音转换工具 Go 版。
173+
* `mozillazg/rust-pinyin`__: 汉语拼音转换工具 Rust 版。
173174

174175
__ https://github.com/hotoo/pinyin
175176
__ https://github.com/mozillazg/go-pinyin
177+
__ https://github.com/mozillazg/rust-pinyin
176178

177179

178180
.. |Build| image:: https://img.shields.io/travis/mozillazg/python-pinyin/master.svg

pypinyin/__init__.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
from . import phonetic_symbol, pinyin_dict
1515

1616
__title__ = 'pypinyin'
17-
__version__ = '0.8.5'
17+
__version__ = '0.9.0'
1818
__author__ = 'mozillazg, 闲耘'
1919
__license__ = 'MIT'
2020
__copyright__ = 'Copyright (c) 2014 mozillazg, 闲耘'
@@ -48,7 +48,7 @@
4848
# 单字拼音库
4949
PINYIN_DICT = pinyin_dict.pinyin_dict.copy()
5050
# 声母表
51-
_INITIALS = 'b,p,m,f,d,t,n,l,g,k,h,j,q,x,r,zh,ch,sh,z,c,s,'.split(',')
51+
_INITIALS = 'b,p,m,f,d,t,n,l,g,k,h,j,q,x,zh,ch,sh,r,z,c,s'.split(',')
5252
# 带声调字符与使用数字标识的字符的对应关系,类似: {u'ā': 'a1'}
5353
PHONETIC_SYMBOL = phonetic_symbol.phonetic_symbol.copy()
5454
# 所有的带声调字符

pypinyin/phrases_dict.py

Lines changed: 23 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -4733,7 +4733,7 @@
47334733
"干路": [["gàn"], ["lù"]],
47344734
"干馏": [["gān"], ["liú"]],
47354735
"干吗": [["gàn"], ["má"]],
4736-
"干嘛": [["gàn"], [""]],
4736+
"干嘛": [["gàn"], ["ma"]],
47374737
"干么": [["gàn"], ["mǒ"]],
47384738
"干娘": [["gān"], ["niáng"]],
47394739
"干呕": [["gān"], ["ǒu"]],
@@ -5266,7 +5266,7 @@
52665266
"刮削": [["guā"], ["xiāo"]],
52675267
"呱嗒": [["guā"], ["dā"]],
52685268
"呱唧": [["guā"], ["jī"]],
5269-
"呱呱": [["ɡū"], ["ɡū"]],
5269+
"呱呱": [["gū"], ["gū"]],
52705270
"寡合": [["guǎ"], ["hé"]],
52715271
"寡妻": [["guǎ"], ["qī"]],
52725272
"挂车": [["guà"], ["chē"]],
@@ -7789,7 +7789,7 @@
77897789
"咔嗒": [["kā"], ["dā"]],
77907790
"咖啡": [["kā"], ["fēi"]],
77917791
"咖喱": [["gā"], ["lí"]],
7792-
"喀吧": [["kā"], [""]],
7792+
"喀吧": [["kā"], ["ba"]],
77937793
"喀嚓": [["kā"], ["chā"]],
77947794
"卡尺": [["kǎ"], ["chǐ"]],
77957795
"卡车": [["kǎ"], ["chē"]],
@@ -8267,7 +8267,7 @@
82678267
"拉线": [["lā"], ["xiàn"]],
82688268
"拉杂": [["lā"], ["zá"]],
82698269
"拉账": [["lā"], ["zhàng"]],
8270-
"喇嘛": [["lǎ"], [""]],
8270+
"喇嘛": [["lǎ"], ["ma"]],
82718271
"腊八": [["là"], ["bā"]],
82728272
"腊肠": [["là"], ["cháng"]],
82738273
"腊梅": [["là"], ["méi"]],
@@ -9911,7 +9911,7 @@
99119911
"排版": [["pái"], ["bǎn"]],
99129912
"排笔": [["pái"], ["bǐ"]],
99139913
"排长": [["pái"], ["zhǎng"]],
9914-
"排场": [["pái"], ["chɑng"]],
9914+
"排场": [["pái"], ["chang"]],
99159915
"排除": [["pái"], ["chú"]],
99169916
"排挡": [["pái"], ["dǎng"]],
99179917
"排队": [["pái"], ["duì"]],
@@ -11049,7 +11049,7 @@
1104911049
"染坊": [["rǎn"], ["fáng"]],
1105011050
"攘臂": [["rǎng"], ["bì"]],
1105111051
"嚷叫": [["rǎng"], ["jiào"]],
11052-
"嚷嚷": [["rāng"], ["rɑng"]],
11052+
"嚷嚷": [["rāng"], ["rang"]],
1105311053
"让价": [["ràng"], ["jià"]],
1105411054
"让与": [["ràng"], ["yǔ"]],
1105511055
"饶有": [["ráo"], ["yǒu"]],
@@ -12597,7 +12597,7 @@
1259712597
"缩小": [["suō"], ["xiǎo"]],
1259812598
"缩写": [["suō"], ["xiě"]],
1259912599
"缩印": [["suō"], ["yìn"]],
12600-
"所长": [["suǒ"], ["chánɡ"]],
12600+
"所长": [["suǒ"], ["zhǎng", "cháng"]],
1260112601
"缩影": [["suō"], ["yǐng"]],
1260212602
"所得": [["suǒ"], ["de"]],
1260312603
"所说": [["suǒ"], ["shuō"]],
@@ -13708,7 +13708,7 @@
1370813708
"握别": [["wò"], ["bié"]],
1370913709
"斡旋": [["wò"], ["xuán"]],
1371013710
"乌龟": [["wū"], ["guī"]],
13711-
"乌拉": [["wù"], [""]],
13711+
"乌拉": [["wù"], ["la"]],
1371213712
"乌头": [["wū"], ["tóu"]],
1371313713
"乌有": [["wū"], ["yǒu"]],
1371413714
"污泥": [["wū"], ["ní"]],
@@ -14469,7 +14469,7 @@
1446914469
"新鲜": [["xīn"], ["xiān"]],
1447014470
"新兴": [["xīn"], ["xīng"]],
1447114471
"新雨": [["xīn"], ["yǔ"]],
14472-
"新正": [["xīn"], ["zhēnɡ"]],
14472+
"新正": [["xīn"], ["zhēng"]],
1447314473
"新语": [["xīn"], ["yǔ"]],
1447414474
"新知": [["xīn"], ["zhī"]],
1447514475
"薪传": [["xīn"], ["chuán"]],
@@ -18312,7 +18312,7 @@
1831218312
"碧空如洗": [["bì"], ["kōng"], ["rú"], ["xǐ"]],
1831318313
"碧落黄泉": [["bì"], ["luò"], ["huáng"], ["quán"]],
1831418314
"碧血丹心": [["bì"], ["xuè"], ["dān"], ["xīn"]],
18315-
"蔽聪塞明": [["bì"], ["cōnɡ"], ["sè"], ["mínɡ"]],
18315+
"蔽聪塞明": [["bì"], ["cōng"], ["sè"], ["míng"]],
1831618316
"蔽明塞聪": [["bì"], ["míng"], ["sè"], ["cōng"]],
1831718317
"蔽日干云": [["bì"], ["rì"], ["gān"], ["yún"]],
1831818318
"壁间蛇影": [["bì"], ["jiān"], ["shé"], ["yǐng"]],
@@ -20730,7 +20730,7 @@
2073020730
"达官贵要": [["dá"], ["guān"], ["guì"], ["yào"]],
2073120731
"达官要人": [["dá"], ["guān"], ["yào"], ["rén"]],
2073220732
"达官知命": [["dá"], ["guān"], ["zhī"], ["mìng"]],
20733-
"达赖喇嘛": [["dá"], ["lài"], ["lǎ"], [""]],
20733+
"达赖喇嘛": [["dá"], ["lài"], ["lǎ"], ["ma"]],
2073420734
"达姆弹": [["dá"], ["mǔ"], ["dàn"]],
2073520735
"达权知变": [["dá"], ["quán"], ["zhī"], ["biàn"]],
2073620736
"达人知命": [["dá"], ["rén"], ["zhī"], ["mìng"]],
@@ -21302,7 +21302,7 @@
2130221302
"单忧极瘁": [["dān"], ["yōu"], ["jí"], ["cuì"]],
2130321303
"单子叶植物": [["dān"], ["zi"], ["yè"], ["zhí"], ["wù"]],
2130421304
"担不是": [["dān"], ["bú"], ["shì"]],
21305-
"担担面": [["dàn"], ["dɑn"], ["miàn"]],
21305+
"担担面": [["dàn"], ["dan"], ["miàn"]],
2130621306
"担惊忍怕": [["dān"], ["jīng"], ["rěn"], ["pà"]],
2130721307
"担架队": [["dān"], ["jià"], ["duì"]],
2130821308
"担惊受恐": [["dān"], ["jīng"], ["shòu"], ["kǒng"]],
@@ -24410,7 +24410,7 @@
2441024410
"鼓睛暴眼": [["gǔ"], ["jīng"], ["bào"], ["yǎn"]],
2441124411
"鼓乐喧天": [["gǔ"], ["yuè"], ["xuān"], ["tiān"]],
2441224412
"鼓乐齐鸣": [["gǔ"], ["yuè"], ["qí"], ["míng"]],
24413-
"鼓囊囊": [["gǔ"], ["nāng"], ["nɑng"]],
24413+
"鼓囊囊": [["gǔ"], ["nāng"], ["nang"]],
2441424414
"鼓脑争头": [["gǔ"], ["nǎo"], ["zhēng"], ["tóu"]],
2441524415
"鼓旗相当": [["gǔ"], ["qí"], ["xiāng"], ["dāng"]],
2441624416
"鼓衰力尽": [["gǔ"], ["shuāi"], ["lì"], ["jìn"]],
@@ -28073,7 +28073,7 @@
2807328073
"拉下水": [["lā"], ["xià"], ["shuǐ"]],
2807428074
"拉朽摧枯": [["lā"], ["xiǔ"], ["cuī"], ["kū"]],
2807528075
"拉洋片": [["lā"], ["yáng"], ["piàn"]],
28076-
"喇嘛教": [["lǎ"], [""], ["jiào"]],
28076+
"喇嘛教": [["lǎ"], ["ma"], ["jiào"]],
2807728077
"腊八粥": [["là"], ["bā"], ["zhōu"]],
2807828078
"腊尽春回": [["là"], ["jìn"], ["chūn"], ["huí"]],
2807928079
"瘌痢头": [["là"], ["lì"], ["tóu"]],
@@ -29312,7 +29312,7 @@
2931229312
"忙中有失": [["máng"], ["zhōng"], ["yǒu"], ["shī"]],
2931329313
"芒刺在背": [["máng"], ["cì"], ["zài"], ["bèi"]],
2931429314
"芒寒色正": [["máng"], ["hán"], ["sè"], ["zhèng"]],
29315-
"尨眉皓发": [["mánɡ"], ["méi"], ["hào"], ["fà"]],
29315+
"尨眉皓发": [["máng"], ["méi"], ["hào"], ["fà"]],
2931629316
"盲风怪雨": [["máng"], ["fēng"], ["guài"], ["yǔ"]],
2931729317
"盲风暴雨": [["máng"], ["fēng"], ["bào"], ["yǔ"]],
2931829318
"盲风妒雨": [["máng"], ["fēng"], ["dù"], ["yǔ"]],
@@ -30155,7 +30155,7 @@
3015530155
"闹别扭": [["nào"], ["biè"], ["niǔ"]],
3015630156
"闹肚子": [["nào"], ["dǔ"], ["zi"]],
3015730157
"闹哄哄": [["nào"], ["hōng"], ["hǒng"]],
30158-
"闹嚷嚷": [["nào"], ["rāng"], ["rɑng"]],
30158+
"闹嚷嚷": [["nào"], ["rāng"], ["rang"]],
3015930159
"闹意见": [["nào"], ["yì"], ["jiàn"]],
3016030160
"闹着玩": [["nào"], ["zhe"], ["wán"]],
3016130161
"闹着玩儿": [["nào"], ["zhe"], ["wán"], ["ér"]],
@@ -32828,7 +32828,7 @@
3282832828
"少见多怪": [["shǎo"], ["jiàn"], ["duō"], ["guài"]],
3282932829
"少林拳": [["shǎo"], ["lín"], ["quán"]],
3283032830
"少林寺": [["shǎo"], ["lín"], ["sì"]],
32831-
"少奶奶": [["shào"], ["nǎi"], ["nɑi"]],
32831+
"少奶奶": [["shào"], ["nǎi"], ["nai"]],
3283232832
"少年犯": [["shào"], ["nián"], ["fàn"]],
3283332833
"少年宫": [["shào"], ["nián"], ["gōng"]],
3283432834
"少年老成": [["shào"], ["nián"], ["lǎo"], ["chéng"]],
@@ -33785,7 +33785,7 @@
3378533785
"耍单儿": [["shuǎ"], ["dān"], ["ér"]],
3378633786
"耍滑头": [["shuǎ"], ["huá"], ["tóu"]],
3378733787
"耍流氓": [["shuǎ"], ["liú"], ["máng"]],
33788-
"耍排场": [["shuǎ"], ["pái"], ["chɑng"]],
33788+
"耍排场": [["shuǎ"], ["pái"], ["chang"]],
3378933789
"耍态度": [["shuǎ"], ["tài"], ["dù"]],
3379033790
"耍威风": [["shuǎ"], ["wēi"], ["fēng"]],
3379133791
"衰当益壮": [["shuāi"], ["dāng"], ["yì"], ["zhuàng"]],
@@ -35670,9 +35670,9 @@
3567035670
"乌白马角": [["wū"], ["bái"], ["mǎ"], ["jiǎo"]],
3567135671
"乌骨鸡": [["wū"], ["gǔ"], ["jī"]],
3567235672
"乌合之众": [["wū"], ["hé"], ["zhī"], ["zhòng"]],
35673-
"乌拉草": [["wù"], [""], ["cǎo"]],
35674-
"乌拉尔山脉": [["wù"], [""], ["ěr"], ["shān"], ["mài"]],
35675-
"乌拉圭": [["wù"], [""], ["guī"]],
35673+
"乌拉草": [["wù"], ["la"], ["cǎo"]],
35674+
"乌拉尔山脉": [["wù"], ["la"], ["ěr"], ["shān"], ["mài"]],
35675+
"乌拉圭": [["wù"], ["la"], ["guī"]],
3567635676
"乌溜溜": [["wū"], ["liū"], ["liū"]],
3567735677
"乌鲁木齐": [["wū"], ["lǔ"], ["mù"], ["qí"]],
3567835678
"乌帽红裙": [["wū"], ["mào"], ["hóng"], ["qún"]],
@@ -36068,7 +36068,7 @@
3606836068
"西洋景": [["xī"], ["yáng"], ["jǐng"]],
3606936069
"西洋参": [["xī"], ["yáng"], ["shēn"]],
3607036070
"西印度群岛": [["xī"], ["yìn"], ["dù"], ["qún"], ["dǎo"]],
36071-
"吸风饮露": [["xī"], ["fēnɡ"], ["yǐn"], ["lù"]],
36071+
"吸风饮露": [["xī"], ["fēng"], ["yǐn"], ["lù"]],
3607236072
"吸新吐故": [["xī"], ["xīn"], ["tǔ"], ["gù"]],
3607336073
"吸铁石": [["xī"], ["tiě"], ["shí"]],
3607436074
"吸血鬼": [["xī"], ["xuè"], ["guǐ"]],
@@ -37803,7 +37803,7 @@
3780337803
"一毫不染": [["yī"], ["háo"], ["bù"], ["rǎn"]],
3780437804
"一轰而散": [["yī"], ["hōng"], ["ér"], ["sàn"]],
3780537805
"一呵而就": [["yī"], ["hē"], ["ér"], ["jiù"]],
37806-
"一哄而散": [["yī"], ["hònɡ"], ["ér"], ["sàn"]],
37806+
"一哄而散": [["yī"], ["hòng"], ["ér"], ["sàn"]],
3780737807
"一哄而起": [["yī"], ["hōng"], ["ér"], ["qǐ"]],
3780837808
"一哄而上": [["yì"], ["hōng"], ["ér"], ["shàng"]],
3780937809
"一呼百应": [["yī"], ["hū"], ["bǎi"], ["yìng"]],

setup.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -63,6 +63,7 @@ def long_description():
6363
'Programming Language :: Python :: 3',
6464
'Programming Language :: Python :: 3.3',
6565
'Programming Language :: Python :: 3.4',
66+
'Programming Language :: Python :: 3.5',
6667
'Programming Language :: Python :: Implementation :: CPython',
6768
'Programming Language :: Python :: Implementation :: PyPy',
6869
'Topic :: Utilities',

tools/ipa2ascii.py

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
1+
#!/usr/bin/env python
2+
# -*- coding: utf-8 -*-
3+
from __future__ import absolute_import, print_function, unicode_literals
4+
"""将拼音库中的国际音标字母替换为 ASCII 字母"""
5+
6+
from io import open
7+
import sys
8+
9+
10+
def ipa_map_ascii():
    """Return the character substitution table for cleaning pinyin data.

    Keys are the characters to search for; values are the ASCII letters
    that replace them.  Only the entries for ``ɑ`` and ``ɡ`` map to a
    different character.  Every other entry maps a letter to itself, so
    applying it with ``str.replace`` leaves the text unchanged.

    A new dict is built on every call, so callers may mutate the result
    freely.
    """
    return {
        'ɑ': 'a',  # IPA-style alpha -> plain ASCII "a"
        'b': 'b',
        'c': 'c',
        'd': 'd',
        'e': 'e',
        'f': 'f',
        'ɡ': 'g',  # IPA-style script g -> plain ASCII "g"
        'h': 'h',
        'i': 'i',
        'j': 'j',
        'k': 'k',
        'l': 'l',
        'm': 'm',
    }
26+
27+
28+
def main(path):
    """Rewrite the file at ``path`` in place, replacing IPA letters.

    The file is opened as UTF-8 text for reading and writing.  Every
    character listed in ``ipa_map_ascii()`` is replaced by its mapped
    ASCII letter, and the result is written back over the original
    content.

    :param path: path of the text file to convert.
    """
    with open(path, 'r+', encoding='utf8') as f:
        new_content = f.read()
        for ipa, s in ipa_map_ascii().items():
            if ipa == s:
                # Identity pair: replacing a letter with itself is a no-op.
                continue
            new_content = new_content.replace(ipa, s)
        # Overwrite from the beginning of the file.  The converted text can
        # be shorter in bytes than the original (the IPA letters are
        # multi-byte in UTF-8, their ASCII replacements are not), so cut
        # off whatever is left of the old content after the write.
        f.seek(0)
        f.write(new_content)
        f.truncate()
36+
37+
if __name__ == '__main__':
    # At least one file path is required on the command line.
    if len(sys.argv) < 2:
        sys.exit('Usage: python ipa2ascii.py FILE...')
    # Convert each named file in place, in the order given.
    for path in sys.argv[1:]:
        main(path)

tox.ini

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
# and then run "tox" from this directory.
55

66
[tox]
7-
envlist = py26, py27, py33, py34, pypy, py2_jieba, py3_jieba, py2_snownlp, py3_env
7+
envlist = py26, py27, py33, py34, py35, pypy, py2_jieba, py3_jieba, py2_snownlp, py3_env
88

99
[base]
1010
deps =

0 commit comments

Comments
 (0)