diff --git a/CHANGELOG.md b/CHANGELOG.md index 5f05e88..45bdbb1 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,10 +1,12 @@ # ChangeLog -## 0.4.0 (2016-mm-dd): +## 0.4.0 (2016-10-17): * Update PUA.txt 详见 [#7](https://github.com/mozillazg/pinyin-data/issues/7) thanks [@Artoria2e5][@Artoria2e5] * Rename PUA.txt to GBK_PUA.txt 详见 [#7](https://github.com/mozillazg/pinyin-data/issues/7) +* Add kMandarin_8105.txt (《通用规范汉字表》里 8105 个汉字最常用的一个读音) [#9][#9] [#11][#11] +* Update pinyin.txt with latest data ## 0.3.0 (2016-08-19): @@ -29,3 +31,5 @@ [@Artoria2e5]: https://github.com/Artoria2e5 +[#9]: https://github.com/mozillazg/pinyin-data/pull/9 +[#11]: https://github.com/mozillazg/pinyin-data/pull/11 diff --git a/merge_unihan.py b/merge_unihan.py index 11c7b13..f8827ae 100644 --- a/merge_unihan.py +++ b/merge_unihan.py @@ -108,6 +108,6 @@ def extend_pinyins(old_map, new_map, only_no_exists=False): assert set(overwrite_pinyin_map.keys()) - code_set == set() assert set(pua_pinyin_map.keys()) - code_set == set() with open('pinyin.txt', 'w') as fp: - fp.write('# version: 0.3.0\n') + fp.write('# version: 0.4.0\n') fp.write('# source: https://github.com/mozillazg/pinyin-data\n') save_data(new_pinyin_map, fp) diff --git a/pinyin.txt b/pinyin.txt index e8792bd..08f71d5 100644 --- a/pinyin.txt +++ b/pinyin.txt @@ -1,4 +1,4 @@ -# version: 0.3.0 +# version: 0.4.0 # source: https://github.com/mozillazg/pinyin-data U+3007: líng # 〇 U+3400: qiū # 㐀 @@ -2115,6 +2115,7 @@ U+3E01: hǎn # 㸁 U+3E03: diǎn # 㸃 U+3E04: jì # 㸄 U+3E05: jié,jí # 㸅 +U+3E06: kào # 㸆 U+3E07: zuǎn # 㸇 U+3E09: xiè # 㸉 U+3E0A: lài,là # 㸊 @@ -3709,6 +3710,7 @@ U+44E6: diǎn # 䓦 U+44E7: cì # 䓧 U+44E8: yīng # 䓨 U+44EB: qí # 䓫 +U+44EC: zhuó # 䓬 U+44ED: chà # 䓭 U+44EE: mào # 䓮 U+44EF: dú # 䓯 @@ -5888,7 +5890,7 @@ U+4E7A: suǒ # 乺 U+4E7B: yú # 乻 U+4E7C: cui # 乼 U+4E7D: zhě # 乽 -U+4E7E: gān,qián # 乾 +U+4E7E: qián,gān # 乾 U+4E7F: zhì,luàn # 乿 U+4E80: guī # 亀 U+4E81: gān # 亁 @@ -5947,7 +5949,7 @@ U+4EB5: xiè # 亵 U+4EB6: dǎn,dàn,chán,zhān # 亶 U+4EB7: lián # 亷 U+4EB8: duǒ # 亸 -U+4EB9: mén,wěi # 亹 +U+4EB9: wěi,mén # 亹 U+4EBA: rén # 人 U+4EBB: rén # 亻 U+4EBC: jí # 亼 @@ -5974,7 +5976,7 @@ U+4ED0: sǎn # 仐 U+4ED1: lún # 仑 U+4ED2: bīng # 仒 U+4ED3: cāng # 仓 -U+4ED4: zǐ,zī,zǎi # 仔 +U+4ED4: zǎi,zǐ,zī # 仔 U+4ED5: shì # 仕 U+4ED6: tā,tuó # 他 U+4ED7: zhàng # 仗 @@ -6053,7 +6055,7 @@ U+4F1F: wěi # 伟 U+4F20: chuán,zhuàn # 传 U+4F21: chē # 伡 U+4F22: yá # 伢 -U+4F23: xiàn # 伣 +U+4F23: qiàn,xiàn # 伣 U+4F24: shāng # 伤 U+4F25: chāng # 伥 U+4F26: lún # 伦 @@ -6079,7 +6081,7 @@ U+4F39: qū,zù # 伹 U+4F3A: cì,sì # 伺 U+4F3B: bēng # 伻 U+4F3C: shì,sì # 似 -U+4F3D: jiā,qié,gā # 伽 +U+4F3D: gā,jiā,qié # 伽 U+4F3E: pī # 伾 U+4F3F: yì # 伿 U+4F40: sì # 佀 @@ -13574,7 +13576,7 @@ U+6C84: yún # 沄 U+6C85: yuán # 沅 U+6C86: hàng,háng,kàng # 沆 U+6C87: yǎn,wěi # 沇 -U+6C88: chén,shěn,tán # 沈 +U+6C88: shěn,chén,tán # 沈 U+6C89: chén # 沉 U+6C8A: dàn # 沊 U+6C8B: yóu # 沋 @@ -26789,6 +26791,7 @@ U+20142: jié # 𠅂 U+2014C: yí # 𠅌 U+20157: diè # 𠅗 U+2015A: qí # 𠅚 +U+20164: xí # 𠅤 U+2016C: bāo # 𠅬 U+20171: xiè # 𠅱 U+20179: zhàng # 𠅹 @@ -34725,6 +34728,7 @@ U+2666F: dài # 𦙯 U+26671: sān # 𦙱 U+26674: zhù # 𦙴 U+26675: wàn # 𦙵 +U+26676: gǔ # 𦙶 U+26678: sān # 𦙸 U+26679: bàn # 𦙹 U+2667A: jià,jiā # 𦙺 @@ -35248,6 +35252,7 @@ U+26C16: wò # 𦰖 U+26C18: zhǐ # 𦰘 U+26C19: bì # 𦰙 U+26C1B: fén # 𦰛 +U+26C21: nà # 𦰡 U+26C25: bāng # 𦰥 U+26C2A: qiú # 𦰪 U+26C2B: nǐ # 𦰫 @@ -41232,11 +41237,17 @@ U+2A6CA: yín # 𪛊 U+2A6CE: pì # 𪛎 U+2A6D2: lián # 𪛒 U+2A79D: duó # 𪞝 +U+2A7DD: jì # 𪟝 U+2A848: bái # 𪡈 U+2A84F: zhān # 𪡏 U+2A8AE: luán # 𪢮 +U+2A8FB: lóu # 𪣻 +U+2A917: liào # 𪤗 U+2AA0A: sóng # 𪨊 U+2AA17: juē # 𪨗 +U+2AA30: qū # 𪨰 +U+2AA36: shē # 𪨶 +U+2AA58: yǎn # 𪩘 U+2AA9D: yōng # 𪪝 U+2AEB9: nǔ # 𪺹 U+2AED0: cōng # 𪻐 @@ -41245,8 +41256,11 @@ U+2B061: lì # 𫁡 U+2B088: fèi # 𫂈 U+2B099: sù # 𫂙 U+2B0DC: kòu # 𫃜 +U+2B127: yán # 𫄧 U+2B128: chī # 𫄨 +U+2B137: yì # 𫄷 U+2B138: xūn # 𫄸 +U+2B1ED: wěi # 𫇭 U+2B230: qià # 𫈰 U+2B2D0: gǒng # 𫋐 U+2B300: jī # 𫌀 @@ -41254,36 +41268,172 @@ U+2B328: luó # 𫌨 U+2B359: yì # 𫍙 U+2B35F: yí # 𫍟 U+2B362: náo # 𫍢 +U+2B363: tóng # 𫍣 +U+2B36F: xián # 𫍯 U+2B370: xǐ # 𫍰 U+2B372: xiǎo # 𫍲 +U+2B37D: xuān # 𫍽 U+2B3CB: juē,qiāo # 𫏋 U+2B404: yuè # 𫐄 U+2B406: kuài # 𫐆 U+2B409: líng # 𫐉 U+2B410: ní # 𫐐 U+2B413: bù # 𫐓 +U+2B461: méng # 𫑡 U+2B4B6: hán # 𫒶 U+2B4E7: fū # 𫓧 U+2B4E9: cōng # 𫓩 +U+2B4EF: jī # 𫓯 +U+2B4F6: xuān # 𫓶 +U+2B4F9: jī # 𫓹 +U+2B50D: fán # 𫔍 U+2B50E: jué # 𫔎 +U+2B536: niè # 𫔶 +U+2B5AE: yǐ # 𫖮 +U+2B5AF: fǔ # 𫖯 +U+2B5B3: yūn # 𫖳 U+2B5E0: zhāng # 𫗠 U+2B5E6: bù # 𫗦 U+2B5E7: sù # 𫗧 U+2B5EE: huáng # 𫗮 U+2B5F4: zhān # 𫗴 +U+2B61C: wén # 𫘜 U+2B61D: jué # 𫘝 U+2B623: hàn # 𫘣 U+2B624: ái # 𫘤 +U+2B626: táo # 𫘦 +U+2B627: lù # 𫘧 U+2B628: tí # 𫘨 +U+2B62A: yuán # 𫘪 +U+2B62C: xí # 𫘬 U+2B688: xù # 𫚈 U+2B689: hóng # 𫚉 U+2B692: fú # 𫚒 U+2B694: huí # 𫚔 U+2B695: shī # 𫚕 +U+2B696: cǐ # 𫚖 U+2B699: pū # 𫚙 +U+2B6AD: liè # 𫚭 U+2B6DB: zhī # 𫛛 U+2B6DE: jué # 𫛞 U+2B6E2: níng # 𫛢 +U+2B6ED: kuáng # 𫛭 U+2B6F6: chì # 𫛶 U+2B6F8: tí # 𫛸 +U+2B7A9: mén # 𫞩 +U+2B7C5: liáng # 𫟅 +U+2B7E6: suì # 𫟦 +U+2B7F9: hóng # 𫟹 +U+2B7FC: dá # 𫟼 +U+2B806: kuǐ # 𫠆 +U+2B80A: xuán # 𫠊 +U+2B81C: ní # 𫠜 U+2B851: yīn # 𫡑 +U+2B8B8: dàn # 𫢸 +U+2BAC7: ě # 𫫇 +U+2BB5F: ōu # 𫭟 +U+2BB62: lǔn # 𫭢 +U+2BB7C: láo # 𫭼 +U+2BB83: shàn # 𫮃 +U+2BC1B: xíng # 𫰛 +U+2BD77: lì # 𫵷 +U+2BD87: dié # 𫶇 +U+2BDF7: xīn # 𫷷 +U+2BE29: kōu # 𫸩 +U+2C029: wěi # 𬀩 +U+2C02A: xiàn # 𬀪 +U+2C0A9: jiā # 𬂩 +U+2C0CA: zhì # 𬃊 +U+2C1D5: wàn # 𬇕 +U+2C1D9: pèi # 𬇙 +U+2C1F9: guó # 𬇹 +U+2C27C: ōu # 𬉼 +U+2C288: xún # 𬊈 +U+2C2A4: chǎn # 𬊤 +U+2C317: hé # 𬌗 +U+2C35B: lì # 𬍛 +U+2C361: dàng # 𬍡 +U+2C364: xún # 𬍤 +U+2C488: què # 𬒈 +U+2C494: gěng # 𬒔 +U+2C497: lán # 𬒗 +U+2C542: gōng # 𬕂 +U+2C613: xún # 𬘓 +U+2C618: dǎn # 𬘘 +U+2C621: yīn # 𬘡 +U+2C629: tīng # 𬘩 +U+2C62B: huán # 𬘫 +U+2C62C: qiàn # 𬘬 +U+2C62D: lín # 𬘭 +U+2C62F: zhǔn # 𬘯 +U+2C642: yǎn # 𬙂 +U+2C64A: mò # 𬙊 +U+2C64B: xiāng # 𬙋 +U+2C72C: màn # 𬜬 +U+2C72F: liǎng # 𬜯 +U+2C79F: pín # 𬞟 +U+2C7C1: yì # 𬟁 +U+2C7FD: dōng # 𬟽 +U+2C8D9: xū # 𬣙 +U+2C8DE: zhǔ # 𬣞 +U+2C8E1: jiàn # 𬣡 +U+2C8F3: hěn # 𬣳 +U+2C907: yīn # 𬤇 +U+2C90A: shì # 𬤊 +U+2C91D: huì # 𬤝 +U+2CA02: qí # 𬨂 +U+2CA0E: yóu # 𬨎 +U+2CA7D: xún # 𬩽 +U+2CAA9: nóng # 𬪩 +U+2CB29: yì # 𬬩 +U+2CB2D: lún # 𬬭 +U+2CB2E: chǎng # 𬬮 +U+2CB31: jīn # 𬬱 +U+2CB38: shù # 𬬸 +U+2CB39: shén # 𬬹 +U+2CB3B: lú # 𬬻 +U+2CB3F: zhāo # 𬬿 +U+2CB41: mǔ # 𬭁 +U+2CB4A: dù # 𬭊 +U+2CB4E: hóng # 𬭎 +U+2CB5A: chún # 𬭚 +U+2CB5B: bō # 𬭛 +U+2CB64: hóu # 𬭤 +U+2CB69: wēng # 𬭩 +U+2CB6C: wèi # 𬭬 +U+2CB6F: piě # 𬭯 +U+2CB73: xǐ # 𬭳 +U+2CB76: hēi # 𬭶 +U+2CB78: lín # 𬭸 +U+2CB7C: suì # 𬭼 +U+2CBB1: yīn # 𬮱 +U+2CBBF: qí # 𬮿 +U+2CBC0: jī # 𬯀 +U+2CBCE: tuí # 𬯎 +U+2CC56: dí # 𬱖 +U+2CC5F: wěi # 𬱟 +U+2CCF5: pī # 𬳵 +U+2CCF6: jiōng # 𬳶 +U+2CCFD: shēn # 𬳽 +U+2CCFF: tú # 𬳿 +U+2CD02: fēi # 𬴂 +U+2CD03: huō # 𬴃 +U+2CD0A: lín # 𬴊 +U+2CD8B: jū # 𬶋 +U+2CD8D: tuó # 𬶍 +U+2CD8F: wéi # 𬶏 +U+2CD90: zhào # 𬶐 +U+2CD9F: là # 𬶟 +U+2CDA0: liàn # 𬶠 +U+2CDA8: jì # 𬶨 +U+2CDAD: jì # 𬶭 +U+2CDAE: xǐ # 𬶮 +U+2CDD5: bū # 𬷕 +U+2CE18: yǎn # 𬸘 +U+2CE1A: yuè # 𬸚 +U+2CE23: xiān # 𬸣 +U+2CE26: zhuó # 𬸦 +U+2CE2A: fán # 𬸪 +U+2CE7C: xiè # 𬹼 +U+2CE88: yǐ # 𬺈 +U+2CE93: chǔ # 𬺓