o
    
j                     @   s  d dl Z d dlZd dlZd dlZd dlZd dlZdZdZdZdZ	dZ
dZdZdZdZd	Zd
ZddgZddgZddgZddgZddgZdZeeZg dZdZdZdZdZdZee Zeej  Z!e"#e!de$e! dZ%i dddd d!d"d#d$d%d&d'd(d)d*d+d,d-d.d/d0d1d2d3d4d5dd6d7d8d9d:d;d<d=i d>d?d@dAdBdCdDdEdFdGdHdIdJdKdLdMdNdOdPdQdRdSdTdUdVdWdXdYdZd[d\d]d^d_i d`dadbdcdddedfdgdhdidjdkdldmdndodpdqdrdsdtdudvdwdxdydzd{d|d}d~dddi ddddddddddddddddddddddddddddddddddi ddddddddddddddddddddddddddddddddÓddœdddddddddddМ
Z&e"#d'e&( d'e&) dZ*dZ+dZ,e+e, Z-ddԄ e-D Z.ej/ej0 Z1ddԄ e1D Z2e-e1 d Z3ddԄ e3D Z4G dd؄ de5Z6G ddڄ de6Z7G dd܄ de6Z8G ddބ de6Z9e6e7e8e9f\Z:Z;Z<Z=G dd de5Z>G dd de5Z?ed fddZ@ed fddZAed dddddddfddZBG dd dZCG dd dZDG dd dZEG dd dZFG dd dZGG dd dZHG dd dZIdd ZJdd ZKdd ZLG d d dZMeNdkrhe O ZPePjQdddd ePjQdddd ePjQd	dd
d ePjQdddd ePjQdddd ePjQdddd ePjQdddd ePjQdg dddd ePjQdeRddd ePjQdddd ePjQde"g ddd d! ePjQd"d#d$ ePjQd%d&d$ ePS ZTeTjUrd'eT_VeMeTjWeTjXeTjYeTjZeTjKeTj[eTjLeTj\d(Z]eMeTjWeTjXeTjYeTjZeTjKeTj[eTjLeTj\d(Z]d Z^e_eTj`dd)d*Zae_eTjbd+d)d*ZceTjVd,krejdead-d.Zed/eejfv soJ egd-'eejfecd0 eeD ]EZhehd/ Zieire]eiZieireiehd/< egd-'d1d2 eejfD ecd0 e^d7 Z^e^eTjj d kregd3e^ d4ejkdd5 q}nseaD ]pZld6\ZmZieTjVd'kreln jodd7Zpepd  e$epd8krepd ndZmZineln Zieire]eiZieireTjVd'kregemd- ei ecd0 negeiecd0 e^d7 Z^e^eTjj d kr5egd3e^ d4ejkdd5 qW d   n	1 sBw   Y  W d   n	1 sRw   Y  egd3e^ d9ejkdd5 dS dS (:      Nu   零一二三四五六七八九u   零壹贰叁肆伍陆柒捌玖u   零壹貳參肆伍陸柒捌玖u   十百千万u   拾佰仟萬u   亿兆京垓秭穰沟涧正载u   億兆京垓秭穰溝澗正載u   〇u   幺u   两u   兩u   正u   负u   負u   点u   點u   呃u   啊u_  (儿女|儿子|儿孙|女儿|儿媳|妻儿|胎儿|婴儿|新生儿|婴幼儿|幼儿|少儿|小儿|儿歌|儿童|儿科|托儿所|孤儿|儿戏|儿化|台儿庄|鹿儿岛|正儿八经|吊儿郎当|生儿育女|托儿带女|养儿防老|痴儿呆女|佳儿佳妇|儿怜兽扰|儿无常父|儿不嫌母丑|儿行千里母担忧|儿大不由爷|苏乞儿))lowmidhighu   (人民币|美元|日元|英镑|欧元|马克|法郎|加拿大元|澳元|港币|先令|芬兰马克|爱尔兰镑|里拉|荷兰盾|埃斯库多|比塞塔|印尼盾|林吉特|新西兰元|比索|卢布|新加坡元|韩元|泰铢)uu   ((亿|千万|百万|万|千|百)|(亿|千万|百万|万|千|百|)元|(亿|千万|百万|万|千|百|)块|角|毛|分)u  (匹|张|座|回|场|尾|条|个|首|阙|阵|网|炮|顶|丘|棵|只|支|袭|辆|挑|担|颗|壳|窠|曲|墙|群|腔|砣|座|客|贯|扎|捆|刀|令|打|手|罗|坡|山|岭|江|溪|钟|队|单|双|对|出|口|头|脚|板|跳|枝|件|贴|针|线|管|名|位|身|堂|课|本|页|家|户|层|丝|毫|厘|分|钱|两|斤|担|铢|石|钧|锱|忽|(千|毫|微)克|毫|厘|分|寸|尺|丈|里|寻|常|铺|程|(千|分|厘|毫|微)米|撮|勺|合|升|斗|石|盘|碗|碟|叠|桶|笼|盆|盒|杯|钟|斛|锅|簋|篮|盘|桶|罐|瓶|壶|卮|盏|箩|箱|煲|啖|袋|钵|年|月|日|季|刻|时|周|天|秒|分|旬|纪|岁|世|更|夜|春|夏|秋|冬|代|伏|辈|丸|泡|粒|颗|幢|堆|条|根|支|道|面|片|张|颗|块)u   ！？｡。u   ＂＃＄％＆＇（）＊＋，－／：；＜＝＞＠［＼］＾＿｀｛｜｝～｟｠｢｣､、〃《》「」『』【】〔〕〖〗〘〙〚〛〜〝〞〟〰〾〿–—‘’‛“”„‟…‧﹏·〈〉-, u   　 u   ！!u   ＂"u   ＃#u   ＄$   ％%u   ＆&u   ＇'u   （(u   ）)u   ＊*u   ＋+u   ，u   －-u   ．.u   ／/u   ０0u   １1u   ２2u   ３3u   ４4u   ５5u   ６6u   ７7u   ８8u   ９9u   ：:u   ；;u   ＜<u   ＝=u   ＞>u   ？?u   ＠@u   ＡAu   ＢBu   ＣCu   ＤDu   ＥEu   ＦFu   ＧGu   ＨHu   ＩIu   ＪJu   ＫKu   ＬLu   ＭMu   ＮNu   ＯOu   ＰPu   ＱQu   ＲRu   ＳSu   ＴTu   ＵUu   ＶVu   ＷWu   ＸXu   ＹYu   ＺZu   ［[u   ＼\u   ］]u   ＾^u   ＿_u   ｀`u   ａau   ｂbu   ｃcu   ｄdu   ｅeu   ｆfu   ｇgu   ｈhu   ｉiu   ｊju   ｋku   ｌlu   ｍmu   ｎnu   ｏou   ｐpu   ｑqu   ｒru   ｓsu   ｔtuvwxyz{|}~)
u   ｕu   ｖu   ｗu   ｘu   ｙu   ｚu   ｛u   ｜u   ｝u   ～u_  一丁七万丈三上下不与丏丐丑专且丕世丘丙业丛东丝丞丢两严丧个丫中丰串临丸丹为主丽举乂乃久么义之乌乍乎乏乐乒乓乔乖乘乙乜九乞也习乡书乩买乱乳乸乾了予争事二亍于亏云互亓五井亘亚些亟亡亢交亥亦产亨亩享京亭亮亲亳亵亶亸亹人亿什仁仂仃仄仅仆仇仉今介仍从仑仓仔仕他仗付仙仝仞仟仡代令以仨仪仫们仰仲仳仵件价任份仿企伈伉伊伋伍伎伏伐休众优伙会伛伞伟传伢伣伤伥伦伧伪伫伭伯估伲伴伶伸伺似伽伾佁佃但位低住佐佑体何佖佗佘余佚佛作佝佞佟你佣佤佥佩佬佯佰佳佴佶佸佺佻佼佽佾使侁侂侃侄侈侉例侍侏侑侔侗侘供依侠侣侥侦侧侨侩侪侬侮侯侴侵侹便促俄俅俊俍俎俏俐俑俗俘俙俚俜保俞俟信俣俦俨俩俪俫俭修俯俱俳俵俶俸俺俾倌倍倏倒倓倔倕倘候倚倜倞借倡倥倦倧倨倩倪倬倭倮倴债倻值倾偁偃假偈偌偎偏偓偕做停偡健偬偭偰偲偶偷偻偾偿傀傃傅傈傉傍傒傕傣傥傧储傩催傲傺傻僇僎像僔僖僚僦僧僬僭僮僰僳僵僻儆儇儋儒儡儦儳儴儿兀允元兄充兆先光克免兑兔兕兖党兜兢入全八公六兮兰共关兴兵其具典兹养兼兽冀冁内冈冉册再冏冒冔冕冗写军农冠冢冤冥冬冮冯冰冱冲决况冶冷冻冼冽净凄准凇凉凋凌减凑凓凘凛凝几凡凤凫凭凯凰凳凶凸凹出击凼函凿刀刁刃分切刈刊刍刎刑划刖列刘则刚创初删判刨利别刬刭刮到刳制刷券刹刺刻刽刿剀剁剂剃剅削剋剌前剐剑剔剕剖剜剞剟剡剥剧剩剪副割剽剿劁劂劄劈劐劓力劝办功加务劢劣动助努劫劬劭励劲劳劼劾势勃勇勉勋勍勐勒勔勖勘勚募勠勤勰勺勾勿匀包匆匈匍匏匐匕化北匙匜匝匠匡匣匦匪匮匹区医匼匾匿十千卅升午卉半华协卑卒卓单卖南博卜卞卟占卡卢卣卤卦卧卫卬卮卯印危即却卵卷卸卺卿厂厄厅历厉压厌厍厕厖厘厚厝原厢厣厥厦厨厩厮去厾县叁参叆叇又叉及友双反发叔叕取受变叙叚叛叟叠口古句另叨叩只叫召叭叮可台叱史右叵叶号司叹叻叼叽吁吃各吆合吉吊同名后吏吐向吒吓吕吖吗君吝吞吟吠吡吣否吧吨吩含听吭吮启吱吲吴吵吸吹吻吼吽吾呀呃呆呇呈告呋呐呒呓呔呕呖呗员呙呛呜呢呣呤呦周呱呲味呵呶呷呸呻呼命咀咂咄咆咇咉咋和咍咎咏咐咒咔咕咖咙咚咛咝咡咣咤咥咦咧咨咩咪咫咬咯咱咳咴咸咺咻咽咿哀品哂哃哄哆哇哈哉哌响哎哏哐哑哒哓哔哕哗哙哚哝哞哟哢哥哦哧哨哩哪哭哮哱哲哳哺哼哽哿唁唆唇唉唏唐唑唔唛唝唠唢唣唤唧唪唬售唯唰唱唳唵唷唼唾唿啁啃啄商啉啊啐啕啖啜啡啤啥啦啧啪啫啬啭啮啰啴啵啶啷啸啻啼啾喀喁喂喃善喆喇喈喉喊喋喏喑喔喘喙喜喝喟喤喧喱喳喵喷喹喻喽喾嗄嗅嗉嗌嗍嗐嗑嗒嗓嗔嗖嗜嗝嗞嗟嗡嗣嗤嗥嗦嗨嗪嗫嗬嗯嗲嗳嗵嗷嗽嗾嘀嘁嘈嘉嘌嘎嘏嘘嘚嘛嘞嘟嘡嘣嘤嘧嘬嘭嘱嘲嘴嘶嘹嘻嘿噀噂噇噌噍噎噔噗噘噙噜噢噤器噩噪噫噬噱噶噻噼嚄嚅嚆嚎嚏嚓嚚嚣嚭嚯嚷嚼囊囔囚四回囟因囡团囤囫园困囱围囵囷囹固国图囿圃圄圆圈圉圊圌圐圙圜土圢圣在圩圪圫圬圭圮圯地圲圳圹场圻圾址坂均坉坊坋坌坍坎坏坐坑坒块坚坛坜坝坞坟坠坡坤坥坦坨坩坪坫坬坭坯坰坳坷坻坼坽垂垃垄垆垈型垌垍垎垏垒垓垕垙垚垛垞垟垠垡垢垣垤垦垧垩垫垭垮垯垱垲垴垵垸垺垾垿埂埃埆埇埋埌城埏埒埔埕埗埘埙埚埝域埠埤埪埫埭埯埴埵埸培基埼埽堂堃堆堇堉堋堌堍堎堐堑堕堙堞堠堡堤堧堨堪堰堲堵堼堽堾塄塅塆塌塍塑塔塘塝塞塥填塬塱塾墀墁境墅墈墉墐墒墓墕墘墙墚增墟墡墣墦墨墩墼壁壅壑壕壤士壬壮声壳壶壸壹处备复夏夐夔夕外夙多夜够夤夥大天太夫夬夭央夯失头夷夸夹夺夼奁奂奄奇奈奉奋奎奏契奓奔奕奖套奘奚奠奡奢奥奭女奴奶奸她好妁如妃妄妆妇妈妊妍妒妓妖妗妘妙妞妣妤妥妧妨妩妪妫妭妮妯妲妹妻妾姆姈姊始姐姑姒姓委姗姘姚姜姝姞姣姤姥姨姬姮姱姶姹姻姽姿娀威娃娄娅娆娇娈娉娌娑娓娘娜娟娠娣娥娩娱娲娴娵娶娼婀婆婉婊婌婍婕婘婚婞婠婢婤婧婪婫婳婴婵婶婷婺婻婼婿媂媄媆媒媓媖媚媛媞媪媭媱媲媳媵媸媾嫁嫂嫄嫉嫌嫒嫔嫕嫖嫘嫚嫜嫠嫡嫣嫦嫩嫪嫫嫭嫱嫽嬉嬖嬗嬛嬥嬬嬴嬷嬿孀孅子孑孓孔孕孖字存孙孚孛孜孝孟孢季孤孥学孩孪孬孰孱孳孵孺孽宁它宄宅宇守安宋完宏宓宕宗官宙定宛宜宝实宠审客宣室宥宦宧宪宫宬宰害宴宵家宸容宽宾宿寁寂寄寅密寇富寐寒寓寝寞察寡寤寥寨寮寰寸对寺寻导寿封射将尉尊小少尔尕尖尘尚尜尝尢尤尥尧尨尪尬就尴尸尹尺尻尼尽尾尿局屁层屃居屈屉届屋屎屏屐屑展屙属屠屡屣履屦屯山屹屺屼屾屿岁岂岈岊岌岍岐岑岔岖岗岘岙岚岛岜岞岠岢岣岨岩岫岬岭岱岳岵岷岸岽岿峁峂峃峄峋峒峗峘峙峛峡峣峤峥峦峧峨峪峭峰峱峻峿崀崁崂崃崄崆崇崌崎崒崔崖崚崛崞崟崡崤崦崧崩崭崮崴崶崽崾崿嵁嵅嵇嵊嵋嵌嵎嵖嵘嵚嵛嵝嵩嵫嵬嵯嵲嵴嶂嶅嶍嶒嶓嶙嶝嶟嶦嶲嶷巅巇巉巍川州巡巢工左巧巨巩巫差巯己已巳巴巷巽巾币市布帅帆师希帏帐帑帔帕帖帘帙帚帛帜帝帡带帧帨席帮帱帷常帻帼帽幂幄幅幌幔幕幖幛幞幡幢幪干平年并幸幺幻幼幽广庄庆庇床庋序庐庑库应底庖店庙庚府庞废庠庤庥度座庭庱庳庵庶康庸庹庼庾廆廉廊廋廑廒廓廖廙廛廨廪延廷建廿开弁异弃弄弆弇弈弊弋式弑弓引弗弘弛弟张弢弥弦弧弨弩弭弯弱弶弸弹强弼彀归当录彖彗彘彝彟形彤彦彧彩彪彬彭彰影彳彷役彻彼往征徂径待徇很徉徊律徐徒徕得徘徙徛徜御徨循徭微徵德徼徽心必忆忉忌忍忏忐忑忒忖志忘忙忝忞忠忡忤忧忪快忭忮忱忳念忸忺忻忽忾忿怀态怂怃怄怅怆怊怍怎怏怒怔怕怖怙怛怜思怠怡急怦性怨怩怪怫怯怵总怼怿恁恂恃恋恍恐恒恓恔恕恙恚恝恢恣恤恧恨恩恪恫恬恭息恰恳恶恸恹恺恻恼恽恿悃悄悆悈悉悌悍悒悔悖悚悛悝悟悠悢患悦您悫悬悭悯悰悱悲悴悸悻悼情惆惇惊惋惎惑惔惕惘惙惚惛惜惝惟惠惦惧惨惩惫惬惭惮惯惰想惴惶惹惺愀愁愃愆愈愉愍愎意愐愔愕愚感愠愣愤愦愧愫愭愿慆慈慊慌慎慑慕慝慢慥慧慨慬慭慰慵慷憋憎憔憕憙憧憨憩憬憭憷憺憾懂懈懊懋懑懒懔懦懵懿戆戈戊戋戌戍戎戏成我戒戕或戗战戚戛戟戡戢戣戤戥截戬戭戮戳戴户戽戾房所扁扂扃扅扆扇扈扉扊手才扎扑扒打扔托扛扞扣扦执扩扪扫扬扭扮扯扰扳扶批扺扼扽找承技抃抄抉把抑抒抓抔投抖抗折抚抛抟抠抡抢护报抨披抬抱抵抹抻押抽抿拂拃拄担拆拇拈拉拊拌拍拎拐拒拓拔拖拗拘拙招拜拟拢拣拤拥拦拧拨择括拭拮拯拱拳拴拶拷拼拽拾拿持挂指挈按挎挑挓挖挚挛挝挞挟挠挡挣挤挥挦挨挪挫振挲挹挺挽捂捃捅捆捉捋捌捍捎捏捐捕捞损捡换捣捧捩捭据捯捶捷捺捻捽掀掂掇授掉掊掌掎掏掐排掖掘掞掠探掣接控推掩措掬掭掮掰掳掴掷掸掺掼掾揄揆揉揍描提插揕揖揠握揣揩揪揭揳援揶揸揽揿搀搁搂搅搋搌搏搐搒搓搔搛搜搞搠搡搦搪搬搭搴携搽摁摄摅摆摇摈摊摏摒摔摘摛摞摧摩摭摴摸摹摽撂撄撅撇撑撒撕撖撙撞撤撩撬播撮撰撵撷撸撺撼擀擂擅操擎擐擒擘擞擢擤擦擿攀攉攒攘攥攫攮支收攸改攻攽放政故效敉敌敏救敔敕敖教敛敝敞敢散敦敩敫敬数敲整敷文斋斌斐斑斓斗料斛斜斝斟斠斡斤斥斧斩斫断斯新斶方於施旁旃旄旅旆旋旌旎族旐旒旖旗旞无既日旦旧旨早旬旭旮旯旰旱旴旵时旷旸旺旻旿昀昂昃昄昆昇昈昉昊昌明昏昒易昔昕昙昝星映昡昣昤春昧昨昪昫昭是昱昳昴昵昶昺昼昽显晁晃晅晊晋晌晏晐晒晓晔晕晖晗晙晚晞晟晡晢晤晦晨晪晫普景晰晱晴晶晷智晾暂暄暅暇暌暑暕暖暗暝暧暨暮暲暴暵暶暹暾暿曈曌曙曛曜曝曦曩曰曲曳更曷曹曼曾替最月有朋服朏朐朓朔朕朗望朝期朦木未末本札术朱朳朴朵朸机朽杀杂权杄杆杈杉杌李杏材村杓杕杖杙杜杞束杠条来杧杨杩杪杭杯杰杲杳杵杷杻杼松板极构枅枇枉枋枍析枕林枘枚果枝枞枢枣枥枧枨枪枫枭枯枰枲枳枵架枷枸枹柁柃柄柈柊柏某柑柒染柔柖柘柙柚柜柝柞柠柢查柩柬柯柰柱柳柴柷柽柿栀栅标栈栉栊栋栌栎栏栐树栒栓栖栗栝栟校栩株栲栳栴样核根栻格栽栾桀桁桂桃桄桅框案桉桊桌桎桐桑桓桔桕桠桡桢档桤桥桦桧桨桩桫桯桲桴桶桷桹梁梃梅梆梌梏梓梗梠梢梣梦梧梨梭梯械梳梴梵梼梽梾梿检棁棂棉棋棍棐棒棓棕棘棚棠棣棤棨棪棫棬森棰棱棵棹棺棻棼棽椀椁椅椆椋植椎椐椑椒椓椟椠椤椪椭椰椴椸椹椽椿楂楒楔楗楙楚楝楞楠楣楦楩楪楫楮楯楷楸楹楼概榃榄榅榆榇榈榉榍榑榔榕榖榛榜榧榨榫榭榰榱榴榷榻槁槃槊槌槎槐槔槚槛槜槟槠槭槱槲槽槿樊樗樘樟模樨横樯樱樵樽樾橄橇橐橑橘橙橛橞橡橥橦橱橹橼檀檄檎檐檑檗檞檠檩檫檬櫆欂欠次欢欣欤欧欲欸欹欺欻款歃歅歆歇歉歌歙止正此步武歧歪歹死歼殁殂殃殄殆殇殉殊残殍殒殓殖殚殛殡殣殪殳殴段殷殿毁毂毅毋毌母每毐毒毓比毕毖毗毙毛毡毪毫毯毳毵毹毽氅氆氇氍氏氐民氓气氕氖氘氙氚氛氟氡氢氤氦氧氨氩氪氮氯氰氲水永氾氿汀汁求汆汇汈汉汊汋汐汔汕汗汛汜汝汞江池污汤汧汨汩汪汫汭汰汲汴汶汹汽汾沁沂沃沄沅沆沇沈沉沌沏沐沓沔沘沙沚沛沟没沣沤沥沦沧沨沩沪沫沭沮沱河沸油沺治沼沽沾沿泂泃泄泅泇泉泊泌泐泓泔法泖泗泙泚泛泜泞泠泡波泣泥注泪泫泮泯泰泱泳泵泷泸泺泻泼泽泾洁洄洇洈洋洌洎洑洒洓洗洘洙洚洛洞洢洣津洧洨洪洫洭洮洱洲洳洴洵洸洹洺活洼洽派洿流浃浅浆浇浈浉浊测浍济浏浐浑浒浓浔浕浙浚浛浜浞浟浠浡浣浥浦浩浪浬浭浮浯浰浲浴海浸浼涂涄涅消涉涌涍涎涐涑涓涔涕涘涛涝涞涟涠涡涢涣涤润涧涨涩涪涫涮涯液涴涵涸涿淀淄淅淆淇淋淌淏淑淖淘淙淜淝淞淟淠淡淤淦淫淬淮淯深淳淴混淹添淼清渊渌渍渎渐渑渔渗渚渝渟渠渡渣渤渥温渫渭港渰渲渴游渺渼湃湄湉湍湎湑湓湔湖湘湛湜湝湟湣湫湮湲湴湾湿溁溃溅溆溇溉溍溏源溘溚溜溞溟溠溢溥溦溧溪溯溱溲溴溵溶溷溹溺溻溽滁滂滃滆滇滉滋滍滏滑滓滔滕滗滘滚滞滟滠满滢滤滥滦滧滨滩滪滫滴滹漂漆漈漉漋漏漓演漕漖漠漤漦漩漪漫漭漯漱漳漴漶漷漹漻漼漾潆潇潋潍潏潖潘潜潞潟潢潦潩潭潮潲潴潵潸潺潼潽潾澂澄澈澉澌澍澎澛澜澡澥澧澪澭澳澴澶澹澼澽激濂濉濋濑濒濞濠濡濩濮濯瀌瀍瀑瀔瀚瀛瀣瀱瀵瀹瀼灈灌灏灞火灭灯灰灵灶灸灼灾灿炀炅炆炉炊炌炎炒炔炕炖炘炙炜炝炟炣炫炬炭炮炯炱炳炷炸点炻炼炽烀烁烂烃烈烊烔烘烙烛烜烝烟烠烤烦烧烨烩烫烬热烯烶烷烹烺烻烽焆焉焊焌焐焓焕焖焗焘焙焚焜焞焦焯焰焱然煁煃煅煊煋煌煎煓煜煞煟煤煦照煨煮煲煳煴煸煺煽熄熇熊熏熔熘熙熛熜熟熠熥熨熬熵熹熻燃燊燋燎燏燔燕燚燠燥燧燮燹爆爇爔爚爝爟爨爪爬爰爱爵父爷爸爹爻爽爿牁牂片版牌牍牒牖牙牚牛牝牟牡牢牤牥牦牧物牮牯牲牵特牺牻牾牿犀犁犄犇犊犋犍犏犒犟犨犬犯犰犴状犷犸犹狁狂狃狄狈狉狍狎狐狒狗狙狝狞狠狡狨狩独狭狮狯狰狱狲狳狴狷狸狺狻狼猁猃猄猇猊猎猕猖猗猛猜猝猞猡猢猥猩猪猫猬献猯猰猱猴猷猹猺猾猿獍獐獒獗獠獬獭獯獴獾玃玄率玉王玎玑玒玓玕玖玘玙玚玛玞玟玠玡玢玤玥玦玩玫玭玮环现玱玲玳玶玷玹玺玻玼玿珀珂珅珇珈珉珊珋珌珍珏珐珑珒珕珖珙珛珝珞珠珢珣珥珦珧珩珪珫班珰珲珵珷珸珹珺珽琀球琄琅理琇琈琉琊琎琏琐琔琚琛琟琡琢琤琥琦琨琪琫琬琭琮琯琰琲琳琴琵琶琼瑀瑁瑂瑃瑄瑅瑆瑑瑓瑔瑕瑖瑗瑙瑚瑛瑜瑝瑞瑟瑢瑧瑨瑬瑭瑰瑱瑳瑶瑷瑾璀璁璃璆璇璈璋璎璐璒璘璜璞璟璠璥璧璨璩璪璬璮璱璲璺瓀瓒瓖瓘瓜瓞瓠瓢瓣瓤瓦瓮瓯瓴瓶瓷瓻瓿甄甍甏甑甓甗甘甚甜生甡甥甦用甩甪甫甬甭甯田由甲申电男甸町画甾畀畅畈畋界畎畏畔畖留畚畛畜畤略畦番畬畯畲畴畸畹畿疁疃疆疍疏疐疑疔疖疗疙疚疝疟疠疡疢疣疤疥疫疬疭疮疯疰疱疲疳疴疵疸疹疼疽疾痂痃痄病症痈痉痊痍痒痓痔痕痘痛痞痢痣痤痦痧痨痪痫痰痱痴痹痼痿瘀瘁瘃瘅瘆瘊瘌瘐瘕瘗瘘瘙瘛瘟瘠瘢瘤瘥瘦瘩瘪瘫瘭瘰瘳瘴瘵瘸瘼瘾瘿癀癃癌癍癔癖癗癜癞癣癫癯癸登白百癿皂的皆皇皈皋皎皑皓皕皖皙皛皞皤皦皭皮皱皲皴皿盂盅盆盈盉益盍盎盏盐监盒盔盖盗盘盛盟盥盦目盯盱盲直盷相盹盼盾省眄眇眈眉眊看眍眙眚真眠眢眦眨眩眬眭眯眵眶眷眸眺眼着睁睃睄睇睎睐睑睚睛睡睢督睥睦睨睫睬睹睽睾睿瞀瞄瞅瞋瞌瞍瞎瞑瞒瞟瞠瞢瞥瞧瞩瞪瞫瞬瞭瞰瞳瞵瞻瞽瞿矍矗矛矜矞矢矣知矧矩矫矬短矮矰石矶矸矻矼矾矿砀码砂砄砆砉砌砍砑砒研砖砗砘砚砜砝砟砠砣砥砧砫砬砭砮砰破砵砷砸砹砺砻砼砾础硁硅硇硊硌硍硎硐硒硔硕硖硗硙硚硝硪硫硬硭确硼硿碃碇碈碉碌碍碎碏碑碓碗碘碚碛碜碟碡碣碥碧碨碰碱碲碳碴碶碹碾磁磅磉磊磋磏磐磔磕磙磜磡磨磬磲磴磷磹磻礁礅礌礓礞礴礵示礼社祀祁祃祆祇祈祉祊祋祎祏祐祓祕祖祗祚祛祜祝神祟祠祢祥祧票祭祯祲祷祸祺祼祾禀禁禄禅禊禋福禒禔禘禚禛禤禧禳禹禺离禽禾秀私秃秆秉秋种科秒秕秘租秣秤秦秧秩秫秬秭积称秸移秽秾稀稂稃稆程稌稍税稑稔稗稙稚稞稠稣稳稷稹稻稼稽稿穄穆穑穗穙穜穟穰穴究穷穸穹空穿窀突窃窄窅窈窊窍窎窑窒窕窖窗窘窜窝窟窠窣窥窦窨窬窭窳窸窿立竑竖竘站竞竟章竣童竦竫竭端竹竺竽竿笃笄笆笈笊笋笏笑笔笕笙笛笞笠笤笥符笨笪笫第笮笯笱笳笸笺笼笾筀筅筇等筋筌筏筐筑筒答策筘筚筛筜筝筠筢筤筥筦筮筱筲筵筶筷筹筻筼签简箅箍箐箓箔箕箖算箜管箢箦箧箨箩箪箫箬箭箱箴箸篁篆篇篌篑篓篙篚篝篡篥篦篪篮篯篱篷篼篾簃簇簉簋簌簏簕簖簝簟簠簧簪簰簸簿籀籁籍籥米籴类籼籽粉粑粒粕粗粘粜粝粞粟粢粤粥粪粮粱粲粳粹粼粽精粿糁糅糇糈糊糌糍糒糕糖糗糙糜糟糠糨糯糵系紊素索紧紫累絜絮絷綦綮縠縢縻繁繄繇纂纛纠纡红纣纤纥约级纨纩纪纫纬纭纮纯纰纱纲纳纴纵纶纷纸纹纺纻纼纽纾线绀绁绂练组绅细织终绉绊绋绌绍绎经绐绑绒结绔绕绖绗绘给绚绛络绝绞统绠绡绢绣绤绥绦继绨绩绪绫续绮绯绰绱绲绳维绵绶绷绸绹绺绻综绽绾绿缀缁缂缃缄缅缆缇缈缉缊缌缎缐缑缒缓缔缕编缗缘缙缚缛缜缝缞缟缠缡缢缣缤缥缦缧缨缩缪缫缬缭缮缯缰缱缲缳缴缵缶缸缺罂罄罅罍罐网罔罕罗罘罚罟罡罢罨罩罪置罱署罴罶罹罽罾羁羊羌美羑羓羔羕羖羚羝羞羟羡群羧羯羰羱羲羸羹羼羽羿翀翁翂翃翅翈翊翌翎翔翕翘翙翚翛翟翠翡翥翦翩翮翯翰翱翳翷翻翼翾耀老考耄者耆耇耋而耍耏耐耑耒耔耕耖耗耘耙耜耠耢耤耥耦耧耨耩耪耰耱耳耵耶耷耸耻耽耿聂聃聆聊聋职聍聒联聘聚聩聪聱聿肃肄肆肇肉肋肌肓肖肘肚肛肝肟肠股肢肤肥肩肪肫肭肮肯肱育肴肷肸肺肼肽肾肿胀胁胂胃胄胆胈背胍胎胖胗胙胚胛胜胝胞胠胡胣胤胥胧胨胩胪胫胬胭胯胰胱胲胳胴胶胸胺胼能脂脆脉脊脍脎脏脐脑脒脓脔脖脘脚脞脟脩脬脯脱脲脶脸脾脿腆腈腊腋腌腐腑腒腓腔腕腘腙腚腠腥腧腨腩腭腮腯腰腱腴腹腺腻腼腽腾腿膀膂膈膊膏膑膘膙膛膜膝膦膨膳膺膻臀臂臃臆臊臌臑臜臣臧自臬臭至致臻臼臾舀舁舂舄舅舆舌舍舐舒舔舛舜舞舟舠舢舣舥航舫般舭舯舰舱舲舳舴舵舶舷舸船舻舾艄艅艇艉艋艎艏艘艚艟艨艮良艰色艳艴艺艽艾艿节芃芄芈芊芋芍芎芏芑芒芗芘芙芜芝芟芠芡芣芤芥芦芨芩芪芫芬芭芮芯芰花芳芴芷芸芹芼芽芾苁苄苇苈苉苊苋苌苍苎苏苑苒苓苔苕苗苘苛苜苞苟苠苡苣苤若苦苧苫苯英苴苷苹苻苾茀茁茂范茄茅茆茈茉茋茌茎茏茑茓茔茕茗茚茛茜茝茧茨茫茬茭茯茱茳茴茵茶茸茹茺茼茽荀荁荃荄荆荇草荏荐荑荒荓荔荖荙荚荛荜荞荟荠荡荣荤荥荦荧荨荩荪荫荬荭荮药荷荸荻荼荽莅莆莉莎莒莓莘莙莛莜莝莞莠莨莩莪莫莰莱莲莳莴莶获莸莹莺莼莽莿菀菁菂菅菇菉菊菌菍菏菔菖菘菜菝菟菠菡菥菩菪菰菱菲菹菼菽萁萃萄萆萋萌萍萎萏萑萘萚萜萝萣萤营萦萧萨萩萱萳萸萹萼落葆葎葑葖著葙葚葛葜葡董葩葫葬葭葰葱葳葴葵葶葸葺蒂蒄蒇蒈蒉蒋蒌蒎蒐蒗蒙蒜蒟蒡蒨蒯蒱蒲蒴蒸蒹蒺蒻蒽蒿蓁蓂蓄蓇蓉蓊蓍蓏蓐蓑蓓蓖蓝蓟蓠蓢蓣蓥蓦蓬蓰蓼蓿蔀蔃蔈蔊蔌蔑蔓蔗蔚蔟蔡蔫蔬蔷蔸蔹蔺蔻蔼蔽蕃蕈蕉蕊蕖蕗蕙蕞蕤蕨蕰蕲蕴蕹蕺蕻蕾薁薄薅薇薏薛薜薢薤薨薪薮薯薰薳薷薸薹薿藁藉藏藐藓藕藜藟藠藤藦藨藩藻藿蘅蘑蘖蘘蘧蘩蘸蘼虎虏虐虑虒虓虔虚虞虢虤虫虬虮虱虷虸虹虺虻虼虽虾虿蚀蚁蚂蚄蚆蚊蚋蚌蚍蚓蚕蚜蚝蚣蚤蚧蚨蚩蚪蚬蚯蚰蚱蚲蚴蚶蚺蛀蛃蛄蛆蛇蛉蛊蛋蛎蛏蛐蛑蛔蛘蛙蛛蛞蛟蛤蛩蛭蛮蛰蛱蛲蛳蛴蛸蛹蛾蜀蜂蜃蜇蜈蜉蜊蜍蜎蜐蜒蜓蜕蜗蜘蜚蜜蜞蜡蜢蜣蜥蜩蜮蜱蜴蜷蜻蜾蜿蝇蝈蝉蝌蝎蝓蝗蝘蝙蝠蝣蝤蝥蝮蝰蝲蝴蝶蝻蝼蝽蝾螂螃螅螈螋融螗螟螠螣螨螫螬螭螯螱螳螵螺螽蟀蟆蟊蟋蟏蟑蟒蟛蟠蟥蟪蟫蟮蟹蟾蠃蠊蠋蠓蠕蠖蠡蠢蠲蠹蠼血衃衄衅行衍衎衒衔街衙衠衡衢衣补表衩衫衬衮衰衲衷衽衾衿袁袂袄袅袆袈袋袍袒袖袗袜袢袤袪被袭袯袱袷袼裁裂装裆裈裉裎裒裔裕裘裙裛裟裢裣裤裥裨裰裱裳裴裸裹裼裾褂褊褐褒褓褕褙褚褛褟褡褥褪褫褯褰褴褶襁襄襕襚襜襞襟襦襫襻西要覃覆见观觃规觅视觇览觉觊觋觌觎觏觐觑角觖觚觜觞觟解觥触觫觭觯觱觳觿言訄訇訚訾詈詟詹誉誊誓謇警譬计订讣认讥讦讧讨让讪讫训议讯记讱讲讳讴讵讶讷许讹论讻讼讽设访诀证诂诃评诅识诇诈诉诊诋诌词诎诏诐译诒诓诔试诖诗诘诙诚诛诜话诞诟诠诡询诣诤该详诧诨诩诫诬语诮误诰诱诲诳说诵请诸诹诺读诼诽课诿谀谁谂调谄谅谆谇谈谊谋谌谍谎谏谐谑谒谓谔谕谖谗谙谚谛谜谝谞谟谠谡谢谣谤谥谦谧谨谩谪谫谬谭谮谯谰谱谲谳谴谵谶谷谼谿豁豆豇豉豌豕豚象豢豨豪豫豮豳豸豹豺貂貅貆貉貊貌貔貘贝贞负贡财责贤败账货质贩贪贫贬购贮贯贰贱贲贳贴贵贶贷贸费贺贻贼贽贾贿赀赁赂赃资赅赆赇赈赉赊赋赌赍赎赏赐赑赒赓赔赕赖赗赘赙赚赛赜赝赞赟赠赡赢赣赤赦赧赪赫赭走赳赴赵赶起趁趄超越趋趑趔趟趣趯趱足趴趵趸趺趼趾趿跂跃跄跆跋跌跎跏跐跑跖跗跚跛距跞跟跣跤跨跪跬路跱跳践跶跷跸跹跺跻跽踅踉踊踌踏踒踔踝踞踟踢踣踦踩踪踬踮踯踱踵踶踹踺踽蹀蹁蹂蹄蹅蹇蹈蹉蹊蹋蹐蹑蹒蹙蹚蹜蹢蹦蹩蹬蹭蹯蹰蹲蹴蹶蹼蹽蹾蹿躁躅躇躏躐躔躜躞身躬躯躲躺车轧轨轩轪轫转轭轮软轰轱轲轳轴轵轶轷轸轹轺轻轼载轾轿辀辁辂较辄辅辆辇辈辉辊辋辌辍辎辏辐辑辒输辔辕辖辗辘辙辚辛辜辞辟辣辨辩辫辰辱边辽达辿迁迂迄迅过迈迎运近迓返迕还这进远违连迟迢迤迥迦迨迩迪迫迭迮述迳迷迸迹迺追退送适逃逄逅逆选逊逋逍透逐逑递途逖逗通逛逝逞速造逡逢逦逭逮逯逴逵逶逸逻逼逾遁遂遄遆遇遍遏遐遑遒道遗遘遛遢遣遥遨遭遮遴遵遹遽避邀邂邃邈邋邑邓邕邗邘邙邛邝邠邡邢那邦邨邪邬邮邯邰邱邲邳邴邵邶邸邹邺邻邽邾邿郁郃郄郅郇郈郊郎郏郐郑郓郗郚郛郜郝郡郢郤郦郧部郪郫郭郯郴郸都郾郿鄀鄂鄃鄄鄅鄌鄑鄗鄘鄙鄚鄜鄞鄠鄢鄣鄫鄯鄱鄹酂酃酅酆酉酊酋酌配酎酏酐酒酗酚酝酞酡酢酣酤酥酦酩酪酬酮酯酰酱酲酴酵酶酷酸酹酺酽酾酿醅醇醉醋醌醍醐醑醒醚醛醢醨醪醭醮醯醴醵醺醾采釉释里重野量釐金釜鉴銎銮鋆鋈錾鍪鎏鏊鏖鐾鑫钆钇针钉钊钋钌钍钎钏钐钒钓钔钕钖钗钘钙钚钛钜钝钞钟钠钡钢钣钤钥钦钧钨钩钪钫钬钭钮钯钰钱钲钳钴钵钷钹钺钻钼钽钾钿铀铁铂铃铄铅铆铈铉铊铋铌铍铎铏铐铑铒铕铖铗铘铙铚铛铜铝铞铟铠铡铢铣铤铥铧铨铩铪铫铬铭铮铯铰铱铲铳铴铵银铷铸铹铺铻铼铽链铿销锁锂锃锄锅锆锇锈锉锊锋锌锍锎锏锐锑锒锓锔锕锖锗锘错锚锛锜锝锞锟锡锢锣锤锥锦锧锨锩锪锫锬锭键锯锰锱锲锳锴锵锶锷锸锹锺锻锼锽锾锿镀镁镂镃镄镅镆镇镈镉镊镋镌镍镎镏镐镑镒镓镔镕镖镗镘镚镛镜镝镞镠镡镢镣镤镥镦镧镨镩镪镫镬镭镮镯镰镱镲镳镴镵镶长门闩闪闫闭问闯闰闱闲闳间闵闶闷闸闹闺闻闼闽闾闿阀阁阂阃阄阅阆阇阈阉阊阋阌阍阎阏阐阑阒阔阕阖阗阘阙阚阜队阡阪阮阱防阳阴阵阶阻阼阽阿陀陂附际陆陇陈陉陋陌降陎限陑陔陕陛陞陟陡院除陧陨险陪陬陲陴陵陶陷隃隅隆隈隋隍随隐隔隗隘隙障隧隩隰隳隶隹隺隼隽难雀雁雄雅集雇雉雊雌雍雎雏雒雕雠雨雩雪雯雱雳零雷雹雾需霁霄霅霆震霈霉霍霎霏霓霖霜霞霨霪霭霰露霸霹霾青靓靖静靛非靠靡面靥革靬靰靳靴靶靸靺靼靽靿鞁鞅鞋鞍鞑鞒鞔鞘鞠鞡鞣鞧鞨鞫鞬鞭鞮鞯鞲鞳鞴韂韦韧韨韩韪韫韬韭音韵韶页顶顷顸项顺须顼顽顾顿颀颁颂颃预颅领颇颈颉颊颋颌颍颎颏颐频颓颔颖颗题颙颚颛颜额颞颟颠颡颢颤颥颦颧风飏飐飑飒飓飔飕飗飘飙飞食飧飨餍餐餮饔饕饥饧饨饩饪饫饬饭饮饯饰饱饲饳饴饵饶饷饸饹饺饻饼饽饿馁馃馄馅馆馇馈馉馊馋馌馍馏馐馑馒馓馔馕首馗馘香馝馞馥馧馨马驭驮驯驰驱驲驳驴驵驶驷驸驹驺驻驼驽驾驿骀骁骂骃骄骅骆骇骈骉骊骋验骍骎骏骐骑骒骓骕骖骗骘骙骚骛骜骝骞骟骠骡骢骣骤骥骦骧骨骰骱骶骷骸骺骼髀髁髂髃髅髋髌髎髑髓高髡髢髦髫髭髯髹髻髽鬃鬈鬏鬒鬓鬘鬟鬣鬯鬲鬶鬷鬻鬼魁魂魃魄魅魆魇魈魉魋魍魏魑魔鱼鱽鱾鱿鲀鲁鲂鲃鲅鲆鲇鲈鲉鲊鲋鲌鲍鲎鲏鲐鲑鲒鲔鲕鲖鲗鲘鲙鲚鲛鲜鲝鲞鲟鲠鲡鲢鲣鲤鲥鲦鲧鲨鲩鲪鲫鲬鲭鲮鲯鲰鲱鲲鲳鲴鲵鲷鲸鲹鲺鲻鲼鲽鲾鲿鳀鳁鳂鳃鳄鳅鳇鳈鳉鳊鳌鳍鳎鳏鳐鳑鳒鳓鳔鳕鳖鳗鳘鳙鳚鳛鳜鳝鳞鳟鳠鳡鳢鳣鳤鸟鸠鸡鸢鸣鸤鸥鸦鸧鸨鸩鸪鸫鸬鸭鸮鸯鸰鸱鸲鸳鸵鸶鸷鸸鸹鸺鸻鸼鸽鸾鸿鹀鹁鹂鹃鹄鹅鹆鹇鹈鹉鹊鹋鹌鹍鹎鹏鹐鹑鹒鹔鹕鹖鹗鹘鹙鹚鹛鹜鹝鹞鹟鹠鹡鹢鹣鹤鹦鹧鹨鹩鹪鹫鹬鹭鹮鹯鹰鹱鹲鹳鹴鹾鹿麀麂麇麈麋麑麒麓麖麝麟麦麸麹麻麽麾黄黇黉黍黎黏黑黔默黛黜黝黟黠黡黢黥黧黩黪黯黹黻黼黾鼋鼍鼎鼐鼒鼓鼗鼙鼠鼢鼩鼫鼬鼯鼱鼷鼹鼻鼽鼾齁齇齉齐齑齿龀龁龂龃龄龅龆龇龈龉龊龋龌龙龚龛龟龠龢鿍鿎鿏㑇㑊㕮㘎㙍㙘㙦㛃㛚㛹㟃㠇㠓㤘㥄㧐㧑㧟㫰㬊㬎㬚㭎㭕㮾㰀㳇㳘㳚㴔㵐㶲㸆㸌㺄㻬㽏㿠䁖䂮䃅䃎䅟䌹䎃䎖䏝䏡䏲䐃䓖䓛䓨䓫䓬䗖䗛䗪䗴䜣䝙䢺䢼䣘䥽䦃䲟䲠䲢䴓䴔䴕䴖䴗䴘䴙䶮𠅤𠙶𠳐𡎚𡐓𣗋𣲗𣲘𣸣𤧛𤩽𤫉𥔲𥕢𥖨𥻗𦈡𦒍𦙶𦝼𦭜𦰡𧿹𨐈𨙸𨚕𨟠𨭉𨱇𨱏𨱑𨱔𨺙𩽾𩾃𩾌𪟝𪣻𪤗𪨰𪨶𪩘𪾢𫄧𫄨𫄷𫄸𫇭𫌀𫍣𫍯𫍲𫍽𫐄𫐐𫐓𫑡𫓧𫓯𫓶𫓹𫔍𫔎𫔶𫖮𫖯𫖳𫗧𫗴𫘜𫘝𫘦𫘧𫘨𫘪𫘬𫚕𫚖𫚭𫛭𫞩𫟅𫟦𫟹𫟼𫠆𫠊𫠜𫢸𫫇𫭟𫭢𫭼𫮃𫰛𫵷𫶇𫷷𫸩𬀩𬀪𬂩𬃊𬇕𬇙𬇹𬉼𬊈𬊤𬌗𬍛𬍡𬍤𬒈𬒔𬒗𬕂𬘓𬘘𬘡𬘩𬘫𬘬𬘭𬘯𬙂𬙊𬙋𬜬𬜯𬞟𬟁𬟽𬣙𬣞𬣡𬣳𬤇𬤊𬤝𬨂𬨎𬩽𬪩𬬩𬬭𬬮𬬱𬬸𬬹𬬻𬬿𬭁𬭊𬭎𬭚𬭛𬭤𬭩𬭬𬭯𬭳𬭶𬭸𬭼𬮱𬮿𬯀𬯎𬱖𬱟𬳵𬳶𬳽𬳿𬴂𬴃𬴊𬶋𬶍𬶏𬶐𬶟𬶠𬶨𬶭𬶮𬷕𬸘𬸚𬸣𬸦𬸪𬹼𬺈𬺓u   吶诶屌囧飚屄c                 C      i | ]}|d qS T .0rJ   rh   rh   S/home/kuhnn/.local/lib/python3.10/site-packages/TTS/tts/layers/xtts/zh_num2words.py
<dictcomp>~      rl   c                 C   rf   rg   rh   ri   rh   rh   rk   rl     rm   c                 C   rf   rg   rh   ri   rh   rh   rk   rl     rm   c                   @   s(   e Zd ZdZdd Zdd Zdd ZdS )	ChineseCharu   
    中文字符
    每个字符对应简体和繁体,
    e.g. 简体 = '负', 繁体 = '負'
    转换时可转换为简体或繁体
    c                 C      || _ || _d S N
simplifiedtraditional)selfrr   rs   rh   rh   rk   __init__     
zChineseChar.__init__c                 C   s   | j p| jpd S rp   rq   rt   rh   rh   rk   __str__     zChineseChar.__str__c                 C   s   |   S rp   )rx   rw   rh   rh   rk   __repr__  s   zChineseChar.__repr__N)__name__
__module____qualname____doc__ru   rx   rz   rh   rh   rh   rk   rn     s
    rn   c                       s>   e Zd ZdZ fddZdd Zeed dfdd	Z  Z	S )
ChineseNumberUnitu}   
    中文数字/数位字符
    每个字符除繁简体外还有一个额外的大写字符
    e.g. '陆' 和 '陸'
    c                    s(   t t| || || _|| _|| _d S rp   )superr   ru   powerbig_sbig_t)rt   r   rr   rs   r   r   	__class__rh   rk   ru     s   
zChineseNumberUnit.__init__c                 C   s   d | jS )Nz10^{})formatr   rw   rh   rh   rk   rx     s   zChineseNumberUnit.__str__   Fc                 C   s   |rt |d |d |d |d |d dS |td kr.t |d |d |d |d |d dS |td krIt |d d |d |d |d |d dS |td kret td|d |d |d |d |d dS tdt|)	Nr   r   )r   rr   rs   r   r               z.Counting type should be in {0} ({1} provided).)r   NUMBERING_TYPESpow
ValueErrorr   )clsindexvaluenumbering_type
small_unitrh   rh   rk   create  s"   "$zChineseNumberUnit.create)
r{   r|   r}   r~   ru   rx   classmethodr   r   __classcell__rh   rh   r   rk   r     s    r   c                       s6   e Zd ZdZd	 fdd	Zdd Zedd Z  ZS )
ChineseNumberDigitu   
    中文数字字符
    Nc                    s4   t t| || || _|| _|| _|| _|| _d S rp   )r   r   ru   r   r   r   alt_salt_t)rt   r   rr   rs   r   r   r   r   r   rh   rk   ru     s   
zChineseNumberDigit.__init__c                 C   
   t | jS rp   strr   rw   rh   rh   rk   rx        
zChineseNumberDigit.__str__c                 C   s    t ||d |d |d |d S )Nr   r   r   r   )r   )r   rP   r]   rh   rh   rk   r     s    zChineseNumberDigit.createNN)	r{   r|   r}   r~   ru   rx   r   r   r   rh   rh   r   rk   r     s    r   c                       s"   e Zd ZdZd fdd	Z  ZS )ChineseMathu   
    中文数位字符
    Nc                    s.   t t| || || _|| _|| _|| _d S rp   )r   r   ru   symbol
expressionr   r   )rt   rr   rs   r   r   r   rh   rk   ru     s
   
zChineseMath.__init__rp   )r{   r|   r}   r~   ru   r   rh   rh   r   rk   r     s    r   c                   @   s   e Zd ZdZdS )NumberSystemu   
    中文数字系统
    N)r{   r|   r}   r~   rh   rh   rh   rk   r     s    r   c                   @   s    e Zd ZdZdd Zdd ZdS )
MathSymbolu   
    用于中文数字系统的数学符号 (繁/简体), e.g.
    positive = ['正', '正']
    negative = ['负', '負']
    point = ['点', '點']
    c                 C      || _ || _|| _d S rp   )positivenegativepoint)rt   r   r   r   rh   rh   rk   ru        
zMathSymbol.__init__c                 c   s    | j  D ]}|V  qd S rp   )__dict__values)rt   r]   rh   rh   rk   __iter__  s   zMathSymbol.__iter__N)r{   r|   r}   r~   ru   r   rh   rh   rh   rk   r     s    r   r   c                    s  t tt} fddt|D }t tt}dd t|D }t tttt}dd t|D }t	t	|d _
|d _tt|d _
|d _td td |d _
|d _ttd td dd	d
 }ttd td ddd
 }ttd td ddd
 }	t }
|| |
_||
_t|||	|
_|
S )u  
    根据数字系统类型返回创建相应的数字系统，默认为 mid
    NUMBERING_TYPES = ['low', 'mid', 'high']: 中文数字系统类型
        low:  '兆' = '亿' * '十' = $10^{9}$,  '京' = '兆' * '十', etc.
        mid:  '兆' = '亿' * '万' = $10^{12}$, '京' = '兆' * '万', etc.
        high: '兆' = '亿' * '亿' = $10^{16}$, '京' = '兆' * '兆', etc.
    返回对应的数字系统
    c                    s    g | ]\}}t || d qS FCNUr   rj   rP   r]   r   rh   rk   
<listcomp>       z!create_system.<locals>.<listcomp>c                 S   s    g | ]\}}t j||d dqS )T)r   r   r   rh   rh   rk   r   "  r   c                 S   s   g | ]
\}}t ||qS rh   )CNDr   r   rh   rh   rk   r   %  s    r   r   r   r   c                 S   s   | S rp   rh   r_   rh   rh   rk   <lambda>+  s    zcreate_system.<locals>.<lambda>r   c                 S   s   |  S rp   rh   r   rh   rh   rk   r   ,  s    r   c                 S   s   t t| d t| S )Nr   )floatr   )r_   r`   rh   rh   rk   r   -  s    )zip(LARGER_CHINESE_NUMERING_UNITS_SIMPLIFIED)LARGER_CHINESE_NUMERING_UNITS_TRADITIONAL	enumerate)SMALLER_CHINESE_NUMERING_UNITS_SIMPLIFIED*SMALLER_CHINESE_NUMERING_UNITS_TRADITIONALCHINESE_DIGISBIG_CHINESE_DIGIS_SIMPLIFIEDBIG_CHINESE_DIGIS_TRADITIONALZERO_ALTr   r   ONE_ALTTWO_ALTSCMPOSITIVENEGATIVEPOINTr   unitsdigitsr   math)r   all_larger_unitslarger_unitsall_smaller_unitssmaller_unitschinese_digisr   positive_cnnegative_cnpoint_cnsystemrh   r   rk   create_system  s"   


r   c           
         sx   dd   fdd}dd }dd }t |}|| |\}}|||}t||}d	d
d |D }	|r:d||	S |S )Nc                 S   s   |j D ]}| |j|j|j|jfv r|  S q|jD ]}| |j|j|j|j|j|jfv r/|  S q|jD ]}| |j|jfv rA|  S q3d S rp   )	r   rs   rr   r   r   r   r   r   r   )charr   r\   rK   rT   rh   rh   rk   
get_symbol8  s   

 
zchn2num.<locals>.get_symbolc                    sf   | d}} j jj j jjfD ]}|| v r| |\}} nq fdd|D  fdd|D fS )Nr   c                    s   g | ]} |qS rh   rh   ri   )r   r   rh   rk   r   I      z3chn2num.<locals>.string2symbols.<locals>.<listcomp>)r   r   rr   rs   split)chinese_stringr   
int_string
dec_stringrW   r   r   rk   string2symbolsC  s   
(zchn2num.<locals>.string2symbolsc                 S   sP  | rt | d tr| d jdkr|jd g|  } t| dkr<t | d tr<t | d tr<| t| d jd dddd g }d}| D ]c}t |trQ|| d}nt |trct|jdddd}|d7 }|dkrm|| qB|dkrtt|D ]-}t || d  tr|| d  j|jk rt|| d  j|j dddd|| d < qwqB|S )ug   
        一百八 to 一百八十
        一亿一千三百万 to 一亿 一千万 三百万
        r   r   N)
isinstancer   r   r   lenr   appendrange)integer_symbolsr   result
unit_countrZ   current_unitrP   rh   rh   rk   correct_symbolsK  s.    


*,z chn2num.<locals>.correct_symbolsc                    s   dg}d}| D ]> t  tr j|d< qt  trE|d  td j9  <  j|kr@tt fdd|dd |dd<  j}|d qt	|S )u   
        Compute the value.
        When current unit is larger than previous unit, current unit * all previous units will be used as all previous units.
        e.g. '两千万' = 2000 * 10000 not 2000 + 10000
        r   r   
   c                    s   | t d j S )Nr   )r   r   )r]   rZ   rh   rk   r   y  s    z0chn2num.<locals>.compute_value.<locals>.<lambda>N)
r   r   r   r   r   r   listmapr   sum)r   r   
last_powerrh   r   rk   compute_valuek  s   


&
zchn2num.<locals>.compute_valuer   c                 S   s   g | ]}t |jqS rh   r   )rj   rK   rh   rh   rk   r     r   zchn2num.<locals>.<listcomp>z{0}.{1})r   r   joinr   )
r   r   r   r   r   r   int_partdec_partint_strdec_strrh   r   rk   chn2num7  s    
r   FTc	                    s  dfdd	t || d}	t|	dkr|	d }
d}nt|	dkr-|	d }
|	d }ntd	| |rAt|
dkrA|
}n	fd
d|
D }fdd|D }|r^|jjg| 7 }|rtdjd j	jd j
jd jjd j}t|D ]J\}}t|tr|jdkr|t|d k r||d  nd }|dkr||d  nd }t|trt|ttd fr|jdkr|d u s|jdkr|||< q||rd |r҈ d7  n d7  n|rd nd d fdd|D }|r|tjd  jd j	}|r|tjd  jd j	}ttD ]\}}||r%td |   S qt|dkrQ|d td td fv rQ|d td td td fv rQ|dd  }|S )NTc                    s   |  d  s	g S t dkr-|r%t| t kr%jd jt  gS jt  gS t fddtjD }| d |j  }||g  |j d   S )Nr   r   r   c                 3   s"    | ]}|j t k r|V  qd S rp   )r   r   )rj   r\   striped_stringrh   rk   	<genexpr>  s     z-num2chn.<locals>.get_value.<locals>.<genexpr>)lstripr   r   intnextreversedr   r   )value_string	use_zerosresult_unitresult_string)	get_valuer   r   rk   r    s   
"znum2chn.<locals>.get_valuer   r   r   r   r   z3invalid input num string with more than one dot: {}c                       g | ]	} j t| qS rh   r   r   ri   r   rh   rk   r         znum2chn.<locals>.<listcomp>c                    r  rh   r  ri   r   rh   rk   r     r  big_r[   rZ   rs   rr   c                    s   g | ]}t | qS rh   )getattr)rj   rZ   )	attr_namerh   rk   r     r   rg   )r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   typer   r   replacer  r   
startswithr   r   r   r   r   )number_stringr   bigrs   alt_zeroalt_onealt_twor   	use_unitsint_decr   r   result_symbolsdec_symbolsliangrP   r]   next_symbolprevious_symbolr   rW   rh   )r  r  r   rk   num2chn  s`   


0 

   r  c                   @   *   e Zd ZdZd	ddZdd Zdd ZdS )
Cardinalu   
    CARDINAL类
    Nc                 C   ro   rp   )cardinalchntext)rt   r  r  rh   rh   rk   ru     rv   zCardinal.__init__c                 C   r   rp   )r   r  rw   rh   rh   rk   chntext2cardinal  r   zCardinal.chntext2cardinalc                 C   r   rp   )r  r  rw   rh   rh   rk   cardinal2chntext  r   zCardinal.cardinal2chntextr   )r{   r|   r}   r~   ru   r  r  rh   rh   rh   rk   r    
    
r  c                   @   "   e Zd ZdZdddZdd ZdS )Digitu   
    DIGIT类
    Nc                 C   ro   rp   )digitr  )rt   r!  r  rh   rh   rk   ru     rv   zDigit.__init__c                 C   s   t | jdddS )NFr  r  )r  r!  rw   rh   rh   rk   digit2chntext  ry   zDigit.digit2chntextr   )r{   r|   r}   r~   ru   r#  rh   rh   rh   rk   r          
r   c                   @   s$   e Zd ZdZdddZd	ddZdS )
	TelePhoneu   
    TELEPHONE类
    Nc                 C   r   rp   )	telephoneraw_chntextr  )rt   r&  r'  r  rh   rh   rk   ru     r   zTelePhone.__init__Fc                 C   sx   |r| j d}ddd |D | _| jdd| _| jS | j d }ddd |D | _| jdd| _| jS )	Nr   z<SIL>c                 S      g | ]	}t |d d dqS Fr"  r  rj   partrh   rh   rk   r   $  r  z/TelePhone.telephone2chntext.<locals>.<listcomp>r   r   z<SP>c                 S   r(  r)  r*  r+  rh   rh   rk   r   (  r  )r&  r   r   r'  r	  r  strip)rt   fixed	sil_partssp_partsrh   rh   rk   telephone2chntext!  s   zTelePhone.telephone2chntext)NNNr   )r{   r|   r}   r~   ru   r1  rh   rh   rh   rk   r%    s    
r%  c                   @   r  )
Fractionu   
    FRACTION类
    Nc                 C   ro   rp   )fractionr  )rt   r3  r  rh   rh   rk   ru   2  rv   zFraction.__init__c                 C   $   | j d\}}t|d t| S )N   分之r   )r  r   r   )rt   denominator	numeratorrh   rh   rk   chntext2fraction6     zFraction.chntext2fractionc                 C   r4  )Nr   r5  )r3  r   r  )rt   r7  r6  rh   rh   rk   fraction2chntext:  r9  zFraction.fraction2chntextr   )r{   r|   r}   r~   ru   r8  r:  rh   rh   rh   rk   r2  -  s
    
r2  c                   @   r  )Dateu   
    DATE类
    Nc                 C   ro   rp   )dater  )rt   r<  r  rh   rh   rk   ru   D  rv   zDate.__init__c                 C   s   | j }z| dd\}}t|d d }W n ty%   |}d}Y nw |r]z| dd\}}t|d d }W n tyJ   |}d}Y nw |r\t|d d d |d  }nd}d}|| | }|| _| jS )Nu   年r   r!  r   u   月r  r   )	r<  r-  r   r   r#  r   r  r  r  )rt   r<  yearothermonthdayr  rh   rh   rk   date2chntext`  s0   zDate.date2chntextr   )r{   r|   r}   r~   ru   rC  rh   rh   rh   rk   r;  ?  s    
r;  c                   @   r  )Moneyu   
    MONEY类
    Nc                 C   ro   rp   )moneyr  )rt   rE  r  rh   rh   rk   ru   ~  rv   zMoney.__init__c                 C   sR   | j }td}||}|r#|D ]}||d t|d d }q|| _| jS )N(\d+(\.\d+)?)r   r>  )rE  recompilefindallr	  r  r  r  )rt   rE  patternmatchersmatcherrh   rh   rk   money2chntext  s   

 zMoney.money2chntextr   )r{   r|   r}   r~   ru   rM  rh   rh   rh   rk   rD  y  r$  rD  c                   @   r  )

Percentageu   
    PERCENTAGE类
    Nc                 C   ro   rp   )
percentager  )rt   rO  r  rh   rh   rk   ru     rv   zPercentage.__init__c                 C   s   t | j dd S Nu	   百分之r   )r   r  r-  rw   rh   rh   rk   chntext2percentage     zPercentage.chntext2percentagec                 C   s   dt | j d S rP  )r  rO  r-  rw   rh   rh   rk   percentage2chntext  rR  zPercentage.percentage2chntextr   )r{   r|   r}   r~   ru   rQ  rS  rh   rh   rh   rk   rN    r  rN  c                 C   s  d|  d }t d}||}|r'|D ]}||d t|d d d}qt dt d t d	 }||}|rP|D ]}||d t|d d
 d}q=t d}||}|rq|D ]}||d t	|d d
 d}q^t d}||}|r|D ]}||d t	|d dj
ddd}qt d}||}|r|D ]}||t|d d}q|dd}t d}||}|r|D ]}||d t|d d d}qt dt }||}|r|D ]}||d t|d d d}qt d}||}|r|D ]}||t|d d}q
t d}||}|r=|D ]}||d t|d d d}q)t d}||}|ra|D ]}||d |d d |d  d}qL|ddS )NrE   r   u@   \D+((([089]\d|(19|20)\d{2})年)?(\d{1,2}月(\d{1,2}[日号])?)?)r   )r<  r   u   \D+((\d+(\.\d+)?)[多余几]?z(\dz?)?))rE  z5\D((\+?86 ?)?1([38]\d|5[0-35-9]|7[678]|9[89])\d{8})\D)r&  z.\D((0(10|2[1-3]|[3-9]\d{2})-?)?[1-9]\d{6,7})\DT)r.  z	(\d+/\d+))r3  r   r   z(\d+(\.\d+)?%))rO  u   (\d+(\.\d+)?)[多余几]?r>  z
(\d{4,32})r=  rF  u   (([a-zA-Z]+)二([a-zA-Z]+))r   r   )rG  rH  rI  r	  r;  rC  CURRENCY_UNITSrD  rM  r%  r1  r2  r:  rN  rS  COM_QUANTIFIERSr  r  r   r#  r   rstrip)raw_texttextrJ  rK  rL  rh   rh   rk   normalize_nsw  sj   

"
"

"

&



"
"



$

&rY  c                 C   s   d}t d| rWt d|  }d}t| r(t|  }|d |d kr(d}|dkr?|| d|d   }| |d d } n|| d|d   }| |d d } t d| s||  } | S )uV   
    去除儿化音词中的儿:
    他女儿在那边儿 -> 他女儿在那边
    r   u   儿r   r   N)rG  searchspanER_WHITELIST_PATTERN)rX  new_strrH   remove_er_flagrI   rh   rh   rk   remove_erhua  s    
r_  c                 C   sh   |   }g }t|D ]$\}}|dkr)t||d  d r)t|d r)|d || q
d|S )Nr   r   r   r   r   )r   r   IN_EN_CHARSgetr   r   )rX  tokensnewrR   r[   rh   rh   rk   remove_space  s   $

rd  c                   @   sP   e Zd Z								ddedededededed	ed
efddZdd ZdS )TextNormFr   
to_banjiaoto_upperto_lowerremove_fillersr_  check_charsrd  cc_modec	           
      C   sR   || _ || _|| _|| _|| _|| _|| _d | _|r'ddlm	}	 |	|| _d S d S )Nr   )OpenCC)
rf  rg  rh  ri  r_  rj  rd  ccopenccrl  )
rt   rf  rg  rh  ri  r_  rj  rd  rk  rl  rh   rh   rk   ru   "  s   zTextNorm.__init__c                 C   s   | j r	| j |}| jr|t}| jr| }| jr| }| j	r-t
D ]}||d}q$| jr4t|}t|}|t}| jrZ|D ]}t|sYtd| d| tjd  dS qB| jrat|}|S )Nr   zWARNING: illegal char z in: file)rm  convertrf  	translateQJ2BJ_TRANSFORMrg  upperrh  lowerri  FILLER_CHARSr	  r_  rY  PUNCS_TRANSFORMrj  IN_VALID_CHARSra  printsysstderrrd  )rt   rX  rJ   rh   rh   rk   __call__;  s0   


zTextNorm.__call__N)FFFFFFFr   )r{   r|   r}   boolr   ru   r|  rh   rh   rh   rk   re  !  s6    	
re  __main__z--to_banjiao
store_truez!convert quanjiao chars to banjiao)actionhelpz
--to_upperzconvert to upper casez
--to_lowerzconvert to lower casez--remove_fillersu&   remove filler chars such as "呃, 啊"z--remove_erhuauH   remove erhua chars such as "他女儿在那边儿 -> 他女儿在那边"z--check_charsz'skip sentences containing illegal charsz--remove_spacezremove whitespacez	--cc_mode)r   t2ss2tz)convert between traditional to simplified)choicesdefaultr  z--log_intervali'  z)log interval in number of processed lines)r  r  r  z	--has_keyz,will be deprecated, set --format ark insteadz--format)txtarktsvr  zinput format)r  r  r  r  ifilez%input filename, assume utf-8 encoding)r  ofilezoutput filenamer  )rf  rg  rh  ri  r_  rj  rd  rk  utf8)encodingzw+r  	)	delimiterTEXTro  c                 C   s   g | ]}t | qS rh   )item)rj   rM   rh   rh   rk   r     s    r   ztext norm: z lines done.)rp  flush)r   r   )maxsplitr   z lines done in total.)qargparsecsvosrG  stringrz  r   r   r   $SMALLER_BIG_CHINESE_UNITS_SIMPLIFIED%SMALLER_BIG_CHINESE_UNITS_TRADITIONALr   r   r   r   r   r   r   r   r   r   rv  ER_WHITELISTrH  r\  r   CURRENCY_NAMESrT  rU  CN_PUNCS_STOPCN_PUNCS_NONSTOPCN_PUNCSpunctuationPUNCSr   	maketransr   rw  QJ2BJr   keysr   rs  CN_CHARS_COMMONCN_CHARS_EXTCN_CHARSIN_CH_CHARSascii_lettersr   EN_CHARSr`  VALID_CHARSrx  objectrn   r   r   r   CCr   r   r   r   r   r   r   r  r  r   r%  r2  r;  rD  rN  rY  r_  rd  re  r{   ArgumentParserrW   add_argumentr   
parse_argsargshas_keyr   rf  rg  rh  ri  rj  rk  
normalizerndoneopenr  istreamr  ostream
DictReaderreader
fieldnamesry  r  rX  log_intervalr{  rS   keyr-  r   colsrh   rh   rh   rk   <module>   s  

	
 !"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUV"a N&"$T
g:[>"0

&
( "(