DL-Art-School/codes/data/audio/gpt_tts_tokenizer.json

1 line
258 KiB
JSON
Raw Normal View History

2021-12-23 21:32:33 +00:00
{"version":"1.0","truncation":null,"padding":null,"added_tokens":[{"id":0,"special":true,"content":"[STOP]","single_word":false,"lstrip":false,"rstrip":false,"normalized":false},{"id":1,"special":true,"content":"[UNK]","single_word":false,"lstrip":false,"rstrip":false,"normalized":false}],"normalizer":null,"pre_tokenizer":{"type":"Whitespace"},"post_processor":null,"decoder":null,"model":{"type":"BPE","dropout":null,"unk_token":"[UNK]","continuing_subword_prefix":"$$$","end_of_word_suffix":null,"fuse_unk":false,"vocab":{"[STOP]":0,"[UNK]":1,"!":2,"\"":3,"#":4,"$":5,"%":6,"&":7,"'":8,"(":9,")":10,"*":11,"+":12,",":13,"-":14,".":15,"/":16,"0":17,"1":18,"2":19,"3":20,"4":21,"5":22,"6":23,"7":24,"8":25,"9":26,":":27,";":28,"=":29,"?":30,"@":31,"[":32,"\\":33,"]":34,"^":35,"_":36,"a":37,"b":38,"c":39,"d":40,"e":41,"f":42,"g":43,"h":44,"i":45,"j":46,"k":47,"l":48,"m":49,"n":50,"o":51,"p":52,"q":53,"r":54,"s":55,"t":56,"u":57,"v":58,"w":59,"x":60,"y":61,"z":62,"{":63,"}":64,"ʼ":65,"—":66,"$$$h":67,"$$$a":68,"$$$r":69,"$$$c":70,"$$$o":71,"$$$k":72,"$$$e":73,"$$$s":74,"$$$n":75,"$$$t":76,"$$$l":77,"$$$d":78,"$$$i":79,"$$$m":80,"$$$p":81,"$$$q":82,"$$$u":83,"$$$y":84,"$$$z":85,"$$$w":86,"$$$j":87,"$$$v":88,"$$$b":89,"$$$f":90,"$$$g":91,"$$$0":92,"$$$4":93,"$$$8":94,"$$$6":95,"$$$x":96,"$$$9":97,"$$$2":98,"$$$1":99,"$$$3":100,"$$$,":101,"$$$5":102,"$$$7":103,"$$$?":104,"$$$]":105,"$$$.":106,"$$$_":107,"$$$*":108,"$$$-":109,"$$$'":110,"$$$!":111,"$$$\"":112,"$$$ʼ":113,"$$$^":114,"$$$=":115,"$$$:":116,"$$$)":117,"$$$;":118,"$$$+":119,"$$$/":120,"$$$[":121,"$$$(":122,"$$$—":123,"$$$}":124,"$$$\\":125,"$$$he":126,"the":127,"$$$in":128,"$$$er":129,"$$$ed":130,"$$$nd":131,"$$$ou":132,"$$$ing":133,"$$$at":134,"to":135,"$$$re":136,"and":137,"th":138,"$$$is":139,"$$$en":140,"$$$as":141,"$$$on":142,"$$$ar":143,"$$$or":144,"$$$an":145,"$$$es":146,"$$$ll":147,"of":148,"he":149,"in":150,"$$$it":151,"$$$om":152,"ha":153,"be":154,"$$$ow":155,"was":156,"$$$ut":157,"her":158,"$$$le":159,"it":160,"$$$ld":161,"$$$ot":162,"$$$ac":163,"on":164,"$$$id":165,"$$$gh":166,"st":167,"$$$et":168,"you":169,"his":170,"that":171,"$$$ic":172,"she":173,"$$$ly":174,"$$$st":175,"$$$im":176,"$$$ve":177,"$$$ay":178,"$$$al":179,"as":180,"wh":181,"$$$se":182,"re":183,"$$$ad":184,"$$$ver":185,"$$$ent":186,"$$$ir":187,"my":188,"$$$ght":189,"$$$ur":190,"$$$oo":191,"for":192,"$$$ith":193,"$$$ould":194,"with":195,"$$$ion":196,"me":197,"had":198,"an":199,"at":200,"li":201,"$$$ke":202,"$$$am":203,"sh":204,"but":205,"fr":206,"$$$all":207,"$$$her":208,"we":209,"se":210,"him":211,"do":212,"$$$ter":213,"$$$ro":214,"$$$ight":215,"$$$ked":216,"$$$pp":217,"$$$ain":218,"$$$ce":219,"not":220,"$$$ch":221,"ne":222,"$$$il":223,"so":224,"$$$ack":225,"''":226,"$$$ill":227,"is":228,"$$$ore":229,"$$$ant":230,"out":231,"$$$el":232,"they":233,"$$$ri":234,"$$$rou":235,"up":236,"$$$ct":237,"whe":238,"kn":239,"$$$out":240,"$$$ust":241,"from":242,"$$$ome":243,"$$$ard":244,"ch":245,"$$$us":246,"sa":247,"have":248,"this":249,"de":250,"$$$un":251,"$$$ra":252,"$$$ere":253,"le":254,"ab":255,"all":256,"$$$hing":257,"al":258,"what":259,"were":260,"$$$king":261,"no":262,"go":263,"$$$ind":264,"int":265,"$$$ge":266,"could":267,"$$$ie":268,"would":269,"su":270,"$$$est":271,"one":272,"$$$ess":273,"did":274,"$$$nt":275,"like":276,"$$$art":277,"con":278,"$$$one":279,"loo":280,"fe":281,"$$$hed":282,"back":283,"there":284,"$$$own":285,"$$$ers":286,"sp":287,"cl":288,"if":289,"$$$ss":290,"ex":291,"$$$ul":292,"$$$op":293,"$$$ab":294,"or":295,"into":296,"wor":297,"$$$and":298,"$$$ast":299,"when":300,"$$$ood":301,"$$$um":302,"$$$ide":303,"ag":304,"ro":305,"$$$ace":306,"$$$ck":307,"$$$ist":308,"$$$ally":309,"them":310,"just":311,"$$$ep":312,"bl":313,"tr":314,"$$$ation":315,"$$$ol":316,"about":317,"$$$ate":318,"hand":319,"$$$au":320,"over":321,"$$$ven":322,"$$$ong":323,"then":324,"see":325,"been":326,"$$$ake":327,"$$$way":328,"$$$ig":329,"$$$ap":330,"com":331,"te":332,"pl":333,"mo":334,"by":335,"tim":336,"$$$if":337,"any":338,"know":339,"$$$lf":340,"ey":341,"$$$ous":342,"some":343,"are":344,"sm":345,"said":346,"dow