wav2vec2-1b-Y / vocab.json
Gummybear05's picture
Upload tokenizer
b66cb52 verified
raw
history blame
17.3 kB
{
"(": 1,
")": 2,
":": 3,
"?": 4,
"N": 5,
"P": 6,
"S": 7,
"[PAD]": 1227,
"[UNK]": 1226,
"|": 0,
"": 8,
"’": 9,
"가": 10,
"각": 11,
"간": 12,
"갈": 13,
"감": 14,
"갑": 15,
"값": 16,
"갓": 17,
"갔": 18,
"강": 19,
"갖": 20,
"같": 21,
"개": 22,
"객": 23,
"갠": 24,
"갯": 25,
"갱": 26,
"갸": 27,
"걀": 28,
"걔": 29,
"거": 30,
"걱": 31,
"건": 32,
"걷": 33,
"걸": 34,
"검": 35,
"겁": 36,
"것": 37,
"겉": 38,
"겊": 39,
"게": 40,
"겐": 41,
"겟": 42,
"겠": 43,
"겨": 44,
"격": 45,
"겪": 46,
"견": 47,
"결": 48,
"겸": 49,
"겹": 50,
"겼": 51,
"경": 52,
"곁": 53,
"계": 54,
"고": 55,
"곡": 56,
"곤": 57,
"곧": 58,
"골": 59,
"곰": 60,
"곱": 61,
"곳": 62,
"공": 63,
"곶": 64,
"과": 65,
"관": 66,
"광": 67,
"괜": 68,
"괭": 69,
"괴": 70,
"굉": 71,
"교": 72,
"구": 73,
"국": 74,
"군": 75,
"굳": 76,
"굴": 77,
"굵": 78,
"굶": 79,
"굽": 80,
"굿": 81,
"궁": 82,
"궂": 83,
"궈": 84,
"권": 85,
"귀": 86,
"귄": 87,
"규": 88,
"균": 89,
"귤": 90,
"그": 91,
"극": 92,
"근": 93,
"글": 94,
"긁": 95,
"금": 96,
"급": 97,
"긋": 98,
"긍": 99,
"기": 100,
"긴": 101,
"길": 102,
"김": 103,
"깁": 104,
"깃": 105,
"깄": 106,
"깅": 107,
"깊": 108,
"까": 109,
"깍": 110,
"깎": 111,
"깐": 112,
"깔": 113,
"깜": 114,
"깝": 115,
"깥": 116,
"깨": 117,
"깬": 118,
"깽": 119,
"꺼": 120,
"꺽": 121,
"껀": 122,
"껌": 123,
"껍": 124,
"껏": 125,
"껑": 126,
"께": 127,
"껴": 128,
"꼈": 129,
"꼬": 130,
"꼭": 131,
"꼰": 132,
"꼼": 133,
"꼽": 134,
"꽁": 135,
"꽂": 136,
"꽃": 137,
"꽝": 138,
"꽤": 139,
"꾀": 140,
"꾸": 141,
"꾹": 142,
"꾼": 143,
"꿀": 144,
"꿈": 145,
"꿉": 146,
"꿍": 147,
"꿔": 148,
"꿨": 149,
"뀌": 150,
"뀐": 151,
"뀔": 152,
"끄": 153,
"끈": 154,
"끊": 155,
"끌": 156,
"끓": 157,
"끔": 158,
"끗": 159,
"끝": 160,
"끼": 161,
"낀": 162,
"낄": 163,
"낌": 164,
"나": 165,
"낙": 166,
"난": 167,
"날": 168,
"남": 169,
"납": 170,
"낫": 171,
"났": 172,
"낭": 173,
"낮": 174,
"낯": 175,
"낳": 176,
"내": 177,
"낸": 178,
"낼": 179,
"냄": 180,
"냈": 181,
"냉": 182,
"냐": 183,
"냥": 184,
"너": 185,
"넉": 186,
"넌": 187,
"널": 188,
"넓": 189,
"넘": 190,
"넣": 191,
"네": 192,
"넷": 193,
"녀": 194,
"녁": 195,
"년": 196,
"념": 197,
"녔": 198,
"녕": 199,
"노": 200,
"녹": 201,
"논": 202,
"놀": 203,
"놈": 204,
"농": 205,
"높": 206,
"놓": 207,
"놔": 208,
"놨": 209,
"뇌": 210,
"뇨": 211,
"누": 212,
"눅": 213,
"눈": 214,
"눌": 215,
"눕": 216,
"눗": 217,
"눠": 218,
"눴": 219,
"뉘": 220,
"뉴": 221,
"늄": 222,
"느": 223,
"는": 224,
"늘": 225,
"늙": 226,
"능": 227,
"늦": 228,
"늪": 229,
"늬": 230,
"니": 231,
"닌": 232,
"닐": 233,
"님": 234,
"닙": 235,
"닝": 236,
"다": 237,
"닥": 238,
"닦": 239,
"단": 240,
"닫": 241,
"달": 242,
"닭": 243,
"닮": 244,
"담": 245,
"답": 246,
"닷": 247,
"당": 248,
"닿": 249,
"대": 250,
"댁": 251,
"댄": 252,
"댓": 253,
"댔": 254,
"댕": 255,
"더": 256,
"덕": 257,
"던": 258,
"덜": 259,
"덟": 260,
"덥": 261,
"덧": 262,
"덩": 263,
"덮": 264,
"데": 265,
"덴": 266,
"델": 267,
"도": 268,
"독": 269,
"돈": 270,
"돋": 271,
"돌": 272,
"돕": 273,
"돗": 274,
"동": 275,
"돼": 276,
"됐": 277,
"되": 278,
"된": 279,
"될": 280,
"됨": 281,
"됩": 282,
"두": 283,
"둑": 284,
"둔": 285,
"둘": 286,
"둠": 287,
"둥": 288,
"둬": 289,
"뒀": 290,
"뒤": 291,
"뒷": 292,
"뒹": 293,
"드": 294,
"득": 295,
"든": 296,
"듣": 297,
"들": 298,
"듬": 299,
"듯": 300,
"등": 301,
"듸": 302,
"디": 303,
"딘": 304,
"딜": 305,
"딤": 306,
"딨": 307,
"딩": 308,
"딪": 309,
"따": 310,
"딱": 311,
"딴": 312,
"딸": 313,
"땀": 314,
"땅": 315,
"때": 316,
"땐": 317,
"땜": 318,
"땠": 319,
"땡": 320,
"떠": 321,
"떡": 322,
"떤": 323,
"떨": 324,
"떴": 325,
"떻": 326,
"떼": 327,
"또": 328,
"똑": 329,
"똘": 330,
"똥": 331,
"뚜": 332,
"뚝": 333,
"뚫": 334,
"뚱": 335,
"뛰": 336,
"뜀": 337,
"뜨": 338,
"뜩": 339,
"뜬": 340,
"뜯": 341,
"뜰": 342,
"뜸": 343,
"뜻": 344,
"띄": 345,
"띕": 346,
"띠": 347,
"띵": 348,
"라": 349,
"락": 350,
"란": 351,
"랄": 352,
"람": 353,
"랍": 354,
"랐": 355,
"랑": 356,
"랗": 357,
"래": 358,
"랙": 359,
"랜": 360,
"램": 361,
"랩": 362,
"랫": 363,
"랬": 364,
"랭": 365,
"랴": 366,
"략": 367,
"량": 368,
"러": 369,
"럭": 370,
"런": 371,
"럴": 372,
"럼": 373,
"럽": 374,
"럿": 375,
"렀": 376,
"렁": 377,
"렇": 378,
"레": 379,
"렉": 380,
"렌": 381,
"렘": 382,
"려": 383,
"력": 384,
"련": 385,
"렬": 386,
"렴": 387,
"렵": 388,
"렷": 389,
"렸": 390,
"령": 391,
"례": 392,
"로": 393,
"록": 394,
"론": 395,
"롤": 396,
"롭": 397,
"롯": 398,
"롱": 399,
"뢰": 400,
"료": 401,
"루": 402,
"룩": 403,
"룰": 404,
"룸": 405,
"룹": 406,
"뤄": 407,
"뤘": 408,
"류": 409,
"륙": 410,
"륜": 411,
"률": 412,
"륨": 413,
"륭": 414,
"르": 415,
"른": 416,
"를": 417,
"름": 418,
"릅": 419,
"릇": 420,
"릉": 421,
"릎": 422,
"리": 423,
"릭": 424,
"린": 425,
"릴": 426,
"림": 427,
"립": 428,
"릿": 429,
"링": 430,
"마": 431,
"막": 432,
"만": 433,
"많": 434,
"말": 435,
"맑": 436,
"맘": 437,
"맙": 438,
"맛": 439,
"망": 440,
"맞": 441,
"맡": 442,
"매": 443,
"맥": 444,
"맨": 445,
"맵": 446,
"맷": 447,
"맹": 448,
"머": 449,
"먹": 450,
"먼": 451,
"멀": 452,
"멈": 453,
"멋": 454,
"멍": 455,
"메": 456,
"멘": 457,
"멜": 458,
"멤": 459,
"멧": 460,
"멩": 461,
"며": 462,
"면": 463,
"멸": 464,
"명": 465,
"몇": 466,
"모": 467,
"목": 468,
"몬": 469,
"몰": 470,
"몸": 471,
"몹": 472,
"못": 473,
"몽": 474,
"묘": 475,
"무": 476,
"묵": 477,
"묶": 478,
"문": 479,
"묻": 480,
"물": 481,
"묽": 482,
"뭉": 483,
"뭐": 484,
"뭔": 485,
"뭘": 486,
"뮤": 487,
"므": 488,
"미": 489,
"믹": 490,
"민": 491,
"믿": 492,
"밀": 493,
"밉": 494,
"밌": 495,
"밍": 496,
"밑": 497,
"바": 498,
"박": 499,
"밖": 500,
"반": 501,
"받": 502,
"발": 503,
"밝": 504,
"밟": 505,
"밤": 506,
"밥": 507,
"방": 508,
"밭": 509,
"배": 510,
"백": 511,
"밴": 512,
"밸": 513,
"뱀": 514,
"뱃": 515,
"버": 516,
"벅": 517,
"번": 518,
"벌": 519,
"범": 520,
"법": 521,
"벗": 522,
"베": 523,
"벤": 524,
"벨": 525,
"벳": 526,
"벼": 527,
"벽": 528,
"변": 529,
"별": 530,
"볍": 531,
"병": 532,
"볕": 533,
"보": 534,
"복": 535,
"볶": 536,
"본": 537,
"볼": 538,
"봄": 539,
"봅": 540,
"봇": 541,
"봉": 542,
"봐": 543,
"봤": 544,
"봬": 545,
"뵈": 546,
"부": 547,
"북": 548,
"분": 549,
"불": 550,
"붉": 551,
"붐": 552,
"붓": 553,
"붕": 554,
"붙": 555,
"뷔": 556,
"뷰": 557,
"브": 558,
"블": 559,
"비": 560,
"빅": 561,
"빈": 562,
"빌": 563,
"빔": 564,
"빕": 565,
"빗": 566,
"빙": 567,
"빛": 568,
"빠": 569,
"빡": 570,
"빨": 571,
"빴": 572,
"빵": 573,
"빼": 574,
"빽": 575,
"뺀": 576,
"뺄": 577,
"뺏": 578,
"뺐": 579,
"뺨": 580,
"뻐": 581,
"뻔": 582,
"뻗": 583,
"뻥": 584,
"뼈": 585,
"뼛": 586,
"뽀": 587,
"뽑": 588,
"뽕": 589,
"뾰": 590,
"뿌": 591,
"뿍": 592,
"뿐": 593,
"뿜": 594,
"쁘": 595,
"쁜": 596,
"쁠": 597,
"삐": 598,
"사": 599,
"삭": 600,
"산": 601,
"살": 602,
"삶": 603,
"삼": 604,
"샀": 605,
"상": 606,
"새": 607,
"색": 608,
"샐": 609,
"샘": 610,
"샛": 611,
"생": 612,
"샤": 613,
"샴": 614,
"샵": 615,
"샷": 616,
"섀": 617,
"서": 618,
"석": 619,
"섞": 620,
"선": 621,
"설": 622,
"섬": 623,
"섭": 624,
"섯": 625,
"섰": 626,
"성": 627,
"세": 628,
"센": 629,
"셀": 630,
"셈": 631,
"셋": 632,
"셔": 633,
"션": 634,
"셜": 635,
"셨": 636,
"셰": 637,
"소": 638,
"속": 639,
"손": 640,
"솔": 641,
"솜": 642,
"송": 643,
"쇄": 644,
"쇠": 645,
"쇼": 646,
"숄": 647,
"숍": 648,
"수": 649,
"숙": 650,
"순": 651,
"숟": 652,
"술": 653,
"숨": 654,
"숫": 655,
"숭": 656,
"숯": 657,
"숱": 658,
"쉐": 659,
"쉬": 660,
"쉴": 661,
"쉽": 662,
"슈": 663,
"슐": 664,
"슘": 665,
"스": 666,
"슥": 667,
"슨": 668,
"슬": 669,
"슴": 670,
"습": 671,
"슷": 672,
"승": 673,
"시": 674,
"식": 675,
"신": 676,
"싣": 677,
"실": 678,
"싫": 679,
"심": 680,
"십": 681,
"싱": 682,
"싶": 683,
"싸": 684,
"싹": 685,
"싼": 686,
"쌀": 687,
"쌈": 688,
"쌌": 689,
"쌓": 690,
"쌤": 691,
"쌩": 692,
"써": 693,
"썩": 694,
"썬": 695,
"썰": 696,
"썼": 697,
"쎄": 698,
"쏘": 699,
"쏙": 700,
"쏟": 701,
"쏠": 702,
"쐬": 703,
"쑤": 704,
"쑥": 705,
"쓰": 706,
"쓴": 707,
"쓸": 708,
"씀": 709,
"씁": 710,
"씨": 711,
"씩": 712,
"씬": 713,
"씹": 714,
"씻": 715,
"아": 716,
"악": 717,
"안": 718,
"앉": 719,
"않": 720,
"알": 721,
"앓": 722,
"암": 723,
"압": 724,
"앗": 725,
"았": 726,
"앙": 727,
"앞": 728,
"애": 729,
"액": 730,
"앤": 731,
"앨": 732,
"앱": 733,
"앵": 734,
"야": 735,
"약": 736,
"얀": 737,
"얄": 738,
"얇": 739,
"얌": 740,
"양": 741,
"얘": 742,
"어": 743,
"억": 744,
"언": 745,
"얹": 746,
"얻": 747,
"얼": 748,
"엄": 749,
"업": 750,
"없": 751,
"엇": 752,
"었": 753,
"엉": 754,
"엊": 755,
"엌": 756,
"엎": 757,
"에": 758,
"엑": 759,
"엔": 760,
"엘": 761,
"엠": 762,
"엣": 763,
"엥": 764,
"여": 765,
"역": 766,
"연": 767,
"열": 768,
"염": 769,
"엽": 770,
"엿": 771,
"였": 772,
"영": 773,
"옆": 774,
"예": 775,
"옛": 776,
"오": 777,
"옥": 778,
"온": 779,
"올": 780,
"옮": 781,
"옵": 782,
"옷": 783,
"옹": 784,
"와": 785,
"왁": 786,
"완": 787,
"왔": 788,
"왕": 789,
"왜": 790,
"왠": 791,
"외": 792,
"왼": 793,
"요": 794,
"욕": 795,
"용": 796,
"우": 797,
"욱": 798,
"운": 799,
"울": 800,
"움": 801,
"웃": 802,
"웅": 803,
"워": 804,
"웍": 805,
"원": 806,
"월": 807,
"웠": 808,
"웨": 809,
"웬": 810,
"웰": 811,
"웹": 812,
"위": 813,
"윗": 814,
"유": 815,
"육": 816,
"윤": 817,
"율": 818,
"윳": 819,
"융": 820,
"으": 821,
"은": 822,
"을": 823,
"읊": 824,
"음": 825,
"읍": 826,
"응": 827,
"의": 828,
"이": 829,
"익": 830,
"인": 831,
"일": 832,
"읽": 833,
"잃": 834,
"임": 835,
"입": 836,
"잇": 837,
"있": 838,
"잉": 839,
"잊": 840,
"잌": 841,
"잎": 842,
"자": 843,
"작": 844,
"잔": 845,
"잖": 846,
"잘": 847,
"잠": 848,
"잡": 849,
"잣": 850,
"잤": 851,
"장": 852,
"재": 853,
"잼": 854,
"쟁": 855,
"쟤": 856,
"저": 857,
"적": 858,
"전": 859,
"절": 860,
"젊": 861,
"점": 862,
"접": 863,
"젓": 864,
"정": 865,
"젖": 866,
"제": 867,
"젝": 868,
"젠": 869,
"져": 870,
"졌": 871,
"조": 872,
"족": 873,
"존": 874,
"졸": 875,
"좀": 876,
"좁": 877,
"종": 878,
"좋": 879,
"좌": 880,
"죄": 881,
"죠": 882,
"주": 883,
"죽": 884,
"준": 885,
"줄": 886,
"줌": 887,
"중": 888,
"줘": 889,
"줬": 890,
"쥐": 891,
"쥬": 892,
"즈": 893,
"즉": 894,
"즌": 895,
"즐": 896,
"즘": 897,
"즙": 898,
"증": 899,
"지": 900,
"직": 901,
"진": 902,
"질": 903,
"짐": 904,
"집": 905,
"짓": 906,
"징": 907,
"짚": 908,
"짜": 909,
"짝": 910,
"짧": 911,
"짬": 912,
"짰": 913,
"짱": 914,
"째": 915,
"쨌": 916,
"쨍": 917,
"쩌": 918,
"쩍": 919,
"쩐": 920,
"쩔": 921,
"쩜": 922,
"쩡": 923,
"쪄": 924,
"쪘": 925,
"쪼": 926,
"쪽": 927,
"쫀": 928,
"쫄": 929,
"쫌": 930,
"쫓": 931,
"쫙": 932,
"쬐": 933,
"쭈": 934,
"쭉": 935,
"쭤": 936,
"쯤": 937,
"찌": 938,
"찍": 939,
"찐": 940,
"찔": 941,
"찜": 942,
"찝": 943,
"찢": 944,
"차": 945,
"착": 946,
"찬": 947,
"찮": 948,
"찰": 949,
"참": 950,
"찹": 951,
"창": 952,
"찾": 953,
"채": 954,
"책": 955,
"챙": 956,
"챠": 957,
"처": 958,
"척": 959,
"천": 960,
"철": 961,
"첨": 962,
"첫": 963,
"청": 964,
"체": 965,
"쳇": 966,
"쳐": 967,
"쳤": 968,
"초": 969,
"촉": 970,
"촌": 971,
"촐": 972,
"총": 973,
"촬": 974,
"최": 975,
"추": 976,
"축": 977,
"춘": 978,
"출": 979,
"춤": 980,
"춥": 981,
"춧": 982,
"충": 983,
"춰": 984,
"췄": 985,
"취": 986,
"츄": 987,
"츠": 988,
"측": 989,
"층": 990,
"치": 991,
"칙": 992,
"친": 993,
"칠": 994,
"칡": 995,
"침": 996,
"칫": 997,
"칭": 998,
"카": 999,
"칵": 1000,
"칸": 1001,
"칼": 1002,
"캉": 1003,
"캐": 1004,
"캔": 1005,
"캠": 1006,
"캡": 1007,
"캬": 1008,
"커": 1009,
"컥": 1010,
"컨": 1011,
"컬": 1012,
"컴": 1013,
"컵": 1014,
"컷": 1015,
"컸": 1016,
"케": 1017,
"켓": 1018,
"켜": 1019,
"켰": 1020,
"코": 1021,
"콕": 1022,
"콘": 1023,
"콜": 1024,
"콤": 1025,
"콧": 1026,
"콩": 1027,
"쾌": 1028,
"쿄": 1029,
"쿠": 1030,
"쿡": 1031,
"쿨": 1032,
"쿵": 1033,
"쿽": 1034,
"퀴": 1035,
"큐": 1036,
"큘": 1037,
"크": 1038,
"큰": 1039,
"클": 1040,
"큼": 1041,
"키": 1042,
"킨": 1043,
"킬": 1044,
"킹": 1045,
"타": 1046,
"탁": 1047,
"탄": 1048,
"탈": 1049,
"탐": 1050,
"탑": 1051,
"탓": 1052,
"탔": 1053,
"탕": 1054,
"태": 1055,
"택": 1056,
"탭": 1057,
"탱": 1058,
"터": 1059,
"턱": 1060,
"턴": 1061,
"털": 1062,
"텀": 1063,
"텁": 1064,
"텃": 1065,
"텅": 1066,
"테": 1067,
"텍": 1068,
"텐": 1069,
"텔": 1070,
"템": 1071,
"텨": 1072,
"토": 1073,
"톡": 1074,
"톤": 1075,
"톨": 1076,
"톱": 1077,
"통": 1078,
"퇴": 1079,
"투": 1080,
"툰": 1081,
"툴": 1082,
"퉁": 1083,
"튀": 1084,
"튈": 1085,
"튜": 1086,
"트": 1087,
"특": 1088,
"튼": 1089,
"틀": 1090,
"틈": 1091,
"틔": 1092,
"티": 1093,
"틱": 1094,
"틴": 1095,
"틸": 1096,
"팀": 1097,
"팁": 1098,
"팅": 1099,
"파": 1100,
"팍": 1101,
"팎": 1102,
"판": 1103,
"팔": 1104,
"팟": 1105,
"팠": 1106,
"팡": 1107,
"패": 1108,
"팩": 1109,
"팬": 1110,
"팰": 1111,
"팸": 1112,
"팽": 1113,
"퍼": 1114,
"펄": 1115,
"펍": 1116,
"페": 1117,
"펙": 1118,
"펜": 1119,
"펭": 1120,
"펴": 1121,
"편": 1122,
"펼": 1123,
"폈": 1124,
"평": 1125,
"폐": 1126,
"포": 1127,
"폭": 1128,
"폰": 1129,
"폴": 1130,
"폼": 1131,
"표": 1132,
"푸": 1133,
"푹": 1134,
"푼": 1135,
"풀": 1136,
"품": 1137,
"풍": 1138,
"퓨": 1139,
"프": 1140,
"픈": 1141,
"플": 1142,
"픔": 1143,
"피": 1144,
"픽": 1145,
"핀": 1146,
"필": 1147,
"핏": 1148,
"핑": 1149,
"하": 1150,
"학": 1151,
"한": 1152,
"할": 1153,
"함": 1154,
"합": 1155,
"핫": 1156,
"항": 1157,
"해": 1158,
"핵": 1159,
"핸": 1160,
"햄": 1161,
"햇": 1162,
"했": 1163,
"행": 1164,
"향": 1165,
"허": 1166,
"헌": 1167,
"헐": 1168,
"험": 1169,
"헛": 1170,
"헝": 1171,
"헤": 1172,
"헬": 1173,
"헹": 1174,
"혀": 1175,
"혁": 1176,
"현": 1177,
"혈": 1178,
"협": 1179,
"혔": 1180,
"형": 1181,
"혜": 1182,
"호": 1183,
"혹": 1184,
"혼": 1185,
"홀": 1186,
"홈": 1187,
"홉": 1188,
"홍": 1189,
"화": 1190,
"확": 1191,
"환": 1192,
"활": 1193,
"황": 1194,
"회": 1195,
"획": 1196,
"횟": 1197,
"횡": 1198,
"효": 1199,
"후": 1200,
"훅": 1201,
"훈": 1202,
"훌": 1203,
"훑": 1204,
"훤": 1205,
"훨": 1206,
"훼": 1207,
"휘": 1208,
"휠": 1209,
"휩": 1210,
"휴": 1211,
"흐": 1212,
"흑": 1213,
"흔": 1214,
"흘": 1215,
"흙": 1216,
"흠": 1217,
"흡": 1218,
"흥": 1219,
"희": 1220,
"흰": 1221,
"히": 1222,
"힌": 1223,
"힐": 1224,
"힘": 1225
}