update
Browse files
- utils/symbol.py +1 -0
- vocab/__init__.py +1 -1
    	
        utils/symbol.py
    CHANGED
    
    | @@ -1,5 +1,6 @@ | |
| 1 | 
             
            """
         | 
| 2 | 
             
            special_symbols: https://github.com/google/sentencepiece/blob/master/doc/special_symbols.md
         | 
|  | |
| 3 | 
             
            """
         | 
| 4 |  | 
| 5 | 
             
            import sys
         | 
|  | |
| 1 | 
             
            """
         | 
| 2 | 
             
            special_symbols: https://github.com/google/sentencepiece/blob/master/doc/special_symbols.md
         | 
| 3 | 
            +
            emoji:
         | 
| 4 | 
             
            """
         | 
| 5 |  | 
| 6 | 
             
            import sys
         | 
    	
        vocab/__init__.py
    CHANGED
    
    | @@ -44,7 +44,7 @@ uniq_tokenizers = [ | |
| 44 |  | 
| 45 | 
             
            all_tokenizers = [
         | 
| 46 | 
             
                "gpt_35_turbo",
         | 
| 47 | 
            -
                " | 
| 48 | 
             
                "gpt2",
         | 
| 49 | 
             
                "gpt2_chinese",
         | 
| 50 | 
             
                "bert_base_cased",
         | 
|  | |
| 44 |  | 
| 45 | 
             
            all_tokenizers = [
         | 
| 46 | 
             
                "gpt_35_turbo",
         | 
| 47 | 
            +
                "gpt_4",
         | 
| 48 | 
             
                "gpt2",
         | 
| 49 | 
             
                "gpt2_chinese",
         | 
| 50 | 
             
                "bert_base_cased",
         |