Training in progress, step 500
Browse files
    	
        adapter_config.json
    ADDED
    
    | @@ -0,0 +1,27 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "alpha_pattern": {},
         | 
| 3 | 
            +
              "auto_mapping": null,
         | 
| 4 | 
            +
              "base_model_name_or_path": "google/mt5-Large",
         | 
| 5 | 
            +
              "bias": "none",
         | 
| 6 | 
            +
              "fan_in_fan_out": false,
         | 
| 7 | 
            +
              "inference_mode": true,
         | 
| 8 | 
            +
              "init_lora_weights": true,
         | 
| 9 | 
            +
              "layers_pattern": null,
         | 
| 10 | 
            +
              "layers_to_transform": null,
         | 
| 11 | 
            +
              "loftq_config": {},
         | 
| 12 | 
            +
              "lora_alpha": 8,
         | 
| 13 | 
            +
              "lora_dropout": 0.05,
         | 
| 14 | 
            +
              "megatron_config": null,
         | 
| 15 | 
            +
              "megatron_core": "megatron.core",
         | 
| 16 | 
            +
              "modules_to_save": null,
         | 
| 17 | 
            +
              "peft_type": "LORA",
         | 
| 18 | 
            +
              "r": 4,
         | 
| 19 | 
            +
              "rank_pattern": {},
         | 
| 20 | 
            +
              "revision": null,
         | 
| 21 | 
            +
              "target_modules": [
         | 
| 22 | 
            +
                "v",
         | 
| 23 | 
            +
                "q"
         | 
| 24 | 
            +
              ],
         | 
| 25 | 
            +
              "task_type": "SEQ_2_SEQ_LM",
         | 
| 26 | 
            +
              "use_rslora": false
         | 
| 27 | 
            +
            }
         | 
    	
        adapter_model.safetensors
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:d612a508fe5408d387f328fecaf0e2683202de123946f504285594638eeb31e0
         | 
| 3 | 
            +
            size 4758888
         | 
    	
        runs/Jan20_04-17-58_52591a348f32/events.out.tfevents.1705724279.52591a348f32.26.0
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:01036174d9863925a8c93d270e00064317b79306a6dc0ff31aae461a7b9647ad
         | 
| 3 | 
            +
            size 5305
         | 
    	
        training_args.bin
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:4aa04dae3537f94c70d15b18f8300cd37cb0be80a6bc061be602a4ac0bb3f833
         | 
| 3 | 
            +
            size 4475
         | 
