Training in progress, step 100
Browse files
    	
        config.json
    CHANGED
    
    | 
         @@ -3,6 +3,7 @@ 
     | 
|
| 3 | 
         
             
              "architectures": [
         
     | 
| 4 | 
         
             
                "MistralForCausalLM"
         
     | 
| 5 | 
         
             
              ],
         
     | 
| 
         | 
|
| 6 | 
         
             
              "bos_token_id": 1,
         
     | 
| 7 | 
         
             
              "eos_token_id": 2,
         
     | 
| 8 | 
         
             
              "hidden_act": "silu",
         
     | 
| 
         @@ -19,7 +20,7 @@ 
     | 
|
| 19 | 
         
             
              "sliding_window": 4096,
         
     | 
| 20 | 
         
             
              "tie_word_embeddings": false,
         
     | 
| 21 | 
         
             
              "torch_dtype": "bfloat16",
         
     | 
| 22 | 
         
            -
              "transformers_version": "4. 
     | 
| 23 | 
         
             
              "use_cache": false,
         
     | 
| 24 | 
         
             
              "vocab_size": 32000
         
     | 
| 25 | 
         
             
            }
         
     | 
| 
         | 
|
| 3 | 
         
             
              "architectures": [
         
     | 
| 4 | 
         
             
                "MistralForCausalLM"
         
     | 
| 5 | 
         
             
              ],
         
     | 
| 6 | 
         
            +
              "attention_dropout": 0.0,
         
     | 
| 7 | 
         
             
              "bos_token_id": 1,
         
     | 
| 8 | 
         
             
              "eos_token_id": 2,
         
     | 
| 9 | 
         
             
              "hidden_act": "silu",
         
     | 
| 
         | 
|
| 20 | 
         
             
              "sliding_window": 4096,
         
     | 
| 21 | 
         
             
              "tie_word_embeddings": false,
         
     | 
| 22 | 
         
             
              "torch_dtype": "bfloat16",
         
     | 
| 23 | 
         
            +
              "transformers_version": "4.36.2",
         
     | 
| 24 | 
         
             
              "use_cache": false,
         
     | 
| 25 | 
         
             
              "vocab_size": 32000
         
     | 
| 26 | 
         
             
            }
         
     | 
    	
        runs/Jan09_01-04-39_ip-26-0-175-170/events.out.tfevents.1704762517.ip-26-0-175-170.1764083.0
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:ceb11f48d4f6d55d5d67146e62c0ce6fe2be6ef5e0350ca60c3c4c210b7b23bc
         
     | 
| 3 | 
         
            +
            size 12084
         
     | 
    	
        tokenizer_config.json
    CHANGED
    
    | 
         @@ -1,4 +1,6 @@ 
     | 
|
| 1 | 
         
             
            {
         
     | 
| 
         | 
|
| 
         | 
|
| 2 | 
         
             
              "added_tokens_decoder": {
         
     | 
| 3 | 
         
             
                "0": {
         
     | 
| 4 | 
         
             
                  "content": "<unk>",
         
     | 
| 
         @@ -37,5 +39,5 @@ 
     | 
|
| 37 | 
         
             
              "spaces_between_special_tokens": false,
         
     | 
| 38 | 
         
             
              "tokenizer_class": "LlamaTokenizer",
         
     | 
| 39 | 
         
             
              "unk_token": "<unk>",
         
     | 
| 40 | 
         
            -
              "use_default_system_prompt":  
     | 
| 41 | 
         
             
            }
         
     | 
| 
         | 
|
| 1 | 
         
             
            {
         
     | 
| 2 | 
         
            +
              "add_bos_token": true,
         
     | 
| 3 | 
         
            +
              "add_eos_token": false,
         
     | 
| 4 | 
         
             
              "added_tokens_decoder": {
         
     | 
| 5 | 
         
             
                "0": {
         
     | 
| 6 | 
         
             
                  "content": "<unk>",
         
     | 
| 
         | 
|
| 39 | 
         
             
              "spaces_between_special_tokens": false,
         
     | 
| 40 | 
         
             
              "tokenizer_class": "LlamaTokenizer",
         
     | 
| 41 | 
         
             
              "unk_token": "<unk>",
         
     | 
| 42 | 
         
            +
              "use_default_system_prompt": false
         
     | 
| 43 | 
         
             
            }
         
     | 
    	
        training_args.bin
    CHANGED
    
    | 
         @@ -1,3 +1,3 @@ 
     | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            -
            oid sha256: 
     | 
| 3 | 
         
            -
            size  
     | 
| 
         | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:f8223da2f2f0ee9475bd12cdfd5985b88e1af713b8c6fb49804c639b8f261335
         
     | 
| 3 | 
         
            +
            size 5944
         
     |