Run 4. Outer Step 7. Inner Step 162.
Browse files- config.json +6 -8
 - inner_optimizer.pt +1 -1
 - model.safetensors +1 -1
 
    	
        config.json
    CHANGED
    
    | 
         @@ -268,20 +268,18 @@ 
     | 
|
| 268 | 
         
             
                "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
         
     | 
| 269 | 
         
             
              },
         
     | 
| 270 | 
         
             
              "block_list": [
         
     | 
| 271 | 
         
            -
                 
     | 
| 272 | 
         
            -
                 
     | 
| 273 | 
         
            -
                 
     | 
| 274 | 
         
            -
                 
     | 
| 275 | 
         
            -
                 
     | 
| 276 | 
         
            -
                5499168,
         
     | 
| 277 | 
         
            -
                5499171
         
     | 
| 278 | 
         
             
              ],
         
     | 
| 279 | 
         
             
              "block_size": 1024,
         
     | 
| 280 | 
         
             
              "bos_token_id": 50256,
         
     | 
| 281 | 
         
             
              "embd_pdrop": 0.1,
         
     | 
| 282 | 
         
             
              "eos_token_id": 50256,
         
     | 
| 283 | 
         
             
              "initializer_range": 0.02,
         
     | 
| 284 | 
         
            -
              "inner_step":  
     | 
| 285 | 
         
             
              "inner_steps": 0,
         
     | 
| 286 | 
         
             
              "last_allreduce_block": 5492224,
         
     | 
| 287 | 
         
             
              "layer_norm_epsilon": 1e-05,
         
     | 
| 
         | 
|
| 268 | 
         
             
                "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
         
     | 
| 269 | 
         
             
              },
         
     | 
| 270 | 
         
             
              "block_list": [
         
     | 
| 271 | 
         
            +
                5499173,
         
     | 
| 272 | 
         
            +
                5499176,
         
     | 
| 273 | 
         
            +
                5499177,
         
     | 
| 274 | 
         
            +
                5499180,
         
     | 
| 275 | 
         
            +
                5499180
         
     | 
| 
         | 
|
| 
         | 
|
| 276 | 
         
             
              ],
         
     | 
| 277 | 
         
             
              "block_size": 1024,
         
     | 
| 278 | 
         
             
              "bos_token_id": 50256,
         
     | 
| 279 | 
         
             
              "embd_pdrop": 0.1,
         
     | 
| 280 | 
         
             
              "eos_token_id": 50256,
         
     | 
| 281 | 
         
             
              "initializer_range": 0.02,
         
     | 
| 282 | 
         
            +
              "inner_step": 162,
         
     | 
| 283 | 
         
             
              "inner_steps": 0,
         
     | 
| 284 | 
         
             
              "last_allreduce_block": 5492224,
         
     | 
| 285 | 
         
             
              "layer_norm_epsilon": 1e-05,
         
     | 
    	
        inner_optimizer.pt
    CHANGED
    
    | 
         @@ -1,3 +1,3 @@ 
     | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            -
            oid sha256: 
     | 
| 3 | 
         
             
            size 8081782026
         
     | 
| 
         | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:2d5e6b67201fc7a82e6a10cf940e37c7060e31e1c3fcf1ab6d8c212d9a576a5c
         
     | 
| 3 | 
         
             
            size 8081782026
         
     | 
    	
        model.safetensors
    CHANGED
    
    | 
         @@ -1,3 +1,3 @@ 
     | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            -
            oid sha256: 
     | 
| 3 | 
         
             
            size 4040701744
         
     | 
| 
         | 
|
| 1 | 
         
             
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:10ca06147b7482803ba45d4d98819ac99ce0f3ac2dfd716c44a5887ca5e16a79
         
     | 
| 3 | 
         
             
            size 4040701744
         
     |