Upload unimernet_base.yaml
Browse files
    	
        models/MFR/unimernet_base/unimernet_base.yaml
    ADDED
    
    | 
         @@ -0,0 +1,46 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            model:
         
     | 
| 2 | 
         
            +
              arch: unimernet
         
     | 
| 3 | 
         
            +
              model_type: unimernet
         
     | 
| 4 | 
         
            +
              model_config:
         
     | 
| 5 | 
         
            +
                model_name: ./models/unimernet_base
         
     | 
| 6 | 
         
            +
                max_seq_len: 1536
         
     | 
| 7 | 
         
            +
             
     | 
| 8 | 
         
            +
              load_pretrained: True
         
     | 
| 9 | 
         
            +
              pretrained: './models/unimernet_base/pytorch_model.pth'
         
     | 
| 10 | 
         
            +
              tokenizer_config:
         
     | 
| 11 | 
         
            +
                path: ./models/unimernet_base
         
     | 
| 12 | 
         
            +
             
     | 
| 13 | 
         
            +
            datasets:
         
     | 
| 14 | 
         
            +
              formula_rec_eval:
         
     | 
| 15 | 
         
            +
                vis_processor:
         
     | 
| 16 | 
         
            +
                  eval:
         
     | 
| 17 | 
         
            +
                    name: "formula_image_eval"
         
     | 
| 18 | 
         
            +
                    image_size:
         
     | 
| 19 | 
         
            +
                      - 192
         
     | 
| 20 | 
         
            +
                      - 672
         
     | 
| 21 | 
         
            +
               
         
     | 
| 22 | 
         
            +
            run:
         
     | 
| 23 | 
         
            +
              runner: runner_iter
         
     | 
| 24 | 
         
            +
              task: unimernet_train
         
     | 
| 25 | 
         
            +
             
     | 
| 26 | 
         
            +
              batch_size_train: 64
         
     | 
| 27 | 
         
            +
              batch_size_eval: 64
         
     | 
| 28 | 
         
            +
              num_workers: 1
         
     | 
| 29 | 
         
            +
             
     | 
| 30 | 
         
            +
              iters_per_inner_epoch: 2000
         
     | 
| 31 | 
         
            +
              max_iters: 60000
         
     | 
| 32 | 
         
            +
             
     | 
| 33 | 
         
            +
              seed: 42
         
     | 
| 34 | 
         
            +
              output_dir: "../output/demo"
         
     | 
| 35 | 
         
            +
             
     | 
| 36 | 
         
            +
              evaluate: True
         
     | 
| 37 | 
         
            +
              test_splits: [ "eval" ]
         
     | 
| 38 | 
         
            +
             
     | 
| 39 | 
         
            +
              device: "cuda"
         
     | 
| 40 | 
         
            +
              world_size: 1
         
     | 
| 41 | 
         
            +
              dist_url: "env://"
         
     | 
| 42 | 
         
            +
              distributed: True
         
     | 
| 43 | 
         
            +
              distributed_type: ddp  # or fsdp when training an LLM
         
     | 
| 44 | 
         
            +
             
     | 
| 45 | 
         
            +
              generate_cfg:
         
     | 
| 46 | 
         
            +
                temperature: 0.0
         
     |