togethercomputer/m2-bert-80M-2k-retrieval

@@ -2,7 +2,7 @@
 license: apache-2.0
 language:
 - en
-pipeline_tag: text-classification
 inference: false
 ---
@@ -104,4 +104,4 @@ If you use this model, or otherwise found our work valuable, you can cite us as
   booktitle={Advances in Neural Information Processing Systems},
   year={2023}
 }
-```

 license: apache-2.0
 language:
 - en
+pipeline_tag: sentence-similarity
 inference: false
 ---
   booktitle={Advances in Neural Information Processing Systems},
   year={2023}
 }
+```

config.json CHANGED Viewed

@@ -30,7 +30,7 @@
     "long_conv_kernel_learning_rate": 0.001,
     "long_conv_l_max": 2048,
     "max_position_embeddings": 2048,
-    "model_type": "bert",
     "monarch_mlp_nblocks": 4,
     "num_attention_heads": 12,
     "num_hidden_layers": 12,

     "long_conv_kernel_learning_rate": 0.001,
     "long_conv_l_max": 2048,
     "max_position_embeddings": 2048,
+    "model_type": "m2_bert",
     "monarch_mlp_nblocks": 4,
     "num_attention_heads": 12,
     "num_hidden_layers": 12,