Merge branch 'main' of https://huggingface.co/togethercomputer/m2-bert-80M-2k-retrieval into main
Browse files
- README.md +2 -2
- config.json +1 -1
README.md
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
license: apache-2.0
|
| 3 |
language:
|
| 4 |
- en
|
| 5 |
-
pipeline_tag:
|
| 6 |
inference: false
|
| 7 |
---
|
| 8 |
|
|
@@ -104,4 +104,4 @@ If you use this model, or otherwise found our work valuable, you can cite us as
|
|
| 104 |
booktitle={Advances in Neural Information Processing Systems},
|
| 105 |
year={2023}
|
| 106 |
}
|
| 107 |
-
```
|
|
|
|
| 2 |
license: apache-2.0
|
| 3 |
language:
|
| 4 |
- en
|
| 5 |
+
pipeline_tag: sentence-similarity
|
| 6 |
inference: false
|
| 7 |
---
|
| 8 |
|
|
|
|
| 104 |
booktitle={Advances in Neural Information Processing Systems},
|
| 105 |
year={2023}
|
| 106 |
}
|
| 107 |
+
```
|
config.json
CHANGED
|
@@ -30,7 +30,7 @@
|
|
| 30 |
"long_conv_kernel_learning_rate": 0.001,
|
| 31 |
"long_conv_l_max": 2048,
|
| 32 |
"max_position_embeddings": 2048,
|
| 33 |
-
"model_type": "
|
| 34 |
"monarch_mlp_nblocks": 4,
|
| 35 |
"num_attention_heads": 12,
|
| 36 |
"num_hidden_layers": 12,
|
|
|
|
| 30 |
"long_conv_kernel_learning_rate": 0.001,
|
| 31 |
"long_conv_l_max": 2048,
|
| 32 |
"max_position_embeddings": 2048,
|
| 33 |
+
"model_type": "m2_bert",
|
| 34 |
"monarch_mlp_nblocks": 4,
|
| 35 |
"num_attention_heads": 12,
|
| 36 |
"num_hidden_layers": 12,
|