Update README.md
Browse files
README.md
CHANGED
@@ -24,11 +24,7 @@ The **gte-multilingual-base** model is the latest in the [GTE](https://huggingfa
|
|
24 |
- Embedding Dimension: 768
|
25 |
- Max Input Tokens: 8192
|
26 |
|
27 |
-
|
28 |
-
```
|
29 |
-
transformers>=4.39.2
|
30 |
-
flash_attn>=2.5.6
|
31 |
-
```
|
32 |
## Usage
|
33 |
|
34 |
Get Dense Embeddings with Transformers
|
@@ -104,4 +100,17 @@ hybird_scores = model.compute_scores(pairs, dense_weight=1.0, sparse_weight=0.3)
|
|
104 |
print('dense_scores', dense_scores)
|
105 |
print('sparse_scores', sparse_scores)
|
106 |
print('hybird_scores', hybird_scores)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
107 |
```
|
|
|
24 |
- Embedding Dimension: 768
|
25 |
- Max Input Tokens: 8192
|
26 |
|
27 |
+
|
|
|
|
|
|
|
|
|
28 |
## Usage
|
29 |
|
30 |
Get Dense Embeddings with Transformers
|
|
|
100 |
print('dense_scores', dense_scores)
|
101 |
print('sparse_scores', sparse_scores)
|
102 |
print('hybird_scores', hybird_scores)
|
103 |
+
```
|
104 |
+
|
105 |
+
## Citation
|
106 |
+
```
|
107 |
+
@misc{zhang2024mgtegeneralizedlongcontexttext,
|
108 |
+
title={mGTE: Generalized Long-Context Text Representation and Reranking Models for Multilingual Text Retrieval},
|
109 |
+
author={Xin Zhang and Yanzhao Zhang and Dingkun Long and Wen Xie and Ziqi Dai and Jialong Tang and Huan Lin and Baosong Yang and Pengjun Xie and Fei Huang and Meishan Zhang and Wenjie Li and Min Zhang},
|
110 |
+
year={2024},
|
111 |
+
eprint={2407.19669},
|
112 |
+
archivePrefix={arXiv},
|
113 |
+
primaryClass={cs.CL},
|
114 |
+
url={https://arxiv.org/abs/2407.19669},
|
115 |
+
}
|
116 |
```
|