Upload folder using huggingface_hub
Browse files- .ipynb_checkpoints/README-checkpoint.md +597 -0
- 1_Pooling/config.json +10 -0
- README.md +597 -0
- config.json +24 -0
- config_sentence_transformers.json +10 -0
- model.safetensors +3 -0
- modules.json +14 -0
- optimizer.pt +3 -0
- rng_state.pth +3 -0
- scheduler.pt +3 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +65 -0
- trainer_state.json +188 -0
- training_args.bin +3 -0
- vocab.txt +0 -0
.ipynb_checkpoints/README-checkpoint.md
ADDED
@@ -0,0 +1,597 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model: microsoft/mpnet-base
|
3 |
+
datasets:
|
4 |
+
- mteb/askubuntudupquestions-reranking
|
5 |
+
- mteb/mind_small
|
6 |
+
- mteb/scidocs-reranking
|
7 |
+
- mteb/stackoverflowdupquestions-reranking
|
8 |
+
- mteb/arguana
|
9 |
+
- mteb/climate-fever
|
10 |
+
- mteb/cqadupstack-android
|
11 |
+
- mteb/cqadupstack-english
|
12 |
+
- mteb/biosses-sts
|
13 |
+
- mteb/sickr-sts
|
14 |
+
- mteb/sts12-sts
|
15 |
+
- mteb/sts13-sts
|
16 |
+
language:
|
17 |
+
- en
|
18 |
+
library_name: sentence-transformers
|
19 |
+
pipeline_tag: sentence-similarity
|
20 |
+
tags:
|
21 |
+
- sentence-transformers
|
22 |
+
- sentence-similarity
|
23 |
+
- feature-extraction
|
24 |
+
- generated_from_trainer
|
25 |
+
- dataset_size:5130135
|
26 |
+
- loss:MultipleNegativesSymmetricRankingLoss
|
27 |
+
- loss:CoSENTLoss
|
28 |
+
- dataset_size:8233
|
29 |
+
widget:
|
30 |
+
- source_sentence: "This is a sample source sentence." # Ensure this is not empty
|
31 |
+
target_sentence: "This is a sample target sentence." # Ensure this is not empty
|
32 |
+
sentences:
|
33 |
+
- Broadband is a necessary evolution of internet technology that firms would be
|
34 |
+
wise to avail of if they wish to remain competitive. But it is this very desirability
|
35 |
+
that makes the provision of broadband a lucrative business in which many firms
|
36 |
+
participate. Business on a large scale is rarely organised in diffuse patterns,
|
37 |
+
but clustered in major population centres. Economic development can be furnished
|
38 |
+
by the private sector investing in broadband where there is a market. Growth will
|
39 |
+
not be slowed just because some farmers in Nebraska have slower internet. Singapore
|
40 |
+
is an aberrant example, as it is so small and its population so dense that it
|
41 |
+
would be impossible to compare its provision of broadband access to most other
|
42 |
+
countries.
|
43 |
+
- 'In retrospect, the decision to welcome the former Soviet states in the Baltic
|
44 |
+
into NATO appears foolish. They continue to have a prickly relationship with Russia,
|
45 |
+
which has some legitimate concerns about the treatment of large Russian minorities
|
46 |
+
in Latvia and Estonia, and about the siting of US nuclear defences. Their entry
|
47 |
+
into NATO was forced upon Russia, which naturally saw it as an aggressive move
|
48 |
+
designed to humiliate it, and marked the point when its pro-western policy shifted
|
49 |
+
to a more nationalist and confrontational approach. [1] It also weakened the unity
|
50 |
+
of NATO as there are quite legitimate doubts as to whether all the alliance’s
|
51 |
+
members would really go to war with Russia over the integrity of, say, Estonia.
|
52 |
+
Given this history, it would be madness to compound the problem by extending NATO
|
53 |
+
membership to Georgia and Ukraine. [1] Fraser, Malcolm, ‘Ukraine: there’s no
|
54 |
+
way out unless the west understands its past mistakes’, theguardian.com, 3 March
|
55 |
+
2014,'
|
56 |
+
- 'We need to be critical of the cumulative potential of the tax model proposed.
|
57 |
+
Firstly, the theory of the state’s capacity and how it functions in practice differ
|
58 |
+
substantially. The idea of taxation acting to enhance the productive capacity
|
59 |
+
of a nation is based on assumptions that the institutions, human resources, and
|
60 |
+
state-capacity, are already present. This is not always the case in Africa. Corruption
|
61 |
+
and bad governance are prevalent. Reforms in 1996 to curb corruption in the TRA
|
62 |
+
were reversed due to misunderstanding the nature of corruption amongst tax officials
|
63 |
+
and administration (Fjelstad, 2003). Tax-revenue performance remains comparatively
|
64 |
+
low [1] , there is little reason to simply altering what taxes there are will
|
65 |
+
change this. Finally, alternative methods can be used to assist rural infrastructure
|
66 |
+
projects, and enable national savings. For example, revising the role of agricultural
|
67 |
+
marketing boards [2] . [1] See further readings: Gray and Kahn, 2010. [2] See
|
68 |
+
further readings: Baffes, 2005.'
|
69 |
+
- source_sentence: advantages/disadvantages of installing from source code
|
70 |
+
sentences:
|
71 |
+
- 'is it there any advantage to unticking the `` source code '''' entry of a repository
|
72 |
+
? what is the advantage to build unity from source ffmpeg : installing from repository
|
73 |
+
or compiling from source ?'
|
74 |
+
- 'flash player issues flash player alternative for firefox flash videos go fullscreen
|
75 |
+
once ( firefox ) , then after minimising it and trying to go fullscreen again
|
76 |
+
it freezes ( ubuntu 14.04 , gnome desktop ) choppy flash video playback , ''settings
|
77 |
+
'' disabled for flash as well flash player is not working and do n''t know what
|
78 |
+
to do to fix it flash player : sound distorted error flash chrome in ubuntu 14.04'
|
79 |
+
- how to install newest version of minitube from source installing two version of
|
80 |
+
a software how to find source for a line in $ path ? how do i install network
|
81 |
+
driver source code to /lib/modules/ < kernel version > /build/drivers/net/ethernet
|
82 |
+
ca n't install vmware-view-client from partner repo in saucy why apt-get does
|
83 |
+
n't install the newest software what is the right way to reinstall from source
|
84 |
+
after package was installed via apt ? do i have to remove open drivers to switch
|
85 |
+
to fglrx ? how do i install clang version 3 in 10.10 ? adding extract tool to
|
86 |
+
nautilus ( compiled from source code ) how to point to boost built from source
|
87 |
+
how to remove httpd built from source if i build a package from source how can
|
88 |
+
i uninstall or remove completely ? avoid reinstall virtualbox and update to the
|
89 |
+
latest release installing only ruby 1.9 can i update software installed from source
|
90 |
+
code directly determine which package ( s ) were installed from a particular source
|
91 |
+
- source_sentence: will i be able to upgrade to 13.04 from 12.10 with a wubi installation
|
92 |
+
?
|
93 |
+
sentences:
|
94 |
+
- add cron job on startup from a script
|
95 |
+
- upgrading from 12.10 wubi install to 13.04 can i safely upgrade ubuntu 12.10 to
|
96 |
+
13.04 which installed using wubi ? will i be able to use wubi to install ubuntu
|
97 |
+
releases newer than 12.10 ? installing ubuntu in windows 8 with wubi
|
98 |
+
- upgrade from ubuntu server 12.10 to 13.04 wubi after upgrading windows 7 to windows
|
99 |
+
8 should i use wubi ubuntu 12.04 for my academic studies like writing docs , programming
|
100 |
+
, etc ? how to do a fresh re-installation of ubuntu safely on dual boot ? wubi
|
101 |
+
12.10 installation on windows 8 hangs do i keep my windows installation if i install
|
102 |
+
ubuntu with wubi , the windows installer ? move wubi installation of ubuntu to
|
103 |
+
a different partition in windows failed why was wubi removed from 13.04+ backup
|
104 |
+
, install and restore programms/settings of ubuntu ( wubi ) installation unable
|
105 |
+
to install ubuntu 12.10 with wubi in windows 7 - wubi is stuck upgrading my wubi
|
106 |
+
11.04 to 11.10 no additional driver no usb or dvd drive and not able to migrate
|
107 |
+
wubi ( no clue ) how can i remove windows and upgrade wubi install to a full install
|
108 |
+
without a cd or usb stick ? upgrade ubuntu to 13.04 from 12.10 on dual-boot laptop
|
109 |
+
upgrading ubuntu 12.10 to 13.04 using bootable usb alongside windows 7
|
110 |
+
- source_sentence: how do i use ubuntu 's web application integration ?
|
111 |
+
sentences:
|
112 |
+
- out of the box ubuntu 13.04 with chromium does not automatically use web apps
|
113 |
+
- why i do not have gnome shell with gnome 3 ? no gnome shell after install on ubuntu
|
114 |
+
12.04 inside vmware workstation
|
115 |
+
- how do i put a web application on the launcher ? how can i force ubuntu to use
|
116 |
+
font a instead font b in all applications and web pages ? how to remove the web
|
117 |
+
app shortcut created by chromium ? is there any finished tutorial on how to develop
|
118 |
+
and package unity web apps ? how do i put web applications in my unity launcher
|
119 |
+
? how to ftp transfer files to /var/www ? i would like to set up a ubuntu os on
|
120 |
+
amazon web server , how do i do this is there a way to request support for web
|
121 |
+
applications not currently supported ? how to test web applications for mobile
|
122 |
+
devices on ubuntu ? can i use unity web apps in ubuntu 13.10 ? how to create chrome/chromium
|
123 |
+
web application desktop shortcut ? icedtea-web 1.5 needs confirmation to run trusted
|
124 |
+
applet xul + unity web api hp pavilion dv2000 web camera driver how to open applications
|
125 |
+
after booting a purely command line interface ? trouble connecting to wireless
|
126 |
+
via clear hub express are web apps still part of ubuntu 's future ? newer versions
|
127 |
+
of chromium ? powerpc macs and 12.04 lts application support
|
128 |
+
- source_sentence: 'This form of necrosis, also termed necroptosis, requires the activity
|
129 |
+
of receptor-interacting protein kinase 1 (RIP1) and its related kinase, RIP3 '
|
130 |
+
sentences:
|
131 |
+
- This large-scale study showed that IDH1/IDH2 mutations were mutually exclusive
|
132 |
+
with inactivating TET2 mutations, suggesting that the two types of mutations had
|
133 |
+
similar effects and were thus functionally redundant.
|
134 |
+
- Co-transfection of miRVec-miR-204 and the Renilla-3′ UTR plasmid was in HEK293T
|
135 |
+
cells with TransIT-LT1 Transfection Reagent (Mirus)
|
136 |
+
- TNF-mediated programmed necrosis typically involves the receptor-interacting serine-threonine
|
137 |
+
kinases 1 and 3 (RIP1 and RIP3), as evidenced in human, mouse, and zebrafish cell
|
138 |
+
lines, as well as in a murine sepsis model
|
139 |
+
---
|
140 |
+
|
141 |
+
# SentenceTransformer based on microsoft/mpnet-base
|
142 |
+
|
143 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [microsoft/mpnet-base](https://huggingface.co/microsoft/mpnet-base) on the [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking), [retrival_1](https://huggingface.co/datasets/mteb/arguana) and [sts_1](https://huggingface.co/datasets/mteb/biosses-sts) datasets. It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
144 |
+
|
145 |
+
## Model Details
|
146 |
+
|
147 |
+
### Model Description
|
148 |
+
- **Model Type:** Sentence Transformer
|
149 |
+
- **Base model:** [microsoft/mpnet-base](https://huggingface.co/microsoft/mpnet-base) <!-- at revision 6996ce1e91bd2a9c7d7f61daec37463394f73f09 -->
|
150 |
+
- **Maximum Sequence Length:** 512 tokens
|
151 |
+
- **Output Dimensionality:** 768 dimensions
|
152 |
+
- **Similarity Function:** Cosine Similarity
|
153 |
+
- **Training Datasets:**
|
154 |
+
- [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking)
|
155 |
+
- [retrival_1](https://huggingface.co/datasets/mteb/arguana)
|
156 |
+
- [sts_1](https://huggingface.co/datasets/mteb/biosses-sts)
|
157 |
+
- **Language:** en
|
158 |
+
<!-- - **License:** Unknown -->
|
159 |
+
|
160 |
+
### Model Sources
|
161 |
+
|
162 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
163 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
164 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
165 |
+
|
166 |
+
### Full Model Architecture
|
167 |
+
|
168 |
+
```
|
169 |
+
SentenceTransformer(
|
170 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False}) with Transformer model: MPNetModel
|
171 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
172 |
+
)
|
173 |
+
```
|
174 |
+
|
175 |
+
## Usage
|
176 |
+
|
177 |
+
### Direct Usage (Sentence Transformers)
|
178 |
+
|
179 |
+
First install the Sentence Transformers library:
|
180 |
+
|
181 |
+
```bash
|
182 |
+
pip install -U sentence-transformers
|
183 |
+
```
|
184 |
+
|
185 |
+
Then you can load this model and run inference.
|
186 |
+
```python
|
187 |
+
from sentence_transformers import SentenceTransformer
|
188 |
+
|
189 |
+
# Download from the 🤗 Hub
|
190 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
191 |
+
# Run inference
|
192 |
+
sentences = [
|
193 |
+
'This form of necrosis, also termed necroptosis, requires the activity of receptor-interacting protein kinase 1 (RIP1) and its related kinase, RIP3 ',
|
194 |
+
'TNF-mediated programmed necrosis typically involves the receptor-interacting serine-threonine kinases 1 and 3 (RIP1 and RIP3), as evidenced in human, mouse, and zebrafish cell lines, as well as in a murine sepsis model',
|
195 |
+
'This large-scale study showed that IDH1/IDH2 mutations were mutually exclusive with inactivating TET2 mutations, suggesting that the two types of mutations had similar effects and were thus functionally redundant.',
|
196 |
+
]
|
197 |
+
embeddings = model.encode(sentences)
|
198 |
+
print(embeddings.shape)
|
199 |
+
# [3, 768]
|
200 |
+
|
201 |
+
# Get the similarity scores for the embeddings
|
202 |
+
similarities = model.similarity(embeddings, embeddings)
|
203 |
+
print(similarities.shape)
|
204 |
+
# [3, 3]
|
205 |
+
```
|
206 |
+
|
207 |
+
<!--
|
208 |
+
### Direct Usage (Transformers)
|
209 |
+
|
210 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
211 |
+
|
212 |
+
</details>
|
213 |
+
-->
|
214 |
+
|
215 |
+
<!--
|
216 |
+
### Downstream Usage (Sentence Transformers)
|
217 |
+
|
218 |
+
You can finetune this model on your own dataset.
|
219 |
+
|
220 |
+
<details><summary>Click to expand</summary>
|
221 |
+
|
222 |
+
</details>
|
223 |
+
-->
|
224 |
+
|
225 |
+
<!--
|
226 |
+
### Out-of-Scope Use
|
227 |
+
|
228 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
229 |
+
-->
|
230 |
+
|
231 |
+
<!--
|
232 |
+
## Bias, Risks and Limitations
|
233 |
+
|
234 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
235 |
+
-->
|
236 |
+
|
237 |
+
<!--
|
238 |
+
### Recommendations
|
239 |
+
|
240 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
241 |
+
-->
|
242 |
+
|
243 |
+
## Training Details
|
244 |
+
|
245 |
+
### Training Datasets
|
246 |
+
|
247 |
+
#### reranking_1
|
248 |
+
|
249 |
+
* Dataset: [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking) at [4d853f9](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking/tree/4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c)
|
250 |
+
* Size: 337 training samples
|
251 |
+
* Columns: <code>anchor</code>, <code>positive</code>, and <code>negative</code>
|
252 |
+
* Approximate statistics based on the first 337 samples:
|
253 |
+
| | anchor | positive | negative |
|
254 |
+
|:--------|:----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|
|
255 |
+
| type | string | string | string |
|
256 |
+
| details | <ul><li>min: 4 tokens</li><li>mean: 14.94 tokens</li><li>max: 39 tokens</li></ul> | <ul><li>min: 5 tokens</li><li>mean: 84.1 tokens</li><li>max: 407 tokens</li></ul> | <ul><li>min: 2 tokens</li><li>mean: 188.2 tokens</li><li>max: 391 tokens</li></ul> |
|
257 |
+
* Samples:
|
258 |
+
| anchor | positive | negative |
|
259 |
+
|:------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
260 |
+
| <code>black screen after installation with wubi</code> | <code>will installing ubuntu harm my computer ? wubi boot problem ca n't install on an emachines e725 black screen after purple ubuntu screen error , then black screen after wubi 11.10 goes into purple screen with black squares trying to login ( using wubi ) system hangs after wubi install screen turns off on boot dark purple screen with graphic corruption at boot , using wubi can i install 32 bit ubuntu on dual boot with 64 bit windows 7 ? black screen during installation ubuntu 12.10 via wubi on hp pavillion g6-1273s1 ubuntu wont boot after installing wubi from windows 7 windows 8 dual boot problem dual boot , ubuntu wo n't boot ! second wubi installation not working ubuntu after boot shows a black screen with a warning reboot required</code> | <code>how to fix black screen after boot purple then black screen after booting ? black screen after the grub screen ca n't boot after update , purple/black screen</code> |
|
261 |
+
| <code>wubi gives error 'nonetype ' object has no attribute 'get_info '</code> | <code>nonetype object has no attribute get_info ubuntu 14.04 can not install ubuntu 13.04 using wubi why does wubi installation fail with `` error : 'none type ' object has no attribute 'get_info ' '' ? error - 'nonetype ' object has no attribute 'get_info ' during xubuntu installation ca n't install 12.04 inside windows 7 using wubi error while installing ubuntu as separate os on my pc ? wubi 's error while installin ubuntu 12.10 on windows 7 why is wubi giving me an error message when i try to install ? ubuntu 12.10 install fails , both native and wubi asus eeepc 1015cx ubuntu 32 bits or 64bits ?</code> | <code>attributeerror : 'module ' object has no attribute openshot does n't launch with `` failed to import '' message software center not working ubuntu one not syncing ... in windows xp sp3 ubuntu one for windows client : `` attributeerror '' messages ubuntu one sign in error ( after installation completed ) : `` nonetype '' object has no attribute `` make file '' `` attributeerror : 'nonetype ' object has no attribute 'group ' '' when trying to use youtube-dl ' '' windows backend object has no attribute 'iso-path ' - see log for details . ' error when trying to install how can i resolve a 'windows backend : object has no attribute iso_path ' error while installing with wubi ? 'module ' object has no attribute 'py2 '</code> |
|
262 |
+
| <code>give permission to /var/www</code> | <code>write permissions in /var/www folder folders and files permission problem user ca n't ftp to a directory but is part of the group that owns it how to give read write permission to a folder and its sub folders and files ? give apache permission to write to /home/*/www/ directories give www-data write permission to /home ? assining permission to www folder problems with the /var/www folder trouble accessing www folders - permission or ownership ? group access to directory i am part of a group , but i can not create files apache 'you do n't have permission to access / on this server '</code> | <code>missing /var/www lubuntu 13.04 change permission from -rwxrwxr-x to drwxrwxr-x wordpress upload permission on nginx & ubuntu how do i restore the default permission on a directory/folder ? file permission in www/html directory for security problem while installing visual paradigm uml tool ? setting up home folders for users for 12.04 server edition -ls : can not open directory . : permission denied changed apache www folder</code> |
|
263 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
264 |
+
```json
|
265 |
+
{
|
266 |
+
"scale": 20.0,
|
267 |
+
"similarity_fct": "cos_sim"
|
268 |
+
}
|
269 |
+
```
|
270 |
+
|
271 |
+
#### retrival_1
|
272 |
+
|
273 |
+
* Dataset: [retrival_1](https://huggingface.co/datasets/mteb/arguana) at [c22ab2a](https://huggingface.co/datasets/mteb/arguana/tree/c22ab2a51041ffd869aaddef7af8d8215647e41a)
|
274 |
+
* Size: 7,806 training samples
|
275 |
+
* Columns: <code>title</code> and <code>text</code>
|
276 |
+
* Approximate statistics based on the first 1000 samples:
|
277 |
+
| | title | text |
|
278 |
+
|:--------|:---------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
279 |
+
| type | string | string |
|
280 |
+
| details | <ul><li>min: 2 tokens</li><li>mean: 5.42 tokens</li><li>max: 17 tokens</li></ul> | <ul><li>min: 41 tokens</li><li>mean: 199.3 tokens</li><li>max: 512 tokens</li></ul> |
|
281 |
+
* Samples:
|
282 |
+
| title | text |
|
283 |
+
|:--------------|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
284 |
+
| <code></code> | <code>Not having children is environmentally friendly The more people consume in the world, the greater the environmental damage. An average American produces 52 tons of garbage by the age of 75.* However, producing extra litter and pollution is not the only hazard that every child poses to the planet. Increasing world’s population also places incredible stress on Earth’s resources. It is estimated, for instance, that by 2025 three billion people will live in water-scarce countries. By reducing the number of human beings we will manage to avoid numerous overpopulation crises and reverse the damage done to the environment. * Tufts Climate Initiative., 2006,</code> |
|
285 |
+
| <code></code> | <code>The need for interaction is all the more reason to ensure that all ideas are in the marketplace. This way, the veracity of all ideas are questioned. For example, if someone brings bigoted ideas with them as a freshman, perhaps because these ideas were prevalent in the community they grew up in, if they cannot express these ideas and be challenged they may never attempt to integrate. Instead, they will gravitate to those who share their ideas and remain isolated.</code> |
|
286 |
+
| <code></code> | <code>Putting the power to censor the internet, no matter how stringent or specific the guidelines, into the hands of a private organization is misguided. It is the state not individual ISPs who are needed to assess how dangerous a site is, whether it is actually promoting extremism, and ultimately make a decision as to whether a site needs to be blocked. The ISPs may end up being the actors that implement the policy but it has to be government that decides which websites to block and why. This also means that the decision would be much more centralised. Leaving this decision to the discretion of individual ISPs will mean that some websites will be blocked on some ISPs and not on others. Only government can ensure that there is consistency.</code> |
|
287 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
288 |
+
```json
|
289 |
+
{
|
290 |
+
"scale": 20.0,
|
291 |
+
"similarity_fct": "cos_sim"
|
292 |
+
}
|
293 |
+
```
|
294 |
+
|
295 |
+
#### sts_1
|
296 |
+
|
297 |
+
* Dataset: [sts_1](https://huggingface.co/datasets/mteb/biosses-sts) at [9ee918f](https://huggingface.co/datasets/mteb/biosses-sts/tree/9ee918f184421b6bd48b78f6c714d86546106103)
|
298 |
+
* Size: 90 training samples
|
299 |
+
* Columns: <code>sentence1</code>, <code>sentence2</code>, and <code>score</code>
|
300 |
+
* Approximate statistics based on the first 90 samples:
|
301 |
+
| | sentence1 | sentence2 | score |
|
302 |
+
|:--------|:-----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
303 |
+
| type | string | string | float |
|
304 |
+
| details | <ul><li>min: 13 tokens</li><li>mean: 39.44 tokens</li><li>max: 88 tokens</li></ul> | <ul><li>min: 12 tokens</li><li>mean: 38.43 tokens</li><li>max: 95 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 2.24</li><li>max: 4.0</li></ul> |
|
305 |
+
* Samples:
|
306 |
+
| sentence1 | sentence2 | score |
|
307 |
+
|:-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
308 |
+
| <code>As p16INK4a blocks the inactivation of pRb by cyclin-dependent kinases, and Arf blocks the inactivation of p53 by Mdm2-mediated proteolysis, both have the capacity to cause cell cycle arrest.</code> | <code>By inducing Arf and Ink4a in primary rodent fibroblasts, oncogenic Ras expression leads to growth arrest and premature senescence.</code> | <code>2.4</code> |
|
309 |
+
| <code>Several lines of evidence suggest that the known principal RB pathway lesions in human tumors act in a mutual exclusive manner.</code> | <code>In individual human tumor specimens, these principal components of the pathway—RB-CDK4/6-p16INK4A—are reported to be targeted in a mutually exclusive manner.</code> | <code>3.4</code> |
|
310 |
+
| <code>T47D, MCF-7, Skbr3, HeLa, and Caco-2 cells were transfected by electroporation as described previously.</code> | <code> MCF7 or HeLa cells were electroporated as described previously to more than 95% efficiency with pSuper constructs against the various targets, and 72 hr later, protein expression was analyzed by SDS-PAGE and Western blotting.</code> | <code>3.0</code> |
|
311 |
+
* Loss: [<code>CoSENTLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosentloss) with these parameters:
|
312 |
+
```json
|
313 |
+
{
|
314 |
+
"scale": 20.0,
|
315 |
+
"similarity_fct": "pairwise_cos_sim"
|
316 |
+
}
|
317 |
+
```
|
318 |
+
|
319 |
+
### Evaluation Datasets
|
320 |
+
|
321 |
+
#### reranking_1
|
322 |
+
|
323 |
+
* Dataset: [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking) at [4d853f9](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking/tree/4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c)
|
324 |
+
* Size: 38 evaluation samples
|
325 |
+
* Columns: <code>anchor</code>, <code>positive</code>, and <code>negative</code>
|
326 |
+
* Approximate statistics based on the first 38 samples:
|
327 |
+
| | anchor | positive | negative |
|
328 |
+
|:--------|:---------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
329 |
+
| type | string | string | string |
|
330 |
+
| details | <ul><li>min: 7 tokens</li><li>mean: 14.0 tokens</li><li>max: 24 tokens</li></ul> | <ul><li>min: 10 tokens</li><li>mean: 77.58 tokens</li><li>max: 371 tokens</li></ul> | <ul><li>min: 2 tokens</li><li>mean: 196.55 tokens</li><li>max: 291 tokens</li></ul> |
|
331 |
+
* Samples:
|
332 |
+
| anchor | positive | negative |
|
333 |
+
|:-------------------------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
334 |
+
| <code>how do i clean install windows 7 on the `` other '' partition ?</code> | <code>how to partition disk in ubuntu and then install windows 7 ? install windows 7 on seperate partitions without losing grub how do i create a partion to install windows ? doubt : about dual boot ( 14.04 with windows 7 ) how do i install windows 7 from an iso file on a separate partition from ubuntu ? how to partition for a dual boot</code> | <code>install ubuntu in a specific partition side by side with windows 7 windows 7 system partition i have xp on one partition and windows 7 on another . how do i install ubuntu on a seperate partition ? cant ' dual install xubuntu and windows 7 i have formatted a partition for ubuntu . how do i install it on that partition ? grub wo n't load windows 7 ( unknown file system ) how to delete windows xp and integrate its partition to ubuntu ? uninstalling ubuntu when it is on the windows partition upgrading current version of ubuntu , on a multi boot system . a partition is necessary before installing ubuntu on windows 7 ? how to do a clean reinstall of ubuntu ? can i use testdisk to recover the windows partition over which ubuntu was installed ? how to update dual boot windows 7 / ubuntu 13.04 to 14.04 if i chose `` replace windows with ubuntu '' , do i lose the other partition too ?</code> |
|
335 |
+
| <code>is it possible to have two different dpi configurations for two different screens ?</code> | <code>how can i change the dpi of my monitors separately ? using external monitor with laptop monitor as separate monitors resolution in login screen different text scaling factors for different displays ? external display is showing and reporting wrong resolutions hard drive encryption boot screen resolution how to disable clone display mode on ubuntu login screen ?</code> | <code>change logon screen display configuration login screen on the wrong monitor only one resolution available in xorg.conf force gdm login screen to the primary monitor how to find and change the screen dpi ? dual screen different font resolution how can i display laptop screen on the tv by hdmi in kubuntu how do i turn off the laptop screen while using an external monitor ? adapt ubuntu to a high-dpi resolution screen how can i change my login screen resolution when connected to my monitor ( 12.04 ) dpi setting in ubuntu 13.10 resolution of the login screen is wrong on a second monitor force full-screen game to one monitor ?</code> |
|
336 |
+
| <code>any command line calculator for ubuntu ?</code> | <code>quick simple mathematics calculations ubuntu calculator in dash</code> | <code>shortcut to open/focus terminal window how to assign shortcut keys in gnome ? menu bar not visible on gnome-calculator how to permanently enable in-dash calculator in 13.10 a good hex/binary calculator command line calculator that keeps fractional values is there any calculator in software centre which could solve quadratic equations ? how to make shortcut to terminal application ? can calculator show decimal as fraction ? how to open pseudo-terminal devices on terminal ? keep calculator from opening a new window every time i press the `` calculator '' button on the keyboard ? keyboard shortcut for terminal does n't work since updating to 12.10 decimal point from number pad wo n't work on the calculator but will everywhere else how to set qalculator as default calculator ? what is 'calculator ' package ? how to get a 'non-screenlet ' calculator in compiz widget layer ? how do i use the 'scientific ' mode in the calculator ? how can i capture text from my terminal without redirecting it to a text file ?</code> |
|
337 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
338 |
+
```json
|
339 |
+
{
|
340 |
+
"scale": 20.0,
|
341 |
+
"similarity_fct": "cos_sim"
|
342 |
+
}
|
343 |
+
```
|
344 |
+
|
345 |
+
#### retrival_1
|
346 |
+
|
347 |
+
* Dataset: [retrival_1](https://huggingface.co/datasets/mteb/arguana) at [c22ab2a](https://huggingface.co/datasets/mteb/arguana/tree/c22ab2a51041ffd869aaddef7af8d8215647e41a)
|
348 |
+
* Size: 868 evaluation samples
|
349 |
+
* Columns: <code>title</code> and <code>text</code>
|
350 |
+
* Approximate statistics based on the first 868 samples:
|
351 |
+
| | title | text |
|
352 |
+
|:--------|:--------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
353 |
+
| type | string | string |
|
354 |
+
| details | <ul><li>min: 2 tokens</li><li>mean: 5.0 tokens</li><li>max: 17 tokens</li></ul> | <ul><li>min: 26 tokens</li><li>mean: 204.03 tokens</li><li>max: 512 tokens</li></ul> |
|
355 |
+
* Samples:
|
356 |
+
| title | text |
|
357 |
+
|:--------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
358 |
+
| <code></code> | <code>Behind the veil of ignorance, human beings may not in fact side with what gives them the statistical greatest chance of survival. As Rawls himself notes, people are naturally risk-averse, and thus will select the rules that protect them from the worst possible situations, even if that sacrifice would help many others. Most people find the prospect of being actively killed by the conscious action of another human being worse than simply dying in an accident, and would seek to protect themselves against that worse outcome.</code> |
|
359 |
+
| <code></code> | <code>Schengen membership is not the same as EU membership – some non-EU states, such as Switzerland are part of Schengen, the UK and Ireland are EU member states but are not. Joining Schengen would involve the politically sensitive issue of undocumented migrants, which could not only be fatal to Cape Verde joining Schengen but to integration with Europe itself. Even if it is unlikely, is it that difficult for people to show a passport? Besides, tourism is not just from Europe to outside – a Euro move would only stop Europeans from needing to change currencies. The peg is the best of both worlds in that it means that the currency is stable.</code> |
|
360 |
+
| <code></code> | <code>News organisations cannot be completely transparent if they are to do their job properly and News International is no exception. Such organisations cannot for example reveal their sources as this may sometimes put their sources at risk and would mean that others would not come forward. As part of this news companies need to keep secret how they obtained information. While an attempt by a newspaper to cover up crimes is regrettable this one newspapers actions should not tar the whole company and its other papers.</code> |
|
361 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
362 |
+
```json
|
363 |
+
{
|
364 |
+
"scale": 20.0,
|
365 |
+
"similarity_fct": "cos_sim"
|
366 |
+
}
|
367 |
+
```
|
368 |
+
|
369 |
+
#### sts_1
|
370 |
+
|
371 |
+
* Dataset: [sts_1](https://huggingface.co/datasets/mteb/biosses-sts) at [9ee918f](https://huggingface.co/datasets/mteb/biosses-sts/tree/9ee918f184421b6bd48b78f6c714d86546106103)
|
372 |
+
* Size: 10 evaluation samples
|
373 |
+
* Columns: <code>sentence1</code>, <code>sentence2</code>, and <code>score</code>
|
374 |
+
* Approximate statistics based on the first 10 samples:
|
375 |
+
| | sentence1 | sentence2 | score |
|
376 |
+
|:--------|:----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
377 |
+
| type | string | string | float |
|
378 |
+
| details | <ul><li>min: 17 tokens</li><li>mean: 38.4 tokens</li><li>max: 61 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 46.8 tokens</li><li>max: 62 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 1.76</li><li>max: 3.2</li></ul> |
|
379 |
+
* Samples:
|
380 |
+
| sentence1 | sentence2 | score |
|
381 |
+
|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
382 |
+
| <code>Recently, it was reported that expression of IDH1R132H suppresses TET2 activity and the mutations of IDH1 and IDH2 genes occur in a mutual exclusive manner with that of TET2 gene in AML </code> | <code>The mechanism was clarified by yet another genomic survey, this time involving acute myelogenous leukemia (AML).</code> | <code>1.4</code> |
|
383 |
+
| <code>Recently, it was reported that expression of IDH1R132H suppresses TET2 activity and the mutations of IDH1 and IDH2 genes occur in a mutual exclusive manner with that of TET2 gene in AML.</code> | <code>This large-scale study showed that IDH1/IDH2 mutations were mutually exclusive with inactivating TET2 mutations, suggesting that the two types of mutations had similar effects and were thus functionally redundant.</code> | <code>3.2</code> |
|
384 |
+
| <code>A gene that warrants further studies is the erythropoietin receptor that is 7.4-fold higher expressed in TEL-AML1-positive cases compared to other precursor B-ALL cases confirming other gene expression classification studies.</code> | <code>Another recent gene expression study of large numbers of cases provided support for the hypothesis that distinct leukemias are specified by each of the unique chromosomal abnormalities found in lymphoblastic leukemias.</code> | <code>0.6</code> |
|
385 |
+
* Loss: [<code>CoSENTLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosentloss) with these parameters:
|
386 |
+
```json
|
387 |
+
{
|
388 |
+
"scale": 20.0,
|
389 |
+
"similarity_fct": "pairwise_cos_sim"
|
390 |
+
}
|
391 |
+
```
|
392 |
+
|
393 |
+
### Training Hyperparameters
|
394 |
+
#### Non-Default Hyperparameters
|
395 |
+
|
396 |
+
- `eval_strategy`: epoch
|
397 |
+
- `per_device_train_batch_size`: 2
|
398 |
+
- `per_device_eval_batch_size`: 2
|
399 |
+
- `gradient_accumulation_steps`: 8
|
400 |
+
- `learning_rate`: 2e-05
|
401 |
+
- `num_train_epochs`: 5
|
402 |
+
- `lr_scheduler_type`: cosine
|
403 |
+
- `warmup_ratio`: 0.1
|
404 |
+
- `bf16`: True
|
405 |
+
- `tf32`: True
|
406 |
+
- `optim`: adamw_torch_fused
|
407 |
+
- `batch_sampler`: no_duplicates
|
408 |
+
|
409 |
+
#### All Hyperparameters
|
410 |
+
<details><summary>Click to expand</summary>
|
411 |
+
|
412 |
+
- `overwrite_output_dir`: False
|
413 |
+
- `do_predict`: False
|
414 |
+
- `eval_strategy`: epoch
|
415 |
+
- `prediction_loss_only`: True
|
416 |
+
- `per_device_train_batch_size`: 2
|
417 |
+
- `per_device_eval_batch_size`: 2
|
418 |
+
- `per_gpu_train_batch_size`: None
|
419 |
+
- `per_gpu_eval_batch_size`: None
|
420 |
+
- `gradient_accumulation_steps`: 8
|
421 |
+
- `eval_accumulation_steps`: None
|
422 |
+
- `learning_rate`: 2e-05
|
423 |
+
- `weight_decay`: 0.0
|
424 |
+
- `adam_beta1`: 0.9
|
425 |
+
- `adam_beta2`: 0.999
|
426 |
+
- `adam_epsilon`: 1e-08
|
427 |
+
- `max_grad_norm`: 1.0
|
428 |
+
- `num_train_epochs`: 5
|
429 |
+
- `max_steps`: -1
|
430 |
+
- `lr_scheduler_type`: cosine
|
431 |
+
- `lr_scheduler_kwargs`: {}
|
432 |
+
- `warmup_ratio`: 0.1
|
433 |
+
- `warmup_steps`: 0
|
434 |
+
- `log_level`: passive
|
435 |
+
- `log_level_replica`: warning
|
436 |
+
- `log_on_each_node`: True
|
437 |
+
- `logging_nan_inf_filter`: True
|
438 |
+
- `save_safetensors`: True
|
439 |
+
- `save_on_each_node`: False
|
440 |
+
- `save_only_model`: False
|
441 |
+
- `restore_callback_states_from_checkpoint`: False
|
442 |
+
- `no_cuda`: False
|
443 |
+
- `use_cpu`: False
|
444 |
+
- `use_mps_device`: False
|
445 |
+
- `seed`: 42
|
446 |
+
- `data_seed`: None
|
447 |
+
- `jit_mode_eval`: False
|
448 |
+
- `use_ipex`: False
|
449 |
+
- `bf16`: True
|
450 |
+
- `fp16`: False
|
451 |
+
- `fp16_opt_level`: O1
|
452 |
+
- `half_precision_backend`: auto
|
453 |
+
- `bf16_full_eval`: False
|
454 |
+
- `fp16_full_eval`: False
|
455 |
+
- `tf32`: True
|
456 |
+
- `local_rank`: 0
|
457 |
+
- `ddp_backend`: None
|
458 |
+
- `tpu_num_cores`: None
|
459 |
+
- `tpu_metrics_debug`: False
|
460 |
+
- `debug`: []
|
461 |
+
- `dataloader_drop_last`: False
|
462 |
+
- `dataloader_num_workers`: 0
|
463 |
+
- `dataloader_prefetch_factor`: None
|
464 |
+
- `past_index`: -1
|
465 |
+
- `disable_tqdm`: False
|
466 |
+
- `remove_unused_columns`: True
|
467 |
+
- `label_names`: None
|
468 |
+
- `load_best_model_at_end`: False
|
469 |
+
- `ignore_data_skip`: False
|
470 |
+
- `fsdp`: []
|
471 |
+
- `fsdp_min_num_params`: 0
|
472 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
473 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
474 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
475 |
+
- `deepspeed`: None
|
476 |
+
- `label_smoothing_factor`: 0.0
|
477 |
+
- `optim`: adamw_torch_fused
|
478 |
+
- `optim_args`: None
|
479 |
+
- `adafactor`: False
|
480 |
+
- `group_by_length`: False
|
481 |
+
- `length_column_name`: length
|
482 |
+
- `ddp_find_unused_parameters`: None
|
483 |
+
- `ddp_bucket_cap_mb`: None
|
484 |
+
- `ddp_broadcast_buffers`: False
|
485 |
+
- `dataloader_pin_memory`: True
|
486 |
+
- `dataloader_persistent_workers`: False
|
487 |
+
- `skip_memory_metrics`: True
|
488 |
+
- `use_legacy_prediction_loop`: False
|
489 |
+
- `push_to_hub`: False
|
490 |
+
- `resume_from_checkpoint`: None
|
491 |
+
- `hub_model_id`: None
|
492 |
+
- `hub_strategy`: every_save
|
493 |
+
- `hub_private_repo`: False
|
494 |
+
- `hub_always_push`: False
|
495 |
+
- `gradient_checkpointing`: False
|
496 |
+
- `gradient_checkpointing_kwargs`: None
|
497 |
+
- `include_inputs_for_metrics`: False
|
498 |
+
- `eval_do_concat_batches`: True
|
499 |
+
- `fp16_backend`: auto
|
500 |
+
- `push_to_hub_model_id`: None
|
501 |
+
- `push_to_hub_organization`: None
|
502 |
+
- `mp_parameters`:
|
503 |
+
- `auto_find_batch_size`: False
|
504 |
+
- `full_determinism`: False
|
505 |
+
- `torchdynamo`: None
|
506 |
+
- `ray_scope`: last
|
507 |
+
- `ddp_timeout`: 1800
|
508 |
+
- `torch_compile`: False
|
509 |
+
- `torch_compile_backend`: None
|
510 |
+
- `torch_compile_mode`: None
|
511 |
+
- `dispatch_batches`: None
|
512 |
+
- `split_batches`: None
|
513 |
+
- `include_tokens_per_second`: False
|
514 |
+
- `include_num_input_tokens_seen`: False
|
515 |
+
- `neftune_noise_alpha`: None
|
516 |
+
- `optim_target_modules`: None
|
517 |
+
- `batch_eval_metrics`: False
|
518 |
+
- `batch_sampler`: no_duplicates
|
519 |
+
- `multi_dataset_batch_sampler`: proportional
|
520 |
+
|
521 |
+
</details>
|
522 |
+
|
523 |
+
### Training Logs
|
524 |
+
| Epoch | Step | Training Loss | reranking 1 loss | retrival 1 loss | sts 1 loss |
|
525 |
+
|:------:|:----:|:-------------:|:----------------:|:---------------:|:----------:|
|
526 |
+
| 0.9716 | 500 | 0.4296 | - | - | - |
|
527 |
+
| 0.9988 | 514 | - | 0.2080 | 0.1297 | 0.1096 |
|
528 |
+
| 0.9716 | 500 | 0.0933 | - | - | - |
|
529 |
+
| 0.9988 | 514 | - | 0.2104 | 0.1012 | 0.5515 |
|
530 |
+
| 0.9716 | 500 | 0.0435 | - | - | - |
|
531 |
+
| 0.9988 | 514 | - | 0.2026 | 0.1434 | 0.4824 |
|
532 |
+
| 0.9716 | 500 | 0.0282 | - | - | - |
|
533 |
+
| 0.9988 | 514 | - | 0.1827 | 0.1305 | 0.2950 |
|
534 |
+
| 1.9432 | 1000 | 0.0555 | - | - | - |
|
535 |
+
| 1.9995 | 1029 | - | 0.3932 | 0.0693 | 0.8649 |
|
536 |
+
| 2.9147 | 1500 | 0.0151 | - | - | - |
|
537 |
+
| 2.9983 | 1543 | - | 0.2112 | 0.0555 | 0.5478 |
|
538 |
+
| 3.8863 | 2000 | 0.0036 | - | - | - |
|
539 |
+
| 3.9990 | 2058 | - | 0.1921 | 0.0432 | 0.5912 |
|
540 |
+
| 4.8579 | 2500 | 0.0013 | - | - | - |
|
541 |
+
| 4.9939 | 2570 | - | 0.1904 | 0.0412 | 0.6356 |
|
542 |
+
|
543 |
+
|
544 |
+
### Framework Versions
|
545 |
+
- Python: 3.10.12
|
546 |
+
- Sentence Transformers: 3.0.1
|
547 |
+
- Transformers: 4.41.2
|
548 |
+
- PyTorch: 2.2.0+cu121
|
549 |
+
- Accelerate: 0.31.0
|
550 |
+
- Datasets: 2.20.0
|
551 |
+
- Tokenizers: 0.19.1
|
552 |
+
|
553 |
+
## Citation
|
554 |
+
|
555 |
+
### BibTeX
|
556 |
+
|
557 |
+
#### Sentence Transformers
|
558 |
+
```bibtex
|
559 |
+
@inproceedings{reimers-2019-sentence-bert,
|
560 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
561 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
562 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
563 |
+
month = "11",
|
564 |
+
year = "2019",
|
565 |
+
publisher = "Association for Computational Linguistics",
|
566 |
+
url = "https://arxiv.org/abs/1908.10084",
|
567 |
+
}
|
568 |
+
```
|
569 |
+
|
570 |
+
#### CoSENTLoss
|
571 |
+
```bibtex
|
572 |
+
@online{kexuefm-8847,
|
573 |
+
title={CoSENT: A more efficient sentence vector scheme than Sentence-BERT},
|
574 |
+
author={Su Jianlin},
|
575 |
+
year={2022},
|
576 |
+
month={Jan},
|
577 |
+
url={https://kexue.fm/archives/8847},
|
578 |
+
}
|
579 |
+
```
|
580 |
+
|
581 |
+
<!--
|
582 |
+
## Glossary
|
583 |
+
|
584 |
+
*Clearly define terms in order to be accessible across audiences.*
|
585 |
+
-->
|
586 |
+
|
587 |
+
<!--
|
588 |
+
## Model Card Authors
|
589 |
+
|
590 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
591 |
+
-->
|
592 |
+
|
593 |
+
<!--
|
594 |
+
## Model Card Contact
|
595 |
+
|
596 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
597 |
+
-->
|
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 768,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": false,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
README.md
ADDED
@@ -0,0 +1,597 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model: microsoft/mpnet-base
|
3 |
+
datasets:
|
4 |
+
- mteb/askubuntudupquestions-reranking
|
5 |
+
- mteb/mind_small
|
6 |
+
- mteb/scidocs-reranking
|
7 |
+
- mteb/stackoverflowdupquestions-reranking
|
8 |
+
- mteb/arguana
|
9 |
+
- mteb/climate-fever
|
10 |
+
- mteb/cqadupstack-android
|
11 |
+
- mteb/cqadupstack-english
|
12 |
+
- mteb/biosses-sts
|
13 |
+
- mteb/sickr-sts
|
14 |
+
- mteb/sts12-sts
|
15 |
+
- mteb/sts13-sts
|
16 |
+
language:
|
17 |
+
- en
|
18 |
+
library_name: sentence-transformers
|
19 |
+
pipeline_tag: sentence-similarity
|
20 |
+
tags:
|
21 |
+
- sentence-transformers
|
22 |
+
- sentence-similarity
|
23 |
+
- feature-extraction
|
24 |
+
- generated_from_trainer
|
25 |
+
- dataset_size:5130135
|
26 |
+
- loss:MultipleNegativesSymmetricRankingLoss
|
27 |
+
- loss:CoSENTLoss
|
28 |
+
- dataset_size:8233
|
29 |
+
widget:
|
30 |
+
- source_sentence: "This is a sample source sentence." # Ensure this is not empty
|
31 |
+
target_sentence: "This is a sample target sentence." # Ensure this is not empty
|
32 |
+
sentences:
|
33 |
+
- Broadband is a necessary evolution of internet technology that firms would be
|
34 |
+
wise to avail of if they wish to remain competitive. But it is this very desirability
|
35 |
+
that makes the provision of broadband a lucrative business in which many firms
|
36 |
+
participate. Business on a large scale is rarely organised in diffuse patterns,
|
37 |
+
but clustered in major population centres. Economic development can be furnished
|
38 |
+
by the private sector investing in broadband where there is a market. Growth will
|
39 |
+
not be slowed just because some farmers in Nebraska have slower internet. Singapore
|
40 |
+
is an aberrant example, as it is so small and its population so dense that it
|
41 |
+
would be impossible to compare its provision of broadband access to most other
|
42 |
+
countries.
|
43 |
+
- 'In retrospect, the decision to welcome the former Soviet states in the Baltic
|
44 |
+
into NATO appears foolish. They continue to have a prickly relationship with Russia,
|
45 |
+
which has some legitimate concerns about the treatment of large Russian minorities
|
46 |
+
in Latvia and Estonia, and about the siting of US nuclear defences. Their entry
|
47 |
+
into NATO was forced upon Russia, which naturally saw it as an aggressive move
|
48 |
+
designed to humiliate it, and marked the point when its pro-western policy shifted
|
49 |
+
to a more nationalist and confrontational approach. [1] It also weakened the unity
|
50 |
+
of NATO as there are quite legitimate doubts as to whether all the alliance’s
|
51 |
+
members would really go to war with Russia over the integrity of, say, Estonia.
|
52 |
+
Given this history, it would be madness to compound the problem by extending NATO
|
53 |
+
membership to Georgia and Ukraine. [1] Fraser, Malcolm, ‘Ukraine: there’s no
|
54 |
+
way out unless the west understands its past mistakes’, theguardian.com, 3 March
|
55 |
+
2014,'
|
56 |
+
- 'We need to be critical of the cumulative potential of the tax model proposed.
|
57 |
+
Firstly, the theory of the state’s capacity and how it functions in practice differ
|
58 |
+
substantially. The idea of taxation acting to enhance the productive capacity
|
59 |
+
of a nation is based on assumptions that the institutions, human resources, and
|
60 |
+
state-capacity, are already present. This is not always the case in Africa. Corruption
|
61 |
+
and bad governance are prevalent. Reforms in 1996 to curb corruption in the TRA
|
62 |
+
were reversed due to misunderstanding the nature of corruption amongst tax officials
|
63 |
+
and administration (Fjelstad, 2003). Tax-revenue performance remains comparatively
|
64 |
+
low [1] , there is little reason to simply altering what taxes there are will
|
65 |
+
change this. Finally, alternative methods can be used to assist rural infrastructure
|
66 |
+
projects, and enable national savings. For example, revising the role of agricultural
|
67 |
+
marketing boards [2] . [1] See further readings: Gray and Kahn, 2010. [2] See
|
68 |
+
further readings: Baffes, 2005.'
|
69 |
+
- source_sentence: advantages/disadvantages of installing from source code
|
70 |
+
sentences:
|
71 |
+
- 'is it there any advantage to unticking the `` source code '''' entry of a repository
|
72 |
+
? what is the advantage to build unity from source ffmpeg : installing from repository
|
73 |
+
or compiling from source ?'
|
74 |
+
- 'flash player issues flash player alternative for firefox flash videos go fullscreen
|
75 |
+
once ( firefox ) , then after minimising it and trying to go fullscreen again
|
76 |
+
it freezes ( ubuntu 14.04 , gnome desktop ) choppy flash video playback , ''settings
|
77 |
+
'' disabled for flash as well flash player is not working and do n''t know what
|
78 |
+
to do to fix it flash player : sound distorted error flash chrome in ubuntu 14.04'
|
79 |
+
- how to install newest version of minitube from source installing two version of
|
80 |
+
a software how to find source for a line in $ path ? how do i install network
|
81 |
+
driver source code to /lib/modules/ < kernel version > /build/drivers/net/ethernet
|
82 |
+
ca n't install vmware-view-client from partner repo in saucy why apt-get does
|
83 |
+
n't install the newest software what is the right way to reinstall from source
|
84 |
+
after package was installed via apt ? do i have to remove open drivers to switch
|
85 |
+
to fglrx ? how do i install clang version 3 in 10.10 ? adding extract tool to
|
86 |
+
nautilus ( compiled from source code ) how to point to boost built from source
|
87 |
+
how to remove httpd built from source if i build a package from source how can
|
88 |
+
i uninstall or remove completely ? avoid reinstall virtualbox and update to the
|
89 |
+
latest release installing only ruby 1.9 can i update software installed from source
|
90 |
+
code directly determine which package ( s ) were installed from a particular source
|
91 |
+
- source_sentence: will i be able to upgrade to 13.04 from 12.10 with a wubi installation
|
92 |
+
?
|
93 |
+
sentences:
|
94 |
+
- add cron job on startup from a script
|
95 |
+
- upgrading from 12.10 wubi install to 13.04 can i safely upgrade ubuntu 12.10 to
|
96 |
+
13.04 which installed using wubi ? will i be able to use wubi to install ubuntu
|
97 |
+
releases newer than 12.10 ? installing ubuntu in windows 8 with wubi
|
98 |
+
- upgrade from ubuntu server 12.10 to 13.04 wubi after upgrading windows 7 to windows
|
99 |
+
8 should i use wubi ubuntu 12.04 for my academic studies like writing docs , programming
|
100 |
+
, etc ? how to do a fresh re-installation of ubuntu safely on dual boot ? wubi
|
101 |
+
12.10 installation on windows 8 hangs do i keep my windows installation if i install
|
102 |
+
ubuntu with wubi , the windows installer ? move wubi installation of ubuntu to
|
103 |
+
a different partition in windows failed why was wubi removed from 13.04+ backup
|
104 |
+
, install and restore programms/settings of ubuntu ( wubi ) installation unable
|
105 |
+
to install ubuntu 12.10 with wubi in windows 7 - wubi is stuck upgrading my wubi
|
106 |
+
11.04 to 11.10 no additional driver no usb or dvd drive and not able to migrate
|
107 |
+
wubi ( no clue ) how can i remove windows and upgrade wubi install to a full install
|
108 |
+
without a cd or usb stick ? upgrade ubuntu to 13.04 from 12.10 on dual-boot laptop
|
109 |
+
upgrading ubuntu 12.10 to 13.04 using bootable usb alongside windows 7
|
110 |
+
- source_sentence: how do i use ubuntu 's web application integration ?
|
111 |
+
sentences:
|
112 |
+
- out of the box ubuntu 13.04 with chromium does not automatically use web apps
|
113 |
+
- why i do not have gnome shell with gnome 3 ? no gnome shell after install on ubuntu
|
114 |
+
12.04 inside vmware workstation
|
115 |
+
- how do i put a web application on the launcher ? how can i force ubuntu to use
|
116 |
+
font a instead font b in all applications and web pages ? how to remove the web
|
117 |
+
app shortcut created by chromium ? is there any finished tutorial on how to develop
|
118 |
+
and package unity web apps ? how do i put web applications in my unity launcher
|
119 |
+
? how to ftp transfer files to /var/www ? i would like to set up a ubuntu os on
|
120 |
+
amazon web server , how do i do this is there a way to request support for web
|
121 |
+
applications not currently supported ? how to test web applications for mobile
|
122 |
+
devices on ubuntu ? can i use unity web apps in ubuntu 13.10 ? how to create chrome/chromium
|
123 |
+
web application desktop shortcut ? icedtea-web 1.5 needs confirmation to run trusted
|
124 |
+
applet xul + unity web api hp pavilion dv2000 web camera driver how to open applications
|
125 |
+
after booting a purely command line interface ? trouble connecting to wireless
|
126 |
+
via clear hub express are web apps still part of ubuntu 's future ? newer versions
|
127 |
+
of chromium ? powerpc macs and 12.04 lts application support
|
128 |
+
- source_sentence: 'This form of necrosis, also termed necroptosis, requires the activity
|
129 |
+
of receptor-interacting protein kinase 1 (RIP1) and its related kinase, RIP3 '
|
130 |
+
sentences:
|
131 |
+
- This large-scale study showed that IDH1/IDH2 mutations were mutually exclusive
|
132 |
+
with inactivating TET2 mutations, suggesting that the two types of mutations had
|
133 |
+
similar effects and were thus functionally redundant.
|
134 |
+
- Co-transfection of miRVec-miR-204 and the Renilla-3′ UTR plasmid was in HEK293T
|
135 |
+
cells with TransIT-LT1 Transfection Reagent (Mirus)
|
136 |
+
- TNF-mediated programmed necrosis typically involves the receptor-interacting serine-threonine
|
137 |
+
kinases 1 and 3 (RIP1 and RIP3), as evidenced in human, mouse, and zebrafish cell
|
138 |
+
lines, as well as in a murine sepsis model
|
139 |
+
---
|
140 |
+
|
141 |
+
# SentenceTransformer based on microsoft/mpnet-base
|
142 |
+
|
143 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [microsoft/mpnet-base](https://huggingface.co/microsoft/mpnet-base) on the [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking), [retrival_1](https://huggingface.co/datasets/mteb/arguana) and [sts_1](https://huggingface.co/datasets/mteb/biosses-sts) datasets. It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
144 |
+
|
145 |
+
## Model Details
|
146 |
+
|
147 |
+
### Model Description
|
148 |
+
- **Model Type:** Sentence Transformer
|
149 |
+
- **Base model:** [microsoft/mpnet-base](https://huggingface.co/microsoft/mpnet-base) <!-- at revision 6996ce1e91bd2a9c7d7f61daec37463394f73f09 -->
|
150 |
+
- **Maximum Sequence Length:** 512 tokens
|
151 |
+
- **Output Dimensionality:** 768 dimensions
|
152 |
+
- **Similarity Function:** Cosine Similarity
|
153 |
+
- **Training Datasets:**
|
154 |
+
- [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking)
|
155 |
+
- [retrival_1](https://huggingface.co/datasets/mteb/arguana)
|
156 |
+
- [sts_1](https://huggingface.co/datasets/mteb/biosses-sts)
|
157 |
+
- **Language:** en
|
158 |
+
<!-- - **License:** Unknown -->
|
159 |
+
|
160 |
+
### Model Sources
|
161 |
+
|
162 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
163 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
164 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
165 |
+
|
166 |
+
### Full Model Architecture
|
167 |
+
|
168 |
+
```
|
169 |
+
SentenceTransformer(
|
170 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False}) with Transformer model: MPNetModel
|
171 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
172 |
+
)
|
173 |
+
```
|
174 |
+
|
175 |
+
## Usage
|
176 |
+
|
177 |
+
### Direct Usage (Sentence Transformers)
|
178 |
+
|
179 |
+
First install the Sentence Transformers library:
|
180 |
+
|
181 |
+
```bash
|
182 |
+
pip install -U sentence-transformers
|
183 |
+
```
|
184 |
+
|
185 |
+
Then you can load this model and run inference.
|
186 |
+
```python
|
187 |
+
from sentence_transformers import SentenceTransformer
|
188 |
+
|
189 |
+
# Download from the 🤗 Hub
|
190 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
191 |
+
# Run inference
|
192 |
+
sentences = [
|
193 |
+
'This form of necrosis, also termed necroptosis, requires the activity of receptor-interacting protein kinase 1 (RIP1) and its related kinase, RIP3 ',
|
194 |
+
'TNF-mediated programmed necrosis typically involves the receptor-interacting serine-threonine kinases 1 and 3 (RIP1 and RIP3), as evidenced in human, mouse, and zebrafish cell lines, as well as in a murine sepsis model',
|
195 |
+
'This large-scale study showed that IDH1/IDH2 mutations were mutually exclusive with inactivating TET2 mutations, suggesting that the two types of mutations had similar effects and were thus functionally redundant.',
|
196 |
+
]
|
197 |
+
embeddings = model.encode(sentences)
|
198 |
+
print(embeddings.shape)
|
199 |
+
# [3, 768]
|
200 |
+
|
201 |
+
# Get the similarity scores for the embeddings
|
202 |
+
similarities = model.similarity(embeddings, embeddings)
|
203 |
+
print(similarities.shape)
|
204 |
+
# [3, 3]
|
205 |
+
```
|
206 |
+
|
207 |
+
<!--
|
208 |
+
### Direct Usage (Transformers)
|
209 |
+
|
210 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
211 |
+
|
212 |
+
</details>
|
213 |
+
-->
|
214 |
+
|
215 |
+
<!--
|
216 |
+
### Downstream Usage (Sentence Transformers)
|
217 |
+
|
218 |
+
You can finetune this model on your own dataset.
|
219 |
+
|
220 |
+
<details><summary>Click to expand</summary>
|
221 |
+
|
222 |
+
</details>
|
223 |
+
-->
|
224 |
+
|
225 |
+
<!--
|
226 |
+
### Out-of-Scope Use
|
227 |
+
|
228 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
229 |
+
-->
|
230 |
+
|
231 |
+
<!--
|
232 |
+
## Bias, Risks and Limitations
|
233 |
+
|
234 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
235 |
+
-->
|
236 |
+
|
237 |
+
<!--
|
238 |
+
### Recommendations
|
239 |
+
|
240 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
241 |
+
-->
|
242 |
+
|
243 |
+
## Training Details
|
244 |
+
|
245 |
+
### Training Datasets
|
246 |
+
|
247 |
+
#### reranking_1
|
248 |
+
|
249 |
+
* Dataset: [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking) at [4d853f9](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking/tree/4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c)
|
250 |
+
* Size: 337 training samples
|
251 |
+
* Columns: <code>anchor</code>, <code>positive</code>, and <code>negative</code>
|
252 |
+
* Approximate statistics based on all 337 samples:
|
253 |
+
| | anchor | positive | negative |
|
254 |
+
|:--------|:----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|
|
255 |
+
| type | string | string | string |
|
256 |
+
| details | <ul><li>min: 4 tokens</li><li>mean: 14.94 tokens</li><li>max: 39 tokens</li></ul> | <ul><li>min: 5 tokens</li><li>mean: 84.1 tokens</li><li>max: 407 tokens</li></ul> | <ul><li>min: 2 tokens</li><li>mean: 188.2 tokens</li><li>max: 391 tokens</li></ul> |
|
257 |
+
* Samples:
|
258 |
+
| anchor | positive | negative |
|
259 |
+
|:------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
260 |
+
| <code>black screen after installation with wubi</code> | <code>will installing ubuntu harm my computer ? wubi boot problem ca n't install on an emachines e725 black screen after purple ubuntu screen error , then black screen after wubi 11.10 goes into purple screen with black squares trying to login ( using wubi ) system hangs after wubi install screen turns off on boot dark purple screen with graphic corruption at boot , using wubi can i install 32 bit ubuntu on dual boot with 64 bit windows 7 ? black screen during installation ubuntu 12.10 via wubi on hp pavillion g6-1273s1 ubuntu wont boot after installing wubi from windows 7 windows 8 dual boot problem dual boot , ubuntu wo n't boot ! second wubi installation not working ubuntu after boot shows a black screen with a warning reboot required</code> | <code>how to fix black screen after boot purple then black screen after booting ? black screen after the grub screen ca n't boot after update , purple/black screen</code> |
|
261 |
+
| <code>wubi gives error 'nonetype ' object has no attribute 'get_info '</code> | <code>nonetype object has no attribute get_info ubuntu 14.04 can not install ubuntu 13.04 using wubi why does wubi installation fail with `` error : 'none type ' object has no attribute 'get_info ' '' ? error - 'nonetype ' object has no attribute 'get_info ' during xubuntu installation ca n't install 12.04 inside windows 7 using wubi error while installing ubuntu as separate os on my pc ? wubi 's error while installin ubuntu 12.10 on windows 7 why is wubi giving me an error message when i try to install ? ubuntu 12.10 install fails , both native and wubi asus eeepc 1015cx ubuntu 32 bits or 64bits ?</code> | <code>attributeerror : 'module ' object has no attribute openshot does n't launch with `` failed to import '' message software center not working ubuntu one not syncing ... in windows xp sp3 ubuntu one for windows client : `` attributeerror '' messages ubuntu one sign in error ( after installation completed ) : `` nonetype '' object has no attribute `` make file '' `` attributeerror : 'nonetype ' object has no attribute 'group ' '' when trying to use youtube-dl ' '' windows backend object has no attribute 'iso-path ' - see log for details . ' error when trying to install how can i resolve a 'windows backend : object has no attribute iso_path ' error while installing with wubi ? 'module ' object has no attribute 'py2 '</code> |
|
262 |
+
| <code>give permission to /var/www</code> | <code>write permissions in /var/www folder folders and files permission problem user ca n't ftp to a directory but is part of the group that owns it how to give read write permission to a folder and its sub folders and files ? give apache permission to write to /home/*/www/ directories give www-data write permission to /home ? assining permission to www folder problems with the /var/www folder trouble accessing www folders - permission or ownership ? group access to directory i am part of a group , but i can not create files apache 'you do n't have permission to access / on this server '</code> | <code>missing /var/www lubuntu 13.04 change permission from -rwxrwxr-x to drwxrwxr-x wordpress upload permission on nginx & ubuntu how do i restore the default permission on a directory/folder ? file permission in www/html directory for security problem while installing visual paradigm uml tool ? setting up home folders for users for 12.04 server edition -ls : can not open directory . : permission denied changed apache www folder</code> |
|
263 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
264 |
+
```json
|
265 |
+
{
|
266 |
+
"scale": 20.0,
|
267 |
+
"similarity_fct": "cos_sim"
|
268 |
+
}
|
269 |
+
```
|
270 |
+
|
271 |
+
#### retrival_1
|
272 |
+
|
273 |
+
* Dataset: [retrival_1](https://huggingface.co/datasets/mteb/arguana) at [c22ab2a](https://huggingface.co/datasets/mteb/arguana/tree/c22ab2a51041ffd869aaddef7af8d8215647e41a)
|
274 |
+
* Size: 7,806 training samples
|
275 |
+
* Columns: <code>title</code> and <code>text</code>
|
276 |
+
* Approximate statistics based on the first 1000 samples:
|
277 |
+
| | title | text |
|
278 |
+
|:--------|:---------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
279 |
+
| type | string | string |
|
280 |
+
| details | <ul><li>min: 2 tokens</li><li>mean: 5.42 tokens</li><li>max: 17 tokens</li></ul> | <ul><li>min: 41 tokens</li><li>mean: 199.3 tokens</li><li>max: 512 tokens</li></ul> |
|
281 |
+
* Samples:
|
282 |
+
| title | text |
|
283 |
+
|:--------------|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
284 |
+
| <code></code> | <code>Not having children is environmentally friendly The more people consume in the world, the greater the environmental damage. An average American produces 52 tons of garbage by the age of 75.* However, producing extra litter and pollution is not the only hazard that every child poses to the planet. Increasing world’s population also places incredible stress on Earth’s resources. It is estimated, for instance, that by 2025 three billion people will live in water-scarce countries. By reducing the number of human beings we will manage to avoid numerous overpopulation crises and reverse the damage done to the environment. * Tufts Climate Initiative., 2006,</code> |
|
285 |
+
| <code></code> | <code>The need for interaction is all the more reason to ensure that all ideas are in the marketplace. This way, the veracity of all ideas are questioned. For example, if someone brings bigoted ideas with them as a freshman, perhaps because these ideas were prevalent in the community they grew up in, if they cannot express these ideas and be challenged they may never attempt to integrate. Instead, they will gravitate to those who share their ideas and remain isolated.</code> |
|
286 |
+
| <code></code> | <code>Putting the power to censor the internet, no matter how stringent or specific the guidelines, into the hands of a private organization is misguided. It is the state not individual ISPs who are needed to assess how dangerous a site is, whether it is actually promoting extremism, and ultimately make a decision as to whether a site needs to be blocked. The ISPs may end up being the actors that implement the policy but it has to be government that decides which websites to block and why. This also means that the decision would be much more centralised. Leaving this decision to the discretion of individual ISPs will mean that some websites will be blocked on some ISPs and not on others. Only government can ensure that there is consistency.</code> |
|
287 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
288 |
+
```json
|
289 |
+
{
|
290 |
+
"scale": 20.0,
|
291 |
+
"similarity_fct": "cos_sim"
|
292 |
+
}
|
293 |
+
```
|
294 |
+
|
295 |
+
#### sts_1
|
296 |
+
|
297 |
+
* Dataset: [sts_1](https://huggingface.co/datasets/mteb/biosses-sts) at [9ee918f](https://huggingface.co/datasets/mteb/biosses-sts/tree/9ee918f184421b6bd48b78f6c714d86546106103)
|
298 |
+
* Size: 90 training samples
|
299 |
+
* Columns: <code>sentence1</code>, <code>sentence2</code>, and <code>score</code>
|
300 |
+
* Approximate statistics based on all 90 samples:
|
301 |
+
| | sentence1 | sentence2 | score |
|
302 |
+
|:--------|:-----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
303 |
+
| type | string | string | float |
|
304 |
+
| details | <ul><li>min: 13 tokens</li><li>mean: 39.44 tokens</li><li>max: 88 tokens</li></ul> | <ul><li>min: 12 tokens</li><li>mean: 38.43 tokens</li><li>max: 95 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 2.24</li><li>max: 4.0</li></ul> |
|
305 |
+
* Samples:
|
306 |
+
| sentence1 | sentence2 | score |
|
307 |
+
|:-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
308 |
+
| <code>As p16INK4a blocks the inactivation of pRb by cyclin-dependent kinases, and Arf blocks the inactivation of p53 by Mdm2-mediated proteolysis, both have the capacity to cause cell cycle arrest.</code> | <code>By inducing Arf and Ink4a in primary rodent fibroblasts, oncogenic Ras expression leads to growth arrest and premature senescence.</code> | <code>2.4</code> |
|
309 |
+
| <code>Several lines of evidence suggest that the known principal RB pathway lesions in human tumors act in a mutual exclusive manner.</code> | <code>In individual human tumor specimens, these principal components of the pathway—RB-CDK4/6-p16INK4A—are reported to be targeted in a mutually exclusive manner.</code> | <code>3.4</code> |
|
310 |
+
| <code>T47D, MCF-7, Skbr3, HeLa, and Caco-2 cells were transfected by electroporation as described previously.</code> | <code> MCF7 or HeLa cells were electroporated as described previously to more than 95% efficiency with pSuper constructs against the various targets, and 72 hr later, protein expression was analyzed by SDS-PAGE and Western blotting.</code> | <code>3.0</code> |
|
311 |
+
* Loss: [<code>CoSENTLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosentloss) with these parameters:
|
312 |
+
```json
|
313 |
+
{
|
314 |
+
"scale": 20.0,
|
315 |
+
"similarity_fct": "pairwise_cos_sim"
|
316 |
+
}
|
317 |
+
```
|
318 |
+
|
319 |
+
### Evaluation Datasets
|
320 |
+
|
321 |
+
#### reranking_1
|
322 |
+
|
323 |
+
* Dataset: [reranking_1](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking) at [4d853f9](https://huggingface.co/datasets/mteb/askubuntudupquestions-reranking/tree/4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c)
|
324 |
+
* Size: 38 evaluation samples
|
325 |
+
* Columns: <code>anchor</code>, <code>positive</code>, and <code>negative</code>
|
326 |
+
* Approximate statistics based on all 38 samples:
|
327 |
+
| | anchor | positive | negative |
|
328 |
+
|:--------|:---------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
329 |
+
| type | string | string | string |
|
330 |
+
| details | <ul><li>min: 7 tokens</li><li>mean: 14.0 tokens</li><li>max: 24 tokens</li></ul> | <ul><li>min: 10 tokens</li><li>mean: 77.58 tokens</li><li>max: 371 tokens</li></ul> | <ul><li>min: 2 tokens</li><li>mean: 196.55 tokens</li><li>max: 291 tokens</li></ul> |
|
331 |
+
* Samples:
|
332 |
+
| anchor | positive | negative |
|
333 |
+
|:-------------------------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
334 |
+
| <code>how do i clean install windows 7 on the `` other '' partition ?</code> | <code>how to partition disk in ubuntu and then install windows 7 ? install windows 7 on seperate partitions without losing grub how do i create a partion to install windows ? doubt : about dual boot ( 14.04 with windows 7 ) how do i install windows 7 from an iso file on a separate partition from ubuntu ? how to partition for a dual boot</code> | <code>install ubuntu in a specific partition side by side with windows 7 windows 7 system partition i have xp on one partition and windows 7 on another . how do i install ubuntu on a seperate partition ? cant ' dual install xubuntu and windows 7 i have formatted a partition for ubuntu . how do i install it on that partition ? grub wo n't load windows 7 ( unknown file system ) how to delete windows xp and integrate its partition to ubuntu ? uninstalling ubuntu when it is on the windows partition upgrading current version of ubuntu , on a multi boot system . a partition is necessary before installing ubuntu on windows 7 ? how to do a clean reinstall of ubuntu ? can i use testdisk to recover the windows partition over which ubuntu was installed ? how to update dual boot windows 7 / ubuntu 13.04 to 14.04 if i chose `` replace windows with ubuntu '' , do i lose the other partition too ?</code> |
|
335 |
+
| <code>is it possible to have two different dpi configurations for two different screens ?</code> | <code>how can i change the dpi of my monitors separately ? using external monitor with laptop monitor as separate monitors resolution in login screen different text scaling factors for different displays ? external display is showing and reporting wrong resolutions hard drive encryption boot screen resolution how to disable clone display mode on ubuntu login screen ?</code> | <code>change logon screen display configuration login screen on the wrong monitor only one resolution available in xorg.conf force gdm login screen to the primary monitor how to find and change the screen dpi ? dual screen different font resolution how can i display laptop screen on the tv by hdmi in kubuntu how do i turn off the laptop screen while using an external monitor ? adapt ubuntu to a high-dpi resolution screen how can i change my login screen resolution when connected to my monitor ( 12.04 ) dpi setting in ubuntu 13.10 resolution of the login screen is wrong on a second monitor force full-screen game to one monitor ?</code> |
|
336 |
+
| <code>any command line calculator for ubuntu ?</code> | <code>quick simple mathematics calculations ubuntu calculator in dash</code> | <code>shortcut to open/focus terminal window how to assign shortcut keys in gnome ? menu bar not visible on gnome-calculator how to permanently enable in-dash calculator in 13.10 a good hex/binary calculator command line calculator that keeps fractional values is there any calculator in software centre which could solve quadratic equations ? how to make shortcut to terminal application ? can calculator show decimal as fraction ? how to open pseudo-terminal devices on terminal ? keep calculator from opening a new window every time i press the `` calculator '' button on the keyboard ? keyboard shortcut for terminal does n't work since updating to 12.10 decimal point from number pad wo n't work on the calculator but will everywhere else how to set qalculator as default calculator ? what is 'calculator ' package ? how to get a 'non-screenlet ' calculator in compiz widget layer ? how do i use the 'scientific ' mode in the calculator ? how can i capture text from my terminal without redirecting it to a text file ?</code> |
|
337 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
338 |
+
```json
|
339 |
+
{
|
340 |
+
"scale": 20.0,
|
341 |
+
"similarity_fct": "cos_sim"
|
342 |
+
}
|
343 |
+
```
|
344 |
+
|
345 |
+
#### retrival_1
|
346 |
+
|
347 |
+
* Dataset: [retrival_1](https://huggingface.co/datasets/mteb/arguana) at [c22ab2a](https://huggingface.co/datasets/mteb/arguana/tree/c22ab2a51041ffd869aaddef7af8d8215647e41a)
|
348 |
+
* Size: 868 evaluation samples
|
349 |
+
* Columns: <code>title</code> and <code>text</code>
|
350 |
+
* Approximate statistics based on all 868 samples:
|
351 |
+
| | title | text |
|
352 |
+
|:--------|:--------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
353 |
+
| type | string | string |
|
354 |
+
| details | <ul><li>min: 2 tokens</li><li>mean: 5.0 tokens</li><li>max: 17 tokens</li></ul> | <ul><li>min: 26 tokens</li><li>mean: 204.03 tokens</li><li>max: 512 tokens</li></ul> |
|
355 |
+
* Samples:
|
356 |
+
| title | text |
|
357 |
+
|:--------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
358 |
+
| <code></code> | <code>Behind the veil of ignorance, human beings may not in fact side with what gives them the statistical greatest chance of survival. As Rawls himself notes, people are naturally risk-averse, and thus will select the rules that protect them from the worst possible situations, even if that sacrifice would help many others. Most people find the prospect of being actively killed by the conscious action of another human being worse than simply dying in an accident, and would seek to protect themselves against that worse outcome.</code> |
|
359 |
+
| <code></code> | <code>Schengen membership is not the same as EU membership – some non-EU states, such as Switzerland are part of Schengen, the UK and Ireland are EU member states but are not. Joining Schengen would involve the politically sensitive issue of undocumented migrants, which could not only be fatal to Cape Verde joining Schengen but to integration with Europe itself. Even if it is unlikely, is it that difficult for people to show a passport? Besides, tourism is not just from Europe to outside – a Euro move would only stop Europeans from needing to change currencies. The peg is the best of both worlds in that it means that the currency is stable.</code> |
|
360 |
+
| <code></code> | <code>News organisations cannot be completely transparent if they are to do their job properly and News International is no exception. Such organisations cannot for example reveal their sources as this may sometimes put their sources at risk and would mean that others would not come forward. As part of this news companies need to keep secret how they obtained information. While an attempt by a newspaper to cover up crimes is regrettable this one newspapers actions should not tar the whole company and its other papers.</code> |
|
361 |
+
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
|
362 |
+
```json
|
363 |
+
{
|
364 |
+
"scale": 20.0,
|
365 |
+
"similarity_fct": "cos_sim"
|
366 |
+
}
|
367 |
+
```
|
368 |
+
|
369 |
+
#### sts_1
|
370 |
+
|
371 |
+
* Dataset: [sts_1](https://huggingface.co/datasets/mteb/biosses-sts) at [9ee918f](https://huggingface.co/datasets/mteb/biosses-sts/tree/9ee918f184421b6bd48b78f6c714d86546106103)
|
372 |
+
* Size: 10 evaluation samples
|
373 |
+
* Columns: <code>sentence1</code>, <code>sentence2</code>, and <code>score</code>
|
374 |
+
* Approximate statistics based on all 10 samples:
|
375 |
+
| | sentence1 | sentence2 | score |
|
376 |
+
|:--------|:----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
377 |
+
| type | string | string | float |
|
378 |
+
| details | <ul><li>min: 17 tokens</li><li>mean: 38.4 tokens</li><li>max: 61 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 46.8 tokens</li><li>max: 62 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 1.76</li><li>max: 3.2</li></ul> |
|
379 |
+
* Samples:
|
380 |
+
| sentence1 | sentence2 | score |
|
381 |
+
|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
382 |
+
| <code>Recently, it was reported that expression of IDH1R132H suppresses TET2 activity and the mutations of IDH1 and IDH2 genes occur in a mutual exclusive manner with that of TET2 gene in AML </code> | <code>The mechanism was clarified by yet another genomic survey, this time involving acute myelogenous leukemia (AML).</code> | <code>1.4</code> |
|
383 |
+
| <code>Recently, it was reported that expression of IDH1R132H suppresses TET2 activity and the mutations of IDH1 and IDH2 genes occur in a mutual exclusive manner with that of TET2 gene in AML.</code> | <code>This large-scale study showed that IDH1/IDH2 mutations were mutually exclusive with inactivating TET2 mutations, suggesting that the two types of mutations had similar effects and were thus functionally redundant.</code> | <code>3.2</code> |
|
384 |
+
| <code>A gene that warrants further studies is the erythropoietin receptor that is 7.4-fold higher expressed in TEL-AML1-positive cases compared to other precursor B-ALL cases confirming other gene expression classification studies.</code> | <code>Another recent gene expression study of large numbers of cases provided support for the hypothesis that distinct leukemias are specified by each of the unique chromosomal abnormalities found in lymphoblastic leukemias.</code> | <code>0.6</code> |
|
385 |
+
* Loss: [<code>CoSENTLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosentloss) with these parameters:
|
386 |
+
```json
|
387 |
+
{
|
388 |
+
"scale": 20.0,
|
389 |
+
"similarity_fct": "pairwise_cos_sim"
|
390 |
+
}
|
391 |
+
```
|
392 |
+
|
393 |
+
### Training Hyperparameters
|
394 |
+
#### Non-Default Hyperparameters
|
395 |
+
|
396 |
+
- `eval_strategy`: epoch
|
397 |
+
- `per_device_train_batch_size`: 2
|
398 |
+
- `per_device_eval_batch_size`: 2
|
399 |
+
- `gradient_accumulation_steps`: 8
|
400 |
+
- `learning_rate`: 2e-05
|
401 |
+
- `num_train_epochs`: 5
|
402 |
+
- `lr_scheduler_type`: cosine
|
403 |
+
- `warmup_ratio`: 0.1
|
404 |
+
- `bf16`: True
|
405 |
+
- `tf32`: True
|
406 |
+
- `optim`: adamw_torch_fused
|
407 |
+
- `batch_sampler`: no_duplicates
|
408 |
+
|
409 |
+
#### All Hyperparameters
|
410 |
+
<details><summary>Click to expand</summary>
|
411 |
+
|
412 |
+
- `overwrite_output_dir`: False
|
413 |
+
- `do_predict`: False
|
414 |
+
- `eval_strategy`: epoch
|
415 |
+
- `prediction_loss_only`: True
|
416 |
+
- `per_device_train_batch_size`: 2
|
417 |
+
- `per_device_eval_batch_size`: 2
|
418 |
+
- `per_gpu_train_batch_size`: None
|
419 |
+
- `per_gpu_eval_batch_size`: None
|
420 |
+
- `gradient_accumulation_steps`: 8
|
421 |
+
- `eval_accumulation_steps`: None
|
422 |
+
- `learning_rate`: 2e-05
|
423 |
+
- `weight_decay`: 0.0
|
424 |
+
- `adam_beta1`: 0.9
|
425 |
+
- `adam_beta2`: 0.999
|
426 |
+
- `adam_epsilon`: 1e-08
|
427 |
+
- `max_grad_norm`: 1.0
|
428 |
+
- `num_train_epochs`: 5
|
429 |
+
- `max_steps`: -1
|
430 |
+
- `lr_scheduler_type`: cosine
|
431 |
+
- `lr_scheduler_kwargs`: {}
|
432 |
+
- `warmup_ratio`: 0.1
|
433 |
+
- `warmup_steps`: 0
|
434 |
+
- `log_level`: passive
|
435 |
+
- `log_level_replica`: warning
|
436 |
+
- `log_on_each_node`: True
|
437 |
+
- `logging_nan_inf_filter`: True
|
438 |
+
- `save_safetensors`: True
|
439 |
+
- `save_on_each_node`: False
|
440 |
+
- `save_only_model`: False
|
441 |
+
- `restore_callback_states_from_checkpoint`: False
|
442 |
+
- `no_cuda`: False
|
443 |
+
- `use_cpu`: False
|
444 |
+
- `use_mps_device`: False
|
445 |
+
- `seed`: 42
|
446 |
+
- `data_seed`: None
|
447 |
+
- `jit_mode_eval`: False
|
448 |
+
- `use_ipex`: False
|
449 |
+
- `bf16`: True
|
450 |
+
- `fp16`: False
|
451 |
+
- `fp16_opt_level`: O1
|
452 |
+
- `half_precision_backend`: auto
|
453 |
+
- `bf16_full_eval`: False
|
454 |
+
- `fp16_full_eval`: False
|
455 |
+
- `tf32`: True
|
456 |
+
- `local_rank`: 0
|
457 |
+
- `ddp_backend`: None
|
458 |
+
- `tpu_num_cores`: None
|
459 |
+
- `tpu_metrics_debug`: False
|
460 |
+
- `debug`: []
|
461 |
+
- `dataloader_drop_last`: False
|
462 |
+
- `dataloader_num_workers`: 0
|
463 |
+
- `dataloader_prefetch_factor`: None
|
464 |
+
- `past_index`: -1
|
465 |
+
- `disable_tqdm`: False
|
466 |
+
- `remove_unused_columns`: True
|
467 |
+
- `label_names`: None
|
468 |
+
- `load_best_model_at_end`: False
|
469 |
+
- `ignore_data_skip`: False
|
470 |
+
- `fsdp`: []
|
471 |
+
- `fsdp_min_num_params`: 0
|
472 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
473 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
474 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
475 |
+
- `deepspeed`: None
|
476 |
+
- `label_smoothing_factor`: 0.0
|
477 |
+
- `optim`: adamw_torch_fused
|
478 |
+
- `optim_args`: None
|
479 |
+
- `adafactor`: False
|
480 |
+
- `group_by_length`: False
|
481 |
+
- `length_column_name`: length
|
482 |
+
- `ddp_find_unused_parameters`: None
|
483 |
+
- `ddp_bucket_cap_mb`: None
|
484 |
+
- `ddp_broadcast_buffers`: False
|
485 |
+
- `dataloader_pin_memory`: True
|
486 |
+
- `dataloader_persistent_workers`: False
|
487 |
+
- `skip_memory_metrics`: True
|
488 |
+
- `use_legacy_prediction_loop`: False
|
489 |
+
- `push_to_hub`: False
|
490 |
+
- `resume_from_checkpoint`: None
|
491 |
+
- `hub_model_id`: None
|
492 |
+
- `hub_strategy`: every_save
|
493 |
+
- `hub_private_repo`: False
|
494 |
+
- `hub_always_push`: False
|
495 |
+
- `gradient_checkpointing`: False
|
496 |
+
- `gradient_checkpointing_kwargs`: None
|
497 |
+
- `include_inputs_for_metrics`: False
|
498 |
+
- `eval_do_concat_batches`: True
|
499 |
+
- `fp16_backend`: auto
|
500 |
+
- `push_to_hub_model_id`: None
|
501 |
+
- `push_to_hub_organization`: None
|
502 |
+
- `mp_parameters`:
|
503 |
+
- `auto_find_batch_size`: False
|
504 |
+
- `full_determinism`: False
|
505 |
+
- `torchdynamo`: None
|
506 |
+
- `ray_scope`: last
|
507 |
+
- `ddp_timeout`: 1800
|
508 |
+
- `torch_compile`: False
|
509 |
+
- `torch_compile_backend`: None
|
510 |
+
- `torch_compile_mode`: None
|
511 |
+
- `dispatch_batches`: None
|
512 |
+
- `split_batches`: None
|
513 |
+
- `include_tokens_per_second`: False
|
514 |
+
- `include_num_input_tokens_seen`: False
|
515 |
+
- `neftune_noise_alpha`: None
|
516 |
+
- `optim_target_modules`: None
|
517 |
+
- `batch_eval_metrics`: False
|
518 |
+
- `batch_sampler`: no_duplicates
|
519 |
+
- `multi_dataset_batch_sampler`: proportional
|
520 |
+
|
521 |
+
</details>
|
522 |
+
|
523 |
+
### Training Logs
|
524 |
+
| Epoch | Step | Training Loss | reranking 1 loss | retrieval 1 loss | sts 1 loss |
|
525 |
+
|:------:|:----:|:-------------:|:----------------:|:---------------:|:----------:|
|
526 |
+
| 0.9716 | 500 | 0.4296 | - | - | - |
|
527 |
+
| 0.9988 | 514 | - | 0.2080 | 0.1297 | 0.1096 |
|
528 |
+
| 0.9716 | 500 | 0.0933 | - | - | - |
|
529 |
+
| 0.9988 | 514 | - | 0.2104 | 0.1012 | 0.5515 |
|
530 |
+
| 0.9716 | 500 | 0.0435 | - | - | - |
|
531 |
+
| 0.9988 | 514 | - | 0.2026 | 0.1434 | 0.4824 |
|
532 |
+
| 0.9716 | 500 | 0.0282 | - | - | - |
|
533 |
+
| 0.9988 | 514 | - | 0.1827 | 0.1305 | 0.2950 |
|
534 |
+
| 1.9432 | 1000 | 0.0555 | - | - | - |
|
535 |
+
| 1.9995 | 1029 | - | 0.3932 | 0.0693 | 0.8649 |
|
536 |
+
| 2.9147 | 1500 | 0.0151 | - | - | - |
|
537 |
+
| 2.9983 | 1543 | - | 0.2112 | 0.0555 | 0.5478 |
|
538 |
+
| 3.8863 | 2000 | 0.0036 | - | - | - |
|
539 |
+
| 3.9990 | 2058 | - | 0.1921 | 0.0432 | 0.5912 |
|
540 |
+
| 4.8579 | 2500 | 0.0013 | - | - | - |
|
541 |
+
| 4.9939 | 2570 | - | 0.1904 | 0.0412 | 0.6356 |
|
542 |
+
|
543 |
+
|
544 |
+
### Framework Versions
|
545 |
+
- Python: 3.10.12
|
546 |
+
- Sentence Transformers: 3.0.1
|
547 |
+
- Transformers: 4.41.2
|
548 |
+
- PyTorch: 2.2.0+cu121
|
549 |
+
- Accelerate: 0.31.0
|
550 |
+
- Datasets: 2.20.0
|
551 |
+
- Tokenizers: 0.19.1
|
552 |
+
|
553 |
+
## Citation
|
554 |
+
|
555 |
+
### BibTeX
|
556 |
+
|
557 |
+
#### Sentence Transformers
|
558 |
+
```bibtex
|
559 |
+
@inproceedings{reimers-2019-sentence-bert,
|
560 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
561 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
562 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
563 |
+
month = "11",
|
564 |
+
year = "2019",
|
565 |
+
publisher = "Association for Computational Linguistics",
|
566 |
+
url = "https://arxiv.org/abs/1908.10084",
|
567 |
+
}
|
568 |
+
```
|
569 |
+
|
570 |
+
#### CoSENTLoss
|
571 |
+
```bibtex
|
572 |
+
@online{kexuefm-8847,
|
573 |
+
title={CoSENT: A more efficient sentence vector scheme than Sentence-BERT},
|
574 |
+
author={Su Jianlin},
|
575 |
+
year={2022},
|
576 |
+
month={Jan},
|
577 |
+
url={https://kexue.fm/archives/8847},
|
578 |
+
}
|
579 |
+
```
|
580 |
+
|
581 |
+
<!--
|
582 |
+
## Glossary
|
583 |
+
|
584 |
+
*Clearly define terms in order to be accessible across audiences.*
|
585 |
+
-->
|
586 |
+
|
587 |
+
<!--
|
588 |
+
## Model Card Authors
|
589 |
+
|
590 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
591 |
+
-->
|
592 |
+
|
593 |
+
<!--
|
594 |
+
## Model Card Contact
|
595 |
+
|
596 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
597 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "microsoft/mpnet-base",
|
3 |
+
"architectures": [
|
4 |
+
"MPNetModel"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"layer_norm_eps": 1e-05,
|
15 |
+
"max_position_embeddings": 514,
|
16 |
+
"model_type": "mpnet",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"pad_token_id": 1,
|
20 |
+
"relative_attention_num_buckets": 32,
|
21 |
+
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.41.2",
|
23 |
+
"vocab_size": 30527
|
24 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": {
|
3 |
+
"sentence_transformers": "3.0.1",
|
4 |
+
"transformers": "4.41.2",
|
5 |
+
"pytorch": "2.2.0+cu121"
|
6 |
+
},
|
7 |
+
"prompts": {},
|
8 |
+
"default_prompt_name": null,
|
9 |
+
"similarity_fn_name": null
|
10 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8484e6626c78b1e3f27dffe1ed7c9886ba67ccbd573276abacaccfdb0abba724
|
3 |
+
size 437967672
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b9a26f7bc618275dddec6da1510d9e69bf98dcf391b31ba32af4e6ad0f92dc2
|
3 |
+
size 871334522
|
rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c14a556422a7476f073f5fa4ddf7346afcbbfd267378dfa8972c18d40e075e79
|
3 |
+
size 14244
|
scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d94fb8caeabfcf418870a22e48bdd1bf4c35926a662a2650f49c78657687c790
|
3 |
+
size 1064
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 512,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"cls_token": {
|
10 |
+
"content": "<s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"eos_token": {
|
17 |
+
"content": "</s>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"mask_token": {
|
24 |
+
"content": "<mask>",
|
25 |
+
"lstrip": true,
|
26 |
+
"normalized": false,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
},
|
30 |
+
"pad_token": {
|
31 |
+
"content": "<pad>",
|
32 |
+
"lstrip": false,
|
33 |
+
"normalized": false,
|
34 |
+
"rstrip": false,
|
35 |
+
"single_word": false
|
36 |
+
},
|
37 |
+
"sep_token": {
|
38 |
+
"content": "</s>",
|
39 |
+
"lstrip": false,
|
40 |
+
"normalized": true,
|
41 |
+
"rstrip": false,
|
42 |
+
"single_word": false
|
43 |
+
},
|
44 |
+
"unk_token": {
|
45 |
+
"content": "[UNK]",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": false,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
}
|
51 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,65 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "<s>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "<pad>",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "</s>",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "<unk>",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": true,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"104": {
|
36 |
+
"content": "[UNK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
},
|
43 |
+
"30526": {
|
44 |
+
"content": "<mask>",
|
45 |
+
"lstrip": true,
|
46 |
+
"normalized": false,
|
47 |
+
"rstrip": false,
|
48 |
+
"single_word": false,
|
49 |
+
"special": true
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"bos_token": "<s>",
|
53 |
+
"clean_up_tokenization_spaces": true,
|
54 |
+
"cls_token": "<s>",
|
55 |
+
"do_lower_case": true,
|
56 |
+
"eos_token": "</s>",
|
57 |
+
"mask_token": "<mask>",
|
58 |
+
"model_max_length": 512,
|
59 |
+
"pad_token": "<pad>",
|
60 |
+
"sep_token": "</s>",
|
61 |
+
"strip_accents": null,
|
62 |
+
"tokenize_chinese_chars": true,
|
63 |
+
"tokenizer_class": "MPNetTokenizer",
|
64 |
+
"unk_token": "[UNK]"
|
65 |
+
}
|
trainer_state.json
ADDED
@@ -0,0 +1,188 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 4.993927617196988,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 2570,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.9715812484819043,
|
13 |
+
"grad_norm": 0.0,
|
14 |
+
"learning_rate": 1.9460259489596192e-05,
|
15 |
+
"loss": 0.0282,
|
16 |
+
"step": 500
|
17 |
+
},
|
18 |
+
{
|
19 |
+
"epoch": 0.9987855234393976,
|
20 |
+
"eval_reranking_1_loss": 0.182732954621315,
|
21 |
+
"eval_reranking_1_runtime": 1.2858,
|
22 |
+
"eval_reranking_1_samples_per_second": 29.553,
|
23 |
+
"eval_reranking_1_steps_per_second": 14.777,
|
24 |
+
"step": 514
|
25 |
+
},
|
26 |
+
{
|
27 |
+
"epoch": 0.9987855234393976,
|
28 |
+
"eval_retrival_1_loss": 0.1305331587791443,
|
29 |
+
"eval_retrival_1_runtime": 26.5236,
|
30 |
+
"eval_retrival_1_samples_per_second": 32.726,
|
31 |
+
"eval_retrival_1_steps_per_second": 16.363,
|
32 |
+
"step": 514
|
33 |
+
},
|
34 |
+
{
|
35 |
+
"epoch": 0.9987855234393976,
|
36 |
+
"eval_sts_1_loss": 0.2950426936149597,
|
37 |
+
"eval_sts_1_runtime": 0.2829,
|
38 |
+
"eval_sts_1_samples_per_second": 35.351,
|
39 |
+
"eval_sts_1_steps_per_second": 17.676,
|
40 |
+
"step": 514
|
41 |
+
},
|
42 |
+
{
|
43 |
+
"epoch": 1.9431624969638086,
|
44 |
+
"grad_norm": 6.779000282287598,
|
45 |
+
"learning_rate": 1.5325659218524745e-05,
|
46 |
+
"loss": 0.0555,
|
47 |
+
"step": 1000
|
48 |
+
},
|
49 |
+
{
|
50 |
+
"epoch": 1.999514209375759,
|
51 |
+
"eval_reranking_1_loss": 0.3932221829891205,
|
52 |
+
"eval_reranking_1_runtime": 1.258,
|
53 |
+
"eval_reranking_1_samples_per_second": 30.208,
|
54 |
+
"eval_reranking_1_steps_per_second": 15.104,
|
55 |
+
"step": 1029
|
56 |
+
},
|
57 |
+
{
|
58 |
+
"epoch": 1.999514209375759,
|
59 |
+
"eval_retrival_1_loss": 0.06928794831037521,
|
60 |
+
"eval_retrival_1_runtime": 28.2993,
|
61 |
+
"eval_retrival_1_samples_per_second": 30.672,
|
62 |
+
"eval_retrival_1_steps_per_second": 15.336,
|
63 |
+
"step": 1029
|
64 |
+
},
|
65 |
+
{
|
66 |
+
"epoch": 1.999514209375759,
|
67 |
+
"eval_sts_1_loss": 0.8648566007614136,
|
68 |
+
"eval_sts_1_runtime": 0.2978,
|
69 |
+
"eval_sts_1_samples_per_second": 33.582,
|
70 |
+
"eval_sts_1_steps_per_second": 16.791,
|
71 |
+
"step": 1029
|
72 |
+
},
|
73 |
+
{
|
74 |
+
"epoch": 2.914743745445713,
|
75 |
+
"grad_norm": 0.030390629544854164,
|
76 |
+
"learning_rate": 8.827829529818852e-06,
|
77 |
+
"loss": 0.0151,
|
78 |
+
"step": 1500
|
79 |
+
},
|
80 |
+
{
|
81 |
+
"epoch": 2.998299732815157,
|
82 |
+
"eval_reranking_1_loss": 0.21115952730178833,
|
83 |
+
"eval_reranking_1_runtime": 1.2048,
|
84 |
+
"eval_reranking_1_samples_per_second": 31.54,
|
85 |
+
"eval_reranking_1_steps_per_second": 15.77,
|
86 |
+
"step": 1543
|
87 |
+
},
|
88 |
+
{
|
89 |
+
"epoch": 2.998299732815157,
|
90 |
+
"eval_retrival_1_loss": 0.05546686798334122,
|
91 |
+
"eval_retrival_1_runtime": 26.8806,
|
92 |
+
"eval_retrival_1_samples_per_second": 32.291,
|
93 |
+
"eval_retrival_1_steps_per_second": 16.145,
|
94 |
+
"step": 1543
|
95 |
+
},
|
96 |
+
{
|
97 |
+
"epoch": 2.998299732815157,
|
98 |
+
"eval_sts_1_loss": 0.5478371977806091,
|
99 |
+
"eval_sts_1_runtime": 0.2864,
|
100 |
+
"eval_sts_1_samples_per_second": 34.913,
|
101 |
+
"eval_sts_1_steps_per_second": 17.457,
|
102 |
+
"step": 1543
|
103 |
+
},
|
104 |
+
{
|
105 |
+
"epoch": 3.886324993927617,
|
106 |
+
"grad_norm": 0.0,
|
107 |
+
"learning_rate": 2.8501434747835012e-06,
|
108 |
+
"loss": 0.0036,
|
109 |
+
"step": 2000
|
110 |
+
},
|
111 |
+
{
|
112 |
+
"epoch": 3.999028418751518,
|
113 |
+
"eval_reranking_1_loss": 0.19206289947032928,
|
114 |
+
"eval_reranking_1_runtime": 1.196,
|
115 |
+
"eval_reranking_1_samples_per_second": 31.774,
|
116 |
+
"eval_reranking_1_steps_per_second": 15.887,
|
117 |
+
"step": 2058
|
118 |
+
},
|
119 |
+
{
|
120 |
+
"epoch": 3.999028418751518,
|
121 |
+
"eval_retrival_1_loss": 0.04320598766207695,
|
122 |
+
"eval_retrival_1_runtime": 27.2793,
|
123 |
+
"eval_retrival_1_samples_per_second": 31.819,
|
124 |
+
"eval_retrival_1_steps_per_second": 15.909,
|
125 |
+
"step": 2058
|
126 |
+
},
|
127 |
+
{
|
128 |
+
"epoch": 3.999028418751518,
|
129 |
+
"eval_sts_1_loss": 0.591204047203064,
|
130 |
+
"eval_sts_1_runtime": 0.2948,
|
131 |
+
"eval_sts_1_samples_per_second": 33.923,
|
132 |
+
"eval_sts_1_steps_per_second": 16.961,
|
133 |
+
"step": 2058
|
134 |
+
},
|
135 |
+
{
|
136 |
+
"epoch": 4.857906242409522,
|
137 |
+
"grad_norm": 0.0018939984729513526,
|
138 |
+
"learning_rate": 4.5163479025036596e-08,
|
139 |
+
"loss": 0.0013,
|
140 |
+
"step": 2500
|
141 |
+
},
|
142 |
+
{
|
143 |
+
"epoch": 4.993927617196988,
|
144 |
+
"eval_reranking_1_loss": 0.19038808345794678,
|
145 |
+
"eval_reranking_1_runtime": 1.207,
|
146 |
+
"eval_reranking_1_samples_per_second": 31.484,
|
147 |
+
"eval_reranking_1_steps_per_second": 15.742,
|
148 |
+
"step": 2570
|
149 |
+
},
|
150 |
+
{
|
151 |
+
"epoch": 4.993927617196988,
|
152 |
+
"eval_retrival_1_loss": 0.04124879837036133,
|
153 |
+
"eval_retrival_1_runtime": 27.5211,
|
154 |
+
"eval_retrival_1_samples_per_second": 31.539,
|
155 |
+
"eval_retrival_1_steps_per_second": 15.77,
|
156 |
+
"step": 2570
|
157 |
+
},
|
158 |
+
{
|
159 |
+
"epoch": 4.993927617196988,
|
160 |
+
"eval_sts_1_loss": 0.6356238722801208,
|
161 |
+
"eval_sts_1_runtime": 0.3051,
|
162 |
+
"eval_sts_1_samples_per_second": 32.781,
|
163 |
+
"eval_sts_1_steps_per_second": 16.39,
|
164 |
+
"step": 2570
|
165 |
+
}
|
166 |
+
],
|
167 |
+
"logging_steps": 500,
|
168 |
+
"max_steps": 2570,
|
169 |
+
"num_input_tokens_seen": 0,
|
170 |
+
"num_train_epochs": 5,
|
171 |
+
"save_steps": 500,
|
172 |
+
"stateful_callbacks": {
|
173 |
+
"TrainerControl": {
|
174 |
+
"args": {
|
175 |
+
"should_epoch_stop": false,
|
176 |
+
"should_evaluate": false,
|
177 |
+
"should_log": false,
|
178 |
+
"should_save": true,
|
179 |
+
"should_training_stop": true
|
180 |
+
},
|
181 |
+
"attributes": {}
|
182 |
+
}
|
183 |
+
},
|
184 |
+
"total_flos": 0.0,
|
185 |
+
"train_batch_size": 2,
|
186 |
+
"trial_name": null,
|
187 |
+
"trial_params": null
|
188 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8732499b4dd920e781a2fdaada10558fd39a38c780fd56ad157b883624218075
|
3 |
+
size 5304
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|