File size: 70,402 Bytes
c22ac53
 
 
 
 
 
 
 
 
5c2007e
c22ac53
5c2007e
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
 
c22ac53
5c2007e
 
 
 
 
 
 
 
 
c22ac53
5c2007e
 
 
 
 
 
 
 
 
c22ac53
5c2007e
 
 
 
 
c22ac53
5c2007e
 
 
 
c22ac53
5c2007e
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
5c2007e
c22ac53
 
 
 
 
 
5c2007e
c22ac53
 
5c2007e
 
 
 
c22ac53
5c2007e
 
 
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
 
 
5c2007e
c22ac53
5c2007e
 
 
 
 
c22ac53
 
 
 
 
 
 
 
5c2007e
 
 
 
c22ac53
5c2007e
 
 
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
5c2007e
 
 
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
 
 
5c2007e
c22ac53
5c2007e
 
 
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
 
 
5c2007e
c22ac53
5c2007e
 
 
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
 
 
c22ac53
5c2007e
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
 
c22ac53
 
 
 
5c2007e
c22ac53
 
 
 
 
5c2007e
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
 
 
 
d6796ed
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5c2007e
c22ac53
5c2007e
 
 
 
 
 
c22ac53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
---
language:
- en
library_name: sentence-transformers
tags:
- sentence-transformers
- sentence-similarity
- feature-extraction
- generated_from_trainer
- dataset_size:689221
- loss:MultipleNegativesRankingLoss
- loss:CoSENTLoss
- loss:GISTEmbedLoss
- loss:OnlineContrastiveLoss
- loss:MultipleNegativesSymmetricRankingLoss
base_model: microsoft/deberta-v3-small
datasets:
- sentence-transformers/all-nli
- sentence-transformers/stsb
- tals/vitaminc
- nyu-mll/glue
- allenai/scitail
- sentence-transformers/xsum
- sentence-transformers/sentence-compression
widget:
- source_sentence: What are the exceptions in the constitution  that require special
    considerations to amend?
  sentences:
  - The river makes a distinctive turn to the north near Chur.
  - The Victorian Constitution can be amended by the Parliament of Victoria, except
    for certain "entrenched" provisions that require either an absolute majority in
    both houses, a three-fifths majority in both houses, or the approval of the Victorian
    people in a referendum, depending on the provision.
  - A new arrangement of the theme, once again by Gold, was introduced in the 2007
    Christmas special episode, "Voyage of the Damned"; Gold returned as composer for
    the 2010 series.
- source_sentence: What is the name of a Bodhisattva vow?
  sentences:
  - In Tibetan Buddhism the teachers of Dharma in Tibet are most commonly called a
    Lama.
  - This origin of chloroplasts was first suggested by the Russian biologist Konstantin
    Mereschkowski in 1905 after Andreas Schimper observed in 1883 that chloroplasts
    closely resemble cyanobacteria.
  - The announcement came a day after Setanta Sports confirmed that it would launch
    in March as a subscription service on the digital terrestrial platform, and on
    the same day that NTL's services re-branded as Virgin Media.
- source_sentence: Two dogs run around inside a fence.
  sentences:
  - A young woman tennis player have many tennis balls.
  - Two dogs are inside a fence.
  - A little girl in red plays tennis.
- source_sentence: A little boy wearing a blue stiped shirt has a party hat on his
    head and is playing in a puddle.
  sentences:
  - The party boy is playing in a puddle.
  - There is a crowd
  - Four people are skiing
- source_sentence: Two wrestlers jump in a ring while an official watches.
  sentences:
  - The man was walking.
  - Two men are dressed in makeup
  - Two wrestlers were just tagged in on a tag team match.
pipeline_tag: sentence-similarity
---

# SentenceTransformer based on microsoft/deberta-v3-small

This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [microsoft/deberta-v3-small](https://huggingface.co/microsoft/deberta-v3-small) on the [nli-pairs](https://huggingface.co/datasets/sentence-transformers/all-nli), [sts-label](https://huggingface.co/datasets/sentence-transformers/stsb), [vitaminc-pairs](https://huggingface.co/datasets/tals/vitaminc), [qnli-contrastive](https://huggingface.co/datasets/nyu-mll/glue), [scitail-pairs-qa](https://huggingface.co/datasets/allenai/scitail), [scitail-pairs-pos](https://huggingface.co/datasets/allenai/scitail), [xsum-pairs](https://huggingface.co/datasets/sentence-transformers/xsum) and [compression-pairs](https://huggingface.co/datasets/sentence-transformers/sentence-compression) datasets. It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.

## Model Details

### Model Description
- **Model Type:** Sentence Transformer
- **Base model:** [microsoft/deberta-v3-small](https://huggingface.co/microsoft/deberta-v3-small) <!-- at revision a36c739020e01763fe789b4b85e2df55d6180012 -->
- **Maximum Sequence Length:** 512 tokens
- **Output Dimensionality:** 768 dimensions
- **Similarity Function:** Cosine Similarity
- **Training Datasets:**
    - [nli-pairs](https://huggingface.co/datasets/sentence-transformers/all-nli)
    - [sts-label](https://huggingface.co/datasets/sentence-transformers/stsb)
    - [vitaminc-pairs](https://huggingface.co/datasets/tals/vitaminc)
    - [qnli-contrastive](https://huggingface.co/datasets/nyu-mll/glue)
    - [scitail-pairs-qa](https://huggingface.co/datasets/allenai/scitail)
    - [scitail-pairs-pos](https://huggingface.co/datasets/allenai/scitail)
    - [xsum-pairs](https://huggingface.co/datasets/sentence-transformers/xsum)
    - [compression-pairs](https://huggingface.co/datasets/sentence-transformers/sentence-compression)
- **Language:** en
<!-- - **License:** Unknown -->

### Model Sources

- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)

### Full Model Architecture

```
SentenceTransformer(
  (0): Transformer({'max_seq_length': 512, 'do_lower_case': False}) with Transformer model: DebertaV2Model 
  (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
)
```

## Usage

### Direct Usage (Sentence Transformers)

First install the Sentence Transformers library:

```bash
pip install -U sentence-transformers
```

Then you can load this model and run inference.
```python
from sentence_transformers import SentenceTransformer

# Download from the 🤗 Hub
model = SentenceTransformer("bobox/DeBERTaV3-small-GeneralSentenceTransformer-checkpoints-tmp")
# Run inference
sentences = [
    'Two wrestlers jump in a ring while an official watches.',
    'Two wrestlers were just tagged in on a tag team match.',
    'Two men are dressed in makeup',
]
embeddings = model.encode(sentences)
print(embeddings.shape)
# [3, 768]

# Get the similarity scores for the embeddings
similarities = model.similarity(embeddings, embeddings)
print(similarities.shape)
# [3, 3]
```

<!--
### Direct Usage (Transformers)

<details><summary>Click to see the direct usage in Transformers</summary>

</details>
-->

<!--
### Downstream Usage (Sentence Transformers)

You can finetune this model on your own dataset.

<details><summary>Click to expand</summary>

</details>
-->

<!--
### Out-of-Scope Use

*List how the model may foreseeably be misused and address what users ought not to do with the model.*
-->

<!--
## Bias, Risks and Limitations

*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
-->

<!--
### Recommendations

*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
-->

## Training Details

### Training Datasets

#### nli-pairs

* Dataset: [nli-pairs](https://huggingface.co/datasets/sentence-transformers/all-nli) at [d482672](https://huggingface.co/datasets/sentence-transformers/all-nli/tree/d482672c8e74ce18da116f430137434ba2e52fab)
* Size: 150,000 training samples
* Columns: <code>sentence1</code> and <code>sentence2</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                         | sentence2                                                                        |
  |:--------|:----------------------------------------------------------------------------------|:---------------------------------------------------------------------------------|
  | type    | string                                                                            | string                                                                           |
  | details | <ul><li>min: 5 tokens</li><li>mean: 16.62 tokens</li><li>max: 62 tokens</li></ul> | <ul><li>min: 4 tokens</li><li>mean: 9.46 tokens</li><li>max: 29 tokens</li></ul> |
* Samples:
  | sentence1                                                                  | sentence2                                        |
  |:---------------------------------------------------------------------------|:-------------------------------------------------|
  | <code>A person on a horse jumps over a broken down airplane.</code>        | <code>A person is outdoors, on a horse.</code>   |
  | <code>Children smiling and waving at camera</code>                         | <code>There are children present</code>          |
  | <code>A boy is jumping on skateboard in the middle of a red bridge.</code> | <code>The boy does a skateboarding trick.</code> |
* Loss: [<code>MultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativesrankingloss) with these parameters:
  ```json
  {
      "scale": 20.0,
      "similarity_fct": "cos_sim"
  }
  ```

#### sts-label

* Dataset: [sts-label](https://huggingface.co/datasets/sentence-transformers/stsb) at [ab7a5ac](https://huggingface.co/datasets/sentence-transformers/stsb/tree/ab7a5ac0e35aa22088bdcf23e7fd99b220e53308)
* Size: 5,749 training samples
* Columns: <code>sentence1</code>, <code>sentence2</code>, and <code>score</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                        | sentence2                                                                        | score                                                          |
  |:--------|:---------------------------------------------------------------------------------|:---------------------------------------------------------------------------------|:---------------------------------------------------------------|
  | type    | string                                                                           | string                                                                           | float                                                          |
  | details | <ul><li>min: 6 tokens</li><li>mean: 9.81 tokens</li><li>max: 27 tokens</li></ul> | <ul><li>min: 5 tokens</li><li>mean: 9.74 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.54</li><li>max: 1.0</li></ul> |
* Samples:
  | sentence1                                                  | sentence2                                                             | score             |
  |:-----------------------------------------------------------|:----------------------------------------------------------------------|:------------------|
  | <code>A plane is taking off.</code>                        | <code>An air plane is taking off.</code>                              | <code>1.0</code>  |
  | <code>A man is playing a large flute.</code>               | <code>A man is playing a flute.</code>                                | <code>0.76</code> |
  | <code>A man is spreading shreded cheese on a pizza.</code> | <code>A man is spreading shredded cheese on an uncooked pizza.</code> | <code>0.76</code> |
* Loss: [<code>CoSENTLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosentloss) with these parameters:
  ```json
  {
      "scale": 20.0,
      "similarity_fct": "pairwise_cos_sim"
  }
  ```

#### vitaminc-pairs

* Dataset: [vitaminc-pairs](https://huggingface.co/datasets/tals/vitaminc) at [be6febb](https://huggingface.co/datasets/tals/vitaminc/tree/be6febb761b0b2807687e61e0b5282e459df2fa0)
* Size: 75,142 training samples
* Columns: <code>label</code>, <code>sentence1</code>, and <code>sentence2</code>
* Approximate statistics based on the first 1000 samples:
  |         | label                        | sentence1                                                                         | sentence2                                                                         |
  |:--------|:-----------------------------|:----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|
  | type    | int                          | string                                                                            | string                                                                            |
  | details | <ul><li>1: 100.00%</li></ul> | <ul><li>min: 7 tokens</li><li>mean: 17.44 tokens</li><li>max: 53 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 38.0 tokens</li><li>max: 151 tokens</li></ul> |
* Samples:
  | label          | sentence1                                                                                                                                                     | sentence2                                                                                                                                                                                                           |
  |:---------------|:--------------------------------------------------------------------------------------------------------------------------------------------------------------|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
  | <code>1</code> | <code>Penguins has a rating of less than 92 % , defined by more than 20 reviews on Rotten Tomatoes .</code>                                                   | <code>On review aggregator Rotten Tomatoes , the film holds an approval rating of 91 % based on 22 reviews , with an average rating of 7.14/10 .</code>                                                             |
  | <code>1</code> | <code>Fluoxetine , acts as a positive allosteric modulator of the GABAA receptor at high concentrations , as does norfluoxetine though more potently .</code> | <code>In addition , it acts as a positive allosteric modulator of the GABAA receptor at high concentrations , and norfluoxetine does the same but more potently , actions which may be clinically-relevant .</code> |
  | <code>1</code> | <code>Andrew Robertson is considered by many experts to be one of the best left backs .</code>                                                                | <code>He is considered by many pundits to be one of the best left backs in the world due to his pace and crossing ability.</code>                                                                                   |
* Loss: [<code>GISTEmbedLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#gistembedloss) with these parameters:
  ```
  {'guide': SentenceTransformer(
    (0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel 
    (1): Pooling({'word_embedding_dimension': 384, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
    (2): Normalize()
  ), 'temperature': 0.05}
  ```

#### qnli-contrastive

* Dataset: [qnli-contrastive](https://huggingface.co/datasets/nyu-mll/glue) at [bcdcba7](https://huggingface.co/datasets/nyu-mll/glue/tree/bcdcba79d07bc864c1c254ccfcedcce55bcc9a8c)
* Size: 104,743 training samples
* Columns: <code>sentence1</code>, <code>sentence2</code>, and <code>label</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                         | sentence2                                                                          | label                        |
  |:--------|:----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:-----------------------------|
  | type    | string                                                                            | string                                                                             | int                          |
  | details | <ul><li>min: 3 tokens</li><li>mean: 13.82 tokens</li><li>max: 39 tokens</li></ul> | <ul><li>min: 5 tokens</li><li>mean: 34.56 tokens</li><li>max: 110 tokens</li></ul> | <ul><li>0: 100.00%</li></ul> |
* Samples:
  | sentence1                                                                          | sentence2                                                                                                                                                                                                                       | label          |
  |:-----------------------------------------------------------------------------------|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:---------------|
  | <code>Which Formula One racing team developed the C-X75's used for filming.</code> | <code>The C-X75s used for filming were developed by the engineering division of Formula One racing team Williams, who built the original C-X75 prototype for Jaguar.</code>                                                     | <code>0</code> |
  | <code>When did the University of Michigan leave Detroit?</code>                    | <code>In June 2009, the Michigan State University College of Osteopathic Medicine which is based in East Lansing opened a satellite campus located at the Detroit Medical Center.</code>                                        | <code>0</code> |
  | <code>When did the Vlachs migrate into the region?</code>                          | <code>The Gorals of southern Poland and northern Slovakia are partially descended from Romance-speaking Vlachs who migrated into the region from the 14th to 17th centuries and were absorbed into the local population.</code> | <code>0</code> |
* Loss: [<code>OnlineContrastiveLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#onlinecontrastiveloss)

#### scitail-pairs-qa

* Dataset: [scitail-pairs-qa](https://huggingface.co/datasets/allenai/scitail) at [0cc4353](https://huggingface.co/datasets/allenai/scitail/tree/0cc4353235b289165dfde1c7c5d1be983f99ce44)
* Size: 14,987 training samples
* Columns: <code>sentence2</code> and <code>sentence1</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence2                                                                         | sentence1                                                                         |
  |:--------|:----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|
  | type    | string                                                                            | string                                                                            |
  | details | <ul><li>min: 7 tokens</li><li>mean: 16.04 tokens</li><li>max: 41 tokens</li></ul> | <ul><li>min: 6 tokens</li><li>mean: 15.14 tokens</li><li>max: 34 tokens</li></ul> |
* Samples:
  | sentence2                                                                             | sentence1                                                                               |
  |:--------------------------------------------------------------------------------------|:----------------------------------------------------------------------------------------|
  | <code>Voltage is not the same as energy, but means the energy per unit charge.</code> | <code>What term is not the same as energy, but means the energy per unit charge?</code> |
  | <code>A jellyfish does not have a circulatory system.</code>                          | <code>Name the type of system that a jellyfish does not have?</code>                    |
  | <code>Insight learning is based on past experience and reasoning.</code>              | <code>What type of learning is based on past experience and reasoning?</code>           |
* Loss: [<code>MultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativesrankingloss) with these parameters:
  ```json
  {
      "scale": 20.0,
      "similarity_fct": "cos_sim"
  }
  ```

#### scitail-pairs-pos

* Dataset: [scitail-pairs-pos](https://huggingface.co/datasets/allenai/scitail) at [0cc4353](https://huggingface.co/datasets/allenai/scitail/tree/0cc4353235b289165dfde1c7c5d1be983f99ce44)
* Size: 8,600 training samples
* Columns: <code>sentence1</code> and <code>sentence2</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                         | sentence2                                                                         |
  |:--------|:----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|
  | type    | string                                                                            | string                                                                            |
  | details | <ul><li>min: 6 tokens</li><li>mean: 23.99 tokens</li><li>max: 65 tokens</li></ul> | <ul><li>min: 7 tokens</li><li>mean: 15.54 tokens</li><li>max: 39 tokens</li></ul> |
* Samples:
  | sentence1                                                                                                        | sentence2                                                                                                         |
  |:-----------------------------------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------------------------------------|
  | <code>A) A calorie is a unit of measure used to express the amount of energy a food produces in the body.</code> | <code>Another unit of energy, used widely in the health professions and everyday life, is calorie ( cal )?</code> |
  | <code>solid 1 A state that retains shape independent of the shape of the container it occupies.</code>           | <code>Solid takes neither the shape nor the volume of its container.</code>                                       |
  | <code>Sometimes the two sides of a fracture moved due to the pressure and a fault was formed.</code>             | <code>A fault is the fracture caused when rocks on both sides move.</code>                                        |
* Loss: [<code>MultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativesrankingloss) with these parameters:
  ```json
  {
      "scale": 20.0,
      "similarity_fct": "cos_sim"
  }
  ```

#### xsum-pairs

* Dataset: [xsum-pairs](https://huggingface.co/datasets/sentence-transformers/xsum) at [788ddaf](https://huggingface.co/datasets/sentence-transformers/xsum/tree/788ddafe04e539956d56b567bc32a036ee7b9206)
* Size: 150,000 training samples
* Columns: <code>sentence1</code> and <code>sentence2</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                            | sentence2                                                                         |
  |:--------|:-------------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|
  | type    | string                                                                               | string                                                                            |
  | details | <ul><li>min: 13 tokens</li><li>mean: 346.32 tokens</li><li>max: 512 tokens</li></ul> | <ul><li>min: 7 tokens</li><li>mean: 26.95 tokens</li><li>max: 66 tokens</li></ul> |
* Samples:
  | sentence1                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                          | sentence2                                                                                                                                           
           |
  |:------------------------------------------------------------|:------------------------------------------------------------|
  | <code>Jacob Murphy fired in his 10th goal of the season from inside the box to give the Canaries the lead at the break.<br>Adam Hammill, Angus MacDonald and Marley Watkins all went close for the visitors after the restart.<br>Norwich then stretched their lead thanks to MacDonald's own goal to leave them five points behind sixth-placed Sheffield Wednesday.<br>Victory means caretaker boss Alan Irvine has now claimed four points from a possible six since the departure of Alex Neil.<br>The hosts dominated the early proceedings, with Jonny Howson and Alex Pritchard both being denied by Barnsley keeper Adam Davies.<br>After Hammill had a goal ruled out for a clear offside at the other end, winger Murphy gave the Canaries a deserved lead moments before the break when, having being picked out by Cameron Jerome, he drilled a shot low and into the corner of the net.<br>Hammill was unlucky to not get a strong enough flick on Andy Yiadom's cross to make it 1-1 after the restart and MacDonald saw a close-range effort well saved by Michael McGovern from the resulting corner.<br>But, after Steven Naismith fired over for the Canaries with just the keeper to beat, they doubled their lead in fortunate circumstances as an effort from Murphy deflected off MacDonald into the net.<br>Jerome and Howson then went close to adding a third as Norwich coasted to three points.<br>Norwich caretaker manager Alan Irvine:<br>"I was asked to take charge for two games and I have done that. I haven't heard anything more about what happens going forward, but I should imagine I will be speaking to someone soon to find out what happens next week.<br>"If that is to be my last game in charge it was a good way to finish - and the win certainly makes it interesting as far as the play-offs are concerned.<br>"Being five points behind sounds a lot better than being eight points behind - and as I said last week there are still plenty of points to play for."<br>Barnsley manager Paul Heckingbottom:<br>"The take-away message from that game is hit the target, score goals.<br>"There were plenty of positives to take away from it, but if you are going to get anything in this league you have got to be clinical in front of goal.<br>"It's frustrating, but there is still plenty to play for. We will keep striving to get that perfect performance and obviously want to win as many games as possible between now and the end of the season."<br>Match ends, Norwich City 2, Barnsley 0.<br>Second Half ends, Norwich City 2, Barnsley 0.<br>Hand ball by Nélson Oliveira (Norwich City).<br>Attempt missed. Ryan Kent (Barnsley) right footed shot from the centre of the box is close, but misses to the left. Assisted by Ryan Hedges with a cross.<br>Attempt saved. Nélson Oliveira (Norwich City) left footed shot from outside the box is saved in the centre of the goal.<br>Alex Pritchard (Norwich City) wins a free kick in the attacking half.<br>Foul by Alex Mowatt (Barnsley).<br>Corner,  Barnsley. Conceded by Jonny Howson.<br>Foul by Graham Dorrans (Norwich City).<br>Matthew James (Barnsley) wins a free kick in the defensive half.<br>Attempt missed. Tom Bradshaw (Barnsley) left footed shot from the centre of the box is too high. Assisted by Gethin Jones with a cross.<br>Attempt missed. Steven Naismith (Norwich City) right footed shot from the right side of the box misses to the left. Assisted by Alex Pritchard.<br>Corner,  Norwich City. Conceded by Angus MacDonald.<br>Attempt blocked. Jonny Howson (Norwich City) right footed shot from the right side of the box is blocked. Assisted by Graham Dorrans with a through ball.<br>Substitution, Norwich City. Graham Dorrans replaces Jacob Murphy.<br>Substitution, Norwich City. Nélson Oliveira replaces Cameron Jerome.<br>Substitution, Barnsley. Ryan Hedges replaces Adam Hammill.<br>Attempt missed. Ryan Kent (Barnsley) left footed shot from the centre of the box is high and wide to the left. Assisted by Matthew James with a cross.<br>Attempt saved. Cameron Jerome (Norwich City) right footed shot from the centre of the box is saved in the bottom right corner. Assisted by Jacob Murphy with a through ball.<br>Substitution, Barnsley. Alex Mowatt replaces Marley Watkins.<br>Corner,  Barnsley. Conceded by Ivo Pinto.<br>Corner,  Barnsley. Conceded by Russell Martin.<br>Attempt blocked. Tom Bradshaw (Barnsley) right footed shot from the right side of the box is blocked. Assisted by Ryan Kent.<br>Own Goal by Angus MacDonald, Barnsley.  Norwich City 2, Barnsley 0.<br>Attempt saved. Jacob Murphy (Norwich City) right footed shot from the centre of the box is saved in the bottom right corner. Assisted by Alex Pritchard.<br>Attempt saved. Steven Naismith (Norwich City) left footed shot from the centre of the box is saved in the bottom left corner. Assisted by Steven Whittaker with a cross.<br>Ivo Pinto (Norwich City) wins a free kick in the defensive half.<br>Foul by Adam Hammill (Barnsley).<br>Attempt saved. Ryan Kent (Barnsley) right footed shot from outside the box is saved in the centre of the goal. Assisted by Marley Watkins.<br>Attempt missed. Josh Scowen (Barnsley) right footed shot from outside the box is high and wide to the right. Assisted by Adam Hammill.<br>Jacob Murphy (Norwich City) wins a free kick in the attacking half.<br>Foul by Angus MacDonald (Barnsley).<br>Ryan Bennett (Norwich City) wins a free kick in the defensive half.<br>Foul by Marc Roberts (Barnsley).<br>Ivo Pinto (Norwich City) is shown the yellow card for a bad foul.<br>Foul by Ivo Pinto (Norwich City).<br>Ryan Kent (Barnsley) wins a free kick in the attacking half.<br>Foul by Ryan Bennett (Norwich City).<br>Tom Bradshaw (Barnsley) wins a free kick in the attacking half.<br>Attempt missed. Steven Naismith (Norwich City) left footed shot from the left side of the box is too high. Assisted by Alex Pritchard.</code> | <code>Norwich City kept their Championship play-off hopes alive by beating Barnsley at Carrow Road.</code> |
  | <code>Political reporter Samantha Maiden said the offensive text, which also contained strong language, was intended for disgraced ex-minister Jamie Briggs.<br>She said Mr Dutton apologised for the message about her article referring to Mr Briggs' recent resignation.<br>The BBC has approached Mr Dutton's office for comment.<br>He reportedly told News Corp in a statement he is expecting a "tough time" in Ms Maiden's next article.<br>"Sam and I have exchanged some robust language over the years so we had a laugh after this and I apologised to her straightaway, which she took in good faith," Mr Dutton was quoted as saying.<br>Former Cities Minister Jamie Briggs resigned last week following a complaint from a female public servant over his alleged conduct during a night out in Hong Kong.</code> | <code>Australia's Immigration Minister Peter Dutton has reportedly apologised for mistakenly sending an SMS to a journalist, calling her a "mad witch".</code> |
  | <code>Demonstrators have moved around several sites since April to highlight a crisis in temporary housing.<br>The council's lawyer told the court "trespass, highways and planning laws" were the grounds for the case.<br>The cost to the council in terms of additional policing, security and legal costs has exceeded £100,000, he added.<br>Ahead of the hearing, tents were set up and a banner reading "The homeless resistance" was hung outside Manchester Civil Justice Centre.<br>'Grave and serious'<br>Protesters said they hoped to be offered "permanent, suitable accommodation".<br>Some had earlier refused temporary accommodation offered by the council because they said it was "not suitable" and they felt unsafe.<br>The council said it had engaged with the protestors and had offered them support, but it could not accept anti-social behaviour and disruption to residents and businesses.<br>Councillor Nigel Murphy added the exclusion order was "designed to prevent the recurrence of camps and not targeted at individual rough sleepers".<br>He said the council would work with police and court bailiffs to "regain possession" of areas taken over by camps in St Ann's Square and Castlefield as soon as possible.<br>John Clegg, from Unison's community branch, said there was a lack of social housing in Manchester.<br>He added: "There is a large amount of money for building private flats, more hotels are going up all the time, but there are no plans to build any social housing. That's wrong. That's absolutely wrong."<br>"In our view an injunction is a form of gating, and sending out a message that poor people are not wanted and should not be coming in to the city centre."</code> | <code>A Manchester City Council application for an injunction to stop the setting up of homeless camps in the city centre has been granted.</code> |
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
  ```json
  {
      "scale": 20.0,
      "similarity_fct": "cos_sim"
  }
  ```

#### compression-pairs

* Dataset: [compression-pairs](https://huggingface.co/datasets/sentence-transformers/sentence-compression) at [605bc91](https://huggingface.co/datasets/sentence-transformers/sentence-compression/tree/605bc91d95631895ba25b6eda51a3cb596976c90)
* Size: 180,000 training samples
* Columns: <code>sentence1</code> and <code>sentence2</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                           | sentence2                                                                         |
  |:--------|:------------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|
  | type    | string                                                                              | string                                                                            |
  | details | <ul><li>min: 10 tokens</li><li>mean: 31.89 tokens</li><li>max: 125 tokens</li></ul> | <ul><li>min: 5 tokens</li><li>mean: 10.21 tokens</li><li>max: 28 tokens</li></ul> |
* Samples:
  | sentence1                                                                                                                                                                                                                                          | sentence2                                              |
  |:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-------------------------------------------------------|
  | <code>The USHL completed an expansion draft on Monday as 10 players who were on the rosters of USHL teams during the 2009-10 season were selected by the League's two newest entries, the Muskegon Lumberjacks and Dubuque Fighting Saints.</code> | <code>USHL completes expansion draft</code>            |
  | <code>Major League Baseball Commissioner Bud Selig will be speaking at St. Norbert College next month.</code>                                                                                                                                      | <code>Bud Selig to speak at St. Norbert College</code> |
  | <code>It's fresh cherry time in Michigan and the best time to enjoy this delicious and nutritious fruit.</code>                                                                                                                                    | <code>It's cherry time</code>                          |
* Loss: [<code>MultipleNegativesSymmetricRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativessymmetricrankingloss) with these parameters:
  ```json
  {
      "scale": 20.0,
      "similarity_fct": "cos_sim"
  }
  ```

### Evaluation Datasets

#### nli-pairs

* Dataset: [nli-pairs](https://huggingface.co/datasets/sentence-transformers/all-nli) at [d482672](https://huggingface.co/datasets/sentence-transformers/all-nli/tree/d482672c8e74ce18da116f430137434ba2e52fab)
* Size: 6,808 evaluation samples
* Columns: <code>sentence1</code> and <code>sentence2</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                         | sentence2                                                                        |
  |:--------|:----------------------------------------------------------------------------------|:---------------------------------------------------------------------------------|
  | type    | string                                                                            | string                                                                           |
  | details | <ul><li>min: 5 tokens</li><li>mean: 17.64 tokens</li><li>max: 63 tokens</li></ul> | <ul><li>min: 4 tokens</li><li>mean: 9.67 tokens</li><li>max: 29 tokens</li></ul> |
* Samples:
  | sentence1                                                                                                                                                                      | sentence2                                                   |
  |:-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:------------------------------------------------------------|
  | <code>Two women are embracing while holding to go packages.</code>                                                                                                             | <code>Two woman are holding packages.</code>                |
  | <code>Two young children in blue jerseys, one with the number 9 and one with the number 2 are standing on wooden steps in a bathroom and washing their hands in a sink.</code> | <code>Two kids in numbered jerseys wash their hands.</code> |
  | <code>A man selling donuts to a customer during a world exhibition event held in the city of Angeles</code>                                                                    | <code>A man selling donuts to a customer.</code>            |
* Loss: [<code>MultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativesrankingloss) with these parameters:
  ```json
  {
      "scale": 20.0,
      "similarity_fct": "cos_sim"
  }
  ```

#### qnli-contrastive

* Dataset: [qnli-contrastive](https://huggingface.co/datasets/nyu-mll/glue) at [bcdcba7](https://huggingface.co/datasets/nyu-mll/glue/tree/bcdcba79d07bc864c1c254ccfcedcce55bcc9a8c)
* Size: 5,463 evaluation samples
* Columns: <code>sentence1</code>, <code>sentence2</code>, and <code>label</code>
* Approximate statistics based on the first 1000 samples:
  |         | sentence1                                                                         | sentence2                                                                          | label                        |
  |:--------|:----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:-----------------------------|
  | type    | string                                                                            | string                                                                             | int                          |
  | details | <ul><li>min: 6 tokens</li><li>mean: 14.13 tokens</li><li>max: 36 tokens</li></ul> | <ul><li>min: 4 tokens</li><li>mean: 36.58 tokens</li><li>max: 225 tokens</li></ul> | <ul><li>0: 100.00%</li></ul> |
* Samples:
  | sentence1                                                                 | sentence2                                                                                                                                        | label          |
  |:--------------------------------------------------------------------------|:-------------------------------------------------------------------------------------------------------------------------------------------------|:---------------|
  | <code>What came into force after the new constitution was herald?</code>  | <code>As of that day, the new constitution heralding the Second Republic came into force.</code>                                                 | <code>0</code> |
  | <code>What is the first major city in the stream of the Rhine?</code>     | <code>The most important tributaries in this area are the Ill below of Strasbourg, the Neckar in Mannheim and the Main across from Mainz.</code> | <code>0</code> |
  | <code>What is the minimum required if you want to teach in Canada?</code> | <code>In most provinces a second Bachelor's Degree such as a Bachelor of Education is required to become a qualified teacher.</code>             | <code>0</code> |
* Loss: [<code>OnlineContrastiveLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#onlinecontrastiveloss)

### Training Hyperparameters
#### Non-Default Hyperparameters

- `eval_strategy`: steps
- `per_device_train_batch_size`: 94
- `per_device_eval_batch_size`: 32
- `learning_rate`: 2e-05
- `weight_decay`: 1e-10
- `num_train_epochs`: 2
- `lr_scheduler_type`: cosine
- `warmup_ratio`: 0.33
- `save_safetensors`: False
- `fp16`: True
- `push_to_hub`: True
- `hub_model_id`: bobox/DeBERTaV3-small-GeneralSentenceTransformer-checkpoints-tmp
- `hub_strategy`: checkpoint
- `batch_sampler`: no_duplicates

#### All Hyperparameters
<details><summary>Click to expand</summary>

- `overwrite_output_dir`: False
- `do_predict`: False
- `eval_strategy`: steps
- `prediction_loss_only`: True
- `per_device_train_batch_size`: 94
- `per_device_eval_batch_size`: 32
- `per_gpu_train_batch_size`: None
- `per_gpu_eval_batch_size`: None
- `gradient_accumulation_steps`: 1
- `eval_accumulation_steps`: None
- `learning_rate`: 2e-05
- `weight_decay`: 1e-10
- `adam_beta1`: 0.9
- `adam_beta2`: 0.999
- `adam_epsilon`: 1e-08
- `max_grad_norm`: 1.0
- `num_train_epochs`: 2
- `max_steps`: -1
- `lr_scheduler_type`: cosine
- `lr_scheduler_kwargs`: {}
- `warmup_ratio`: 0.33
- `warmup_steps`: 0
- `log_level`: passive
- `log_level_replica`: warning
- `log_on_each_node`: True
- `logging_nan_inf_filter`: True
- `save_safetensors`: False
- `save_on_each_node`: False
- `save_only_model`: False
- `restore_callback_states_from_checkpoint`: False
- `no_cuda`: False
- `use_cpu`: False
- `use_mps_device`: False
- `seed`: 42
- `data_seed`: None
- `jit_mode_eval`: False
- `use_ipex`: False
- `bf16`: False
- `fp16`: True
- `fp16_opt_level`: O1
- `half_precision_backend`: auto
- `bf16_full_eval`: False
- `fp16_full_eval`: False
- `tf32`: None
- `local_rank`: 0
- `ddp_backend`: None
- `tpu_num_cores`: None
- `tpu_metrics_debug`: False
- `debug`: []
- `dataloader_drop_last`: False
- `dataloader_num_workers`: 0
- `dataloader_prefetch_factor`: None
- `past_index`: -1
- `disable_tqdm`: False
- `remove_unused_columns`: True
- `label_names`: None
- `load_best_model_at_end`: False
- `ignore_data_skip`: False
- `fsdp`: []
- `fsdp_min_num_params`: 0
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
- `fsdp_transformer_layer_cls_to_wrap`: None
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
- `deepspeed`: None
- `label_smoothing_factor`: 0.0
- `optim`: adamw_torch
- `optim_args`: None
- `adafactor`: False
- `group_by_length`: False
- `length_column_name`: length
- `ddp_find_unused_parameters`: None
- `ddp_bucket_cap_mb`: None
- `ddp_broadcast_buffers`: False
- `dataloader_pin_memory`: True
- `dataloader_persistent_workers`: False
- `skip_memory_metrics`: True
- `use_legacy_prediction_loop`: False
- `push_to_hub`: True
- `resume_from_checkpoint`: None
- `hub_model_id`: bobox/DeBERTaV3-small-GeneralSentenceTransformer-checkpoints-tmp
- `hub_strategy`: checkpoint
- `hub_private_repo`: False
- `hub_always_push`: False
- `gradient_checkpointing`: False
- `gradient_checkpointing_kwargs`: None
- `include_inputs_for_metrics`: False
- `eval_do_concat_batches`: True
- `fp16_backend`: auto
- `push_to_hub_model_id`: None
- `push_to_hub_organization`: None
- `mp_parameters`: 
- `auto_find_batch_size`: False
- `full_determinism`: False
- `torchdynamo`: None
- `ray_scope`: last
- `ddp_timeout`: 1800
- `torch_compile`: False
- `torch_compile_backend`: None
- `torch_compile_mode`: None
- `dispatch_batches`: None
- `split_batches`: None
- `include_tokens_per_second`: False
- `include_num_input_tokens_seen`: False
- `neftune_noise_alpha`: None
- `optim_target_modules`: None
- `batch_eval_metrics`: False
- `batch_sampler`: no_duplicates
- `multi_dataset_batch_sampler`: proportional

</details>

### Training Logs
| Epoch  | Step  | Training Loss | qnli-contrastive loss | nli-pairs loss |
|:------:|:-----:|:-------------:|:---------------------:|:--------------:|
| 0      | 0     | -             | 20.1737               | 4.0959         |
| 0.1001 | 734   | 4.796         | -                     | -              |
| 0.2001 | 1468  | 1.3015        | 0.0358                | 0.9115         |
| 0.3002 | 2202  | 0.89          | -                     | -              |
| 0.4002 | 2936  | 0.716         | 0.0168                | 0.5944         |
| 0.5003 | 3670  | 0.6365        | -                     | -              |
| 0.6003 | 4404  | 0.5883        | 0.0164                | 0.4975         |
| 0.7004 | 5138  | 0.5192        | -                     | -              |
| 0.8004 | 5872  | 0.4961        | 0.0288                | 0.4450         |
| 0.9005 | 6606  | 0.6035        | -                     | -              |
| 1.0005 | 7340  | 0.4733        | 0.0110                | 0.4215         |
| 1.1006 | 8074  | 0.4002        | -                     | -              |
| 1.2007 | 8808  | 0.3929        | 0.0454                | 0.3796         |
| 1.3007 | 9542  | 0.3826        | -                     | -              |
| 1.4008 | 10276 | 0.3522        | 0.0178                | 0.3714         |
| 1.5008 | 11010 | 0.3627        | -                     | -              |
| 1.6009 | 11744 | 0.3553        | 0.0257                | 0.3629         |
| 1.7009 | 12478 | 0.3406        | -                     | -              |
| 1.8010 | 13212 | 0.3288        | 0.0289                | 0.3575         |
| 1.9010 | 13946 | 0.4563        | -                     | -              |


### Framework Versions
- Python: 3.10.12
- Sentence Transformers: 3.0.1
- Transformers: 4.41.2
- PyTorch: 2.3.0+cu121
- Accelerate: 0.31.0
- Datasets: 2.20.0
- Tokenizers: 0.19.1

## Citation

### BibTeX

#### Sentence Transformers
```bibtex
@inproceedings{reimers-2019-sentence-bert,
    title = "{Sentence-BERT}: Sentence Embeddings using {Siamese} {BERT-Networks}",
    author = "Reimers, Nils and Gurevych, Iryna",
    booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
    month = nov,
    year = "2019",
    publisher = "Association for Computational Linguistics",
    url = "https://arxiv.org/abs/1908.10084",
}
```

#### MultipleNegativesRankingLoss
```bibtex
@misc{henderson2017efficient,
    title={Efficient Natural Language Response Suggestion for {Smart Reply}},
    author={Henderson, Matthew and Al-Rfou, Rami and Strope, Brian and Sung, Yun-hsuan and Lukacs, Laszlo and Guo, Ruiqi and Kumar, Sanjiv and Miklos, Balint and Kurzweil, Ray},
    year={2017},
    eprint={1705.00652},
    archivePrefix={arXiv},
    primaryClass={cs.CL}
}
```

#### CoSENTLoss
```bibtex
@online{kexuefm-8847,
    title={{CoSENT}: A more efficient sentence vector scheme than {Sentence-BERT}},
    author={Su, Jianlin},
    year={2022},
    month=jan,
    url={https://kexue.fm/archives/8847},
}
```

#### GISTEmbedLoss
```bibtex
@misc{solatorio2024gistembed,
    title={{GISTEmbed}: Guided In-sample Selection of Training Negatives for Text Embedding Fine-tuning},
    author={Solatorio, Aivin V.},
    year={2024},
    eprint={2402.16829},
    archivePrefix={arXiv},
    primaryClass={cs.LG}
}
```

<!--
## Glossary

*Clearly define terms in order to be accessible across audiences.*
-->

<!--
## Model Card Authors

*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
-->

<!--
## Model Card Contact

*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
-->