Add new SentenceTransformer model
Browse files
- README.md +14 -15
- model.safetensors +1 -1
README.md
CHANGED
|
@@ -202,7 +202,6 @@ You can finetune this model on your own dataset.
|
|
| 202 |
#### Non-Default Hyperparameters
|
| 203 |
|
| 204 |
- `per_device_train_batch_size`: 256
|
| 205 |
-
- `learning_rate`: 1e-05
|
| 206 |
- `warmup_ratio`: 0.1
|
| 207 |
- `fp16`: True
|
| 208 |
- `batch_sampler`: no_duplicates
|
|
@@ -221,7 +220,7 @@ You can finetune this model on your own dataset.
|
|
| 221 |
- `gradient_accumulation_steps`: 1
|
| 222 |
- `eval_accumulation_steps`: None
|
| 223 |
- `torch_empty_cache_steps`: None
|
| 224 |
-
- `learning_rate`: 1e-05
|
| 225 |
- `weight_decay`: 0.0
|
| 226 |
- `adam_beta1`: 0.9
|
| 227 |
- `adam_beta2`: 0.999
|
|
@@ -330,19 +329,19 @@ You can finetune this model on your own dataset.
|
|
| 330 |
### Training Logs
|
| 331 |
| Epoch | Step | Training Loss |
|
| 332 |
|:------:|:----:|:-------------:|
|
| 333 |
-
| 0.2273 | 10 | 1.
|
| 334 |
-
| 0.4545 | 20 | 1.
|
| 335 |
-
| 0.6818 | 30 | 0.
|
| 336 |
-
| 0.9091 | 40 | 0.
|
| 337 |
-
| 1.1364 | 50 | 1.
|
| 338 |
-
| 1.3636 | 60 | 0.
|
| 339 |
-
| 1.5909 | 70 |
|
| 340 |
-
| 1.8182 | 80 | 0.
|
| 341 |
-
| 2.0455 | 90 | 0.
|
| 342 |
-
| 2.2727 | 100 |
|
| 343 |
-
| 2.5 | 110 | 0.
|
| 344 |
-
| 2.7273 | 120 | 0.
|
| 345 |
-
| 2.9545 | 130 | 0.
|
| 346 |
|
| 347 |
|
| 348 |
### Framework Versions
|
|
|
|
| 202 |
#### Non-Default Hyperparameters
|
| 203 |
|
| 204 |
- `per_device_train_batch_size`: 256
|
|
|
|
| 205 |
- `warmup_ratio`: 0.1
|
| 206 |
- `fp16`: True
|
| 207 |
- `batch_sampler`: no_duplicates
|
|
|
|
| 220 |
- `gradient_accumulation_steps`: 1
|
| 221 |
- `eval_accumulation_steps`: None
|
| 222 |
- `torch_empty_cache_steps`: None
|
| 223 |
+
- `learning_rate`: 5e-05
|
| 224 |
- `weight_decay`: 0.0
|
| 225 |
- `adam_beta1`: 0.9
|
| 226 |
- `adam_beta2`: 0.999
|
|
|
|
| 329 |
### Training Logs
|
| 330 |
| Epoch | Step | Training Loss |
|
| 331 |
|:------:|:----:|:-------------:|
|
| 332 |
+
| 0.2273 | 10 | 1.6158 |
|
| 333 |
+
| 0.4545 | 20 | 1.1681 |
|
| 334 |
+
| 0.6818 | 30 | 0.8775 |
|
| 335 |
+
| 0.9091 | 40 | 0.7628 |
|
| 336 |
+
| 1.1364 | 50 | 1.0154 |
|
| 337 |
+
| 1.3636 | 60 | 0.7048 |
|
| 338 |
+
| 1.5909 | 70 | 0.7981 |
|
| 339 |
+
| 1.8182 | 80 | 0.6322 |
|
| 340 |
+
| 2.0455 | 90 | 0.4916 |
|
| 341 |
+
| 2.2727 | 100 | 0.8441 |
|
| 342 |
+
| 2.5 | 110 | 0.6697 |
|
| 343 |
+
| 2.7273 | 120 | 0.5358 |
|
| 344 |
+
| 2.9545 | 130 | 0.5111 |
|
| 345 |
|
| 346 |
|
| 347 |
### Framework Versions
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 437951328
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b94852c6a04ca84b6478f9b3af75a7bff023c8ae5ed7db43464461ca19e98ea0
|
| 3 |
size 437951328
|