96abhishekarora
committed on
Commit
•
98e7174
1
Parent(s):
c70faba
Modified validation and training for linktransformer model
Browse files
- .gitattributes +1 -0
- README.md +3 -3
- model.safetensors +1 -1
.gitattributes
CHANGED
@@ -35,3 +35,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
37 |
.git/lfs/objects/1a/76/1a76a58ef6d75109a94ea9fef24bd95c3e37b89337a9263dfd2e78be67d40fad filter=lfs diff=lfs merge=lfs -text
|
|
|
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
37 |
.git/lfs/objects/1a/76/1a76a58ef6d75109a94ea9fef24bd95c3e37b89337a9263dfd2e78be67d40fad filter=lfs diff=lfs merge=lfs -text
|
38 |
+
.git/lfs/objects/d1/50/d150d5f1dc925180772426d6240cefc69cc62920fad2a06d088e0ce6ec787d61 filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
@@ -97,7 +97,7 @@ The model was trained with the parameters:
|
|
97 |
|
98 |
**DataLoader**:
|
99 |
|
100 |
-
`torch.utils.data.dataloader.DataLoader` of length
|
101 |
```
|
102 |
{'batch_size': 64, 'sampler': 'torch.utils.data.dataloader._InfiniteConstantSampler', 'batch_sampler': 'torch.utils.data.sampler.BatchSampler'}
|
103 |
```
|
@@ -110,7 +110,7 @@ Parameters of the fit()-Method:
|
|
110 |
```
|
111 |
{
|
112 |
"epochs": 70,
|
113 |
-
"evaluation_steps":
|
114 |
"evaluator": "sentence_transformers.evaluation.SequentialEvaluator.SequentialEvaluator",
|
115 |
"max_grad_norm": 1,
|
116 |
"optimizer_class": "<class 'torch.optim.adamw.AdamW'>",
|
@@ -119,7 +119,7 @@ Parameters of the fit()-Method:
|
|
119 |
},
|
120 |
"scheduler": "WarmupLinear",
|
121 |
"steps_per_epoch": null,
|
122 |
-
"warmup_steps":
|
123 |
"weight_decay": 0.01
|
124 |
}
|
125 |
```
|
|
|
97 |
|
98 |
**DataLoader**:
|
99 |
|
100 |
+
`torch.utils.data.dataloader.DataLoader` of length 50 with parameters:
|
101 |
```
|
102 |
{'batch_size': 64, 'sampler': 'torch.utils.data.dataloader._InfiniteConstantSampler', 'batch_sampler': 'torch.utils.data.sampler.BatchSampler'}
|
103 |
```
|
|
|
110 |
```
|
111 |
{
|
112 |
"epochs": 70,
|
113 |
+
"evaluation_steps": 25,
|
114 |
"evaluator": "sentence_transformers.evaluation.SequentialEvaluator.SequentialEvaluator",
|
115 |
"max_grad_norm": 1,
|
116 |
"optimizer_class": "<class 'torch.optim.adamw.AdamW'>",
|
|
|
119 |
},
|
120 |
"scheduler": "WarmupLinear",
|
121 |
"steps_per_epoch": null,
|
122 |
+
"warmup_steps": 3500,
|
123 |
"weight_decay": 0.01
|
124 |
}
|
125 |
```
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1346690896
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d417a0fe87c0361764cffc49b15f5bbe663a758233c22ab6d6a51a5ce008adfd
|
3 |
size 1346690896
|