ep9io committed on
Commit
77aafbc
1 Parent(s): 7c047c3

Upload README.md with huggingface_hub

Browse files
Files changed (1) hide show
  1. README.md +52 -52
README.md CHANGED
@@ -11,7 +11,7 @@ developers: Tristan Everitt and Paul Ryan
11
  model_card_authors: See developers
12
  model_card_contact: See developers
13
  repo: https://gitlab.computing.dcu.ie/everitt2/2024-mcm-everitt-ryan
14
- training_regime: 'PEFT: None, accelerator_config="{''split_batches'': False, ''dispatch_batches'':
15
  None, ''even_batches'': True, ''use_seedable_sampler'': True, ''non_blocking'':
16
  False, ''gradient_accumulation_kwargs'': None}", adafactor=false, adam_beta1=0.9,
17
  adam_beta2=0.999, adam_epsilon=1e-08, auto_find_batch_size=false, batch_eval_metrics=false,
@@ -40,20 +40,20 @@ training_regime: 'PEFT: None, accelerator_config="{''split_batches'': False, ''d
40
  train_batch_size=8, use_cpu=false, use_ipex=false, use_legacy_prediction_loop=false,
41
  use_mps_device=false, warmup_ratio=0.0, warmup_steps=0, weight_decay=0.001'
42
  results: " precision recall f1-score support\n \n \
43
- \ age 0.91 0.49 0.63 80\n disability 0.97\
44
- \ 0.47 0.64 80\n feminine 0.99 0.86 0.92\
45
- \ 80\n general 0.82 0.56 0.67 80\n masculine\
46
- \ 0.62 0.65 0.63 80\n neutral 0.35 0.90\
47
- \ 0.50 80\n racial 0.89 0.80 0.84 80\n\
48
- \ sexuality 0.95 0.75 0.84 80\n \n micro avg\
49
- \ 0.69 0.69 0.69 640\n macro avg 0.81 0.69\
50
- \ 0.71 640\n weighted avg 0.81 0.69 0.71 640\n\
51
- \ samples avg 0.70 0.74 0.71 640\n "
52
- compute_infrastructure: '- Linux 6.5.0-35-generic x86_64
53
 
54
- - MemTotal: 1056613768 kB
55
 
56
- - 256 X AMD EPYC 7702 64-Core Processor
57
 
58
  - GPU_0: NVIDIA L40S'
59
  software: python 3.10.12, accelerate 0.32.1, aiohttp 3.9.5, aiosignal 1.3.1, anyio
@@ -104,7 +104,7 @@ software: python 3.10.12, accelerate 0.32.1, aiohttp 3.9.5, aiosignal 1.3.1, any
104
  webcolors 1.13, webencodings 0.5.1, websocket-client 1.7.0, wheel 0.42.0, widgetsnbextension
105
  4.0.9, xxhash 3.4.1, yarl 1.9.4, zipp 1.0.0
106
  hardware_type: 1 X NVIDIA L40S
107
- hours_used: '6.22'
108
  cloud_provider: N/A
109
  cloud_region: N/A
110
  co2_emitted: N/A
@@ -134,47 +134,47 @@ model-index:
134
  type: mix_human-eval_synthetic
135
  metrics:
136
  - type: loss
137
- value: 0.31148761510849
138
  - type: accuracy
139
- value: 0.6523972602739726
140
  - type: f1_micro
141
- value: 0.6891679748822606
142
  - type: precision_micro
143
- value: 0.692429022082019
144
  - type: recall_micro
145
- value: 0.6859375
146
  - type: roc_auc_micro
147
- value: 0.8187872023809524
148
  - type: f1_macro
149
- value: 0.709360114262138
150
  - type: precision_macro
151
- value: 0.8114628911140539
152
  - type: recall_macro
153
- value: 0.6859375000000001
154
  - type: roc_auc_macro
155
- value: 0.8187872023809524
156
  - type: f1_samples
157
- value: 0.7119863013698631
158
  - type: precision_samples
159
- value: 0.7029109589041096
160
  - type: recall_samples
161
- value: 0.7360159817351598
162
  - type: roc_auc_samples
163
- value: 0.8432444553163732
164
  - type: f1_weighted
165
- value: 0.709360114262138
166
  - type: precision_weighted
167
- value: 0.8114628911140539
168
  - type: recall_weighted
169
- value: 0.6859375
170
  - type: roc_auc_weighted
171
- value: 0.8187872023809526
172
  - type: runtime
173
- value: 373.8217
174
  - type: samples_per_second
175
- value: 1.562
176
  - type: steps_per_second
177
- value: 0.195
178
  - type: epoch
179
  value: 3.0
180
  ---
@@ -286,7 +286,7 @@ Use the code below to get started with the model.
286
 
287
  #### Training Hyperparameters
288
 
289
- - **Training regime:** PEFT: None, accelerator_config="{'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}", adafactor=false, adam_beta1=0.9, adam_beta2=0.999, adam_epsilon=1e-08, auto_find_batch_size=false, batch_eval_metrics=false, bf16=false, bf16_full_eval=false, data_seed="None", dataloader_drop_last=false, dataloader_num_workers=0, dataloader_persistent_workers=false, dataloader_pin_memory=true, dataloader_prefetch_factor="None", ddp_backend="None", ddp_broadcast_buffers="None", ddp_bucket_cap_mb="None", ddp_find_unused_parameters="None", ddp_timeout=1800, deepspeed="None", disable_tqdm=false, dispatch_batches="None", do_eval=true, do_predict=false, do_train=false, eval_accumulation_steps="None", eval_batch_size=8, eval_delay=0, eval_do_concat_batches=true, eval_on_start=false, eval_steps="None", eval_strategy="epoch", evaluation_strategy="None", fp16=false, fp16_backend="auto", fp16_full_eval=false, fp16_opt_level="O1", fsdp="[]", fsdp_config="{'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}", fsdp_min_num_params=0, fsdp_transformer_layer_cls_to_wrap="None", full_determinism=false, gradient_accumulation_steps=1, gradient_checkpointing="(False,)", gradient_checkpointing_kwargs="None", greater_is_better=false, group_by_length=true, half_precision_backend="auto", ignore_data_skip=false, include_inputs_for_metrics=false, jit_mode_eval=false, label_names="None", label_smoothing_factor=0.0, learning_rate=0.0001, length_column_name="length", load_best_model_at_end=true, local_rank=0, lr_scheduler_kwargs="{}", lr_scheduler_type="linear", max_grad_norm=1.0, max_steps=-1, metric_for_best_model="loss", mp_parameters="", neftune_noise_alpha="None", no_cuda=false, num_train_epochs=3, optim="adamw_torch", optim_args="None", optim_target_modules="None", past_index=-1, per_device_eval_batch_size=8, 
per_device_train_batch_size=8, per_gpu_eval_batch_size="None", per_gpu_train_batch_size="None", prediction_loss_only=false, ray_scope="last", remove_unused_columns=true, report_to="[]", restore_callback_states_from_checkpoint=false, resume_from_checkpoint="None", seed=42, skip_memory_metrics=true, split_batches="None", tf32="None", torch_compile=false, torch_compile_backend="None", torch_compile_mode="None", torchdynamo="None", tpu_num_cores="None", train_batch_size=8, use_cpu=false, use_ipex=false, use_legacy_prediction_loop=false, use_mps_device=false, warmup_ratio=0.0, warmup_steps=0, weight_decay=0.001 <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
290
 
291
  #### Speeds, Sizes, Times [optional]
292
 
@@ -322,19 +322,19 @@ Use the code below to get started with the model.
322
 
323
  precision recall f1-score support
324
 
325
- age 0.91 0.49 0.63 80
326
- disability 0.97 0.47 0.64 80
327
- feminine 0.99 0.86 0.92 80
328
- general 0.82 0.56 0.67 80
329
- masculine 0.62 0.65 0.63 80
330
- neutral 0.35 0.90 0.50 80
331
- racial 0.89 0.80 0.84 80
332
- sexuality 0.95 0.75 0.84 80
333
 
334
- micro avg 0.69 0.69 0.69 640
335
- macro avg 0.81 0.69 0.71 640
336
- weighted avg 0.81 0.69 0.71 640
337
- samples avg 0.70 0.74 0.71 640
338
 
339
 
340
  #### Summary
@@ -354,7 +354,7 @@ Use the code below to get started with the model.
354
  Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
355
 
356
  - **Hardware Type:** 1 X NVIDIA L40S
357
- - **Hours used:** 6.22
358
  - **Cloud Provider:** N/A
359
  - **Compute Region:** N/A
360
  - **Carbon Emitted:** N/A
@@ -367,9 +367,9 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
367
 
368
  ### Compute Infrastructure
369
 
370
- - Linux 6.5.0-35-generic x86_64
371
- - MemTotal: 1056613768 kB
372
- - 256 X AMD EPYC 7702 64-Core Processor
373
  - GPU_0: NVIDIA L40S
374
 
375
  #### Hardware
 
11
  model_card_authors: See developers
12
  model_card_contact: See developers
13
  repo: https://gitlab.computing.dcu.ie/everitt2/2024-mcm-everitt-ryan
14
+ training_regime: 'accelerator_config="{''split_batches'': False, ''dispatch_batches'':
15
  None, ''even_batches'': True, ''use_seedable_sampler'': True, ''non_blocking'':
16
  False, ''gradient_accumulation_kwargs'': None}", adafactor=false, adam_beta1=0.9,
17
  adam_beta2=0.999, adam_epsilon=1e-08, auto_find_batch_size=false, batch_eval_metrics=false,
 
40
  train_batch_size=8, use_cpu=false, use_ipex=false, use_legacy_prediction_loop=false,
41
  use_mps_device=false, warmup_ratio=0.0, warmup_steps=0, weight_decay=0.001'
42
  results: " precision recall f1-score support\n \n \
43
+ \ age 0.72 0.60 0.65 80\n disability 0.95\
44
+ \ 0.50 0.66 80\n feminine 0.99 0.91 0.95\
45
+ \ 80\n general 0.84 0.46 0.60 80\n masculine\
46
+ \ 0.65 0.66 0.66 80\n neutral 0.34 0.86\
47
+ \ 0.49 80\n racial 0.90 0.82 0.86 80\n\
48
+ \ sexuality 0.97 0.75 0.85 80\n \n micro avg\
49
+ \ 0.69 0.70 0.69 640\n macro avg 0.80 0.70\
50
+ \ 0.71 640\n weighted avg 0.80 0.70 0.71 640\n\
51
+ \ samples avg 0.71 0.74 0.72 640\n "
52
+ compute_infrastructure: '- Linux 6.5.0-28-generic x86_64
53
 
54
+ - MemTotal: 527988292 kB
55
 
56
+ - 64 X Intel(R) Xeon(R) Silver 4314 CPU @ 2.40GHz
57
 
58
  - GPU_0: NVIDIA L40S'
59
  software: python 3.10.12, accelerate 0.32.1, aiohttp 3.9.5, aiosignal 1.3.1, anyio
 
104
  webcolors 1.13, webencodings 0.5.1, websocket-client 1.7.0, wheel 0.42.0, widgetsnbextension
105
  4.0.9, xxhash 3.4.1, yarl 1.9.4, zipp 1.0.0
106
  hardware_type: 1 X NVIDIA L40S
107
+ hours_used: '4.18'
108
  cloud_provider: N/A
109
  cloud_region: N/A
110
  co2_emitted: N/A
 
134
  type: mix_human-eval_synthetic
135
  metrics:
136
  - type: loss
137
+ value: 0.2838529944419861
138
  - type: accuracy
139
+ value: 0.6438356164383562
140
  - type: f1_micro
141
+ value: 0.6947040498442367
142
  - type: precision_micro
143
+ value: 0.6925465838509317
144
  - type: recall_micro
145
+ value: 0.696875
146
  - type: roc_auc_micro
147
+ value: 0.8238839285714286
148
  - type: f1_macro
149
+ value: 0.7138661109496585
150
  - type: precision_macro
151
+ value: 0.7957063168116414
152
  - type: recall_macro
153
+ value: 0.6968749999999999
154
  - type: roc_auc_macro
155
+ value: 0.8238839285714286
156
  - type: f1_samples
157
+ value: 0.7163078930202218
158
  - type: precision_samples
159
+ value: 0.7057648401826483
160
  - type: recall_samples
161
+ value: 0.7441495433789955
162
  - type: roc_auc_samples
163
+ value: 0.8469646934116113
164
  - type: f1_weighted
165
+ value: 0.7138661109496585
166
  - type: precision_weighted
167
+ value: 0.7957063168116415
168
  - type: recall_weighted
169
+ value: 0.696875
170
  - type: roc_auc_weighted
171
+ value: 0.8238839285714284
172
  - type: runtime
173
+ value: 251.9003
174
  - type: samples_per_second
175
+ value: 2.318
176
  - type: steps_per_second
177
+ value: 0.29
178
  - type: epoch
179
  value: 3.0
180
  ---
 
286
 
287
  #### Training Hyperparameters
288
 
289
+ - **Training regime:** accelerator_config="{'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}", adafactor=false, adam_beta1=0.9, adam_beta2=0.999, adam_epsilon=1e-08, auto_find_batch_size=false, batch_eval_metrics=false, bf16=false, bf16_full_eval=false, data_seed="None", dataloader_drop_last=false, dataloader_num_workers=0, dataloader_persistent_workers=false, dataloader_pin_memory=true, dataloader_prefetch_factor="None", ddp_backend="None", ddp_broadcast_buffers="None", ddp_bucket_cap_mb="None", ddp_find_unused_parameters="None", ddp_timeout=1800, deepspeed="None", disable_tqdm=false, dispatch_batches="None", do_eval=true, do_predict=false, do_train=false, eval_accumulation_steps="None", eval_batch_size=8, eval_delay=0, eval_do_concat_batches=true, eval_on_start=false, eval_steps="None", eval_strategy="epoch", evaluation_strategy="None", fp16=false, fp16_backend="auto", fp16_full_eval=false, fp16_opt_level="O1", fsdp="[]", fsdp_config="{'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}", fsdp_min_num_params=0, fsdp_transformer_layer_cls_to_wrap="None", full_determinism=false, gradient_accumulation_steps=1, gradient_checkpointing="(False,)", gradient_checkpointing_kwargs="None", greater_is_better=false, group_by_length=true, half_precision_backend="auto", ignore_data_skip=false, include_inputs_for_metrics=false, jit_mode_eval=false, label_names="None", label_smoothing_factor=0.0, learning_rate=0.0001, length_column_name="length", load_best_model_at_end=true, local_rank=0, lr_scheduler_kwargs="{}", lr_scheduler_type="linear", max_grad_norm=1.0, max_steps=-1, metric_for_best_model="loss", mp_parameters="", neftune_noise_alpha="None", no_cuda=false, num_train_epochs=3, optim="adamw_torch", optim_args="None", optim_target_modules="None", past_index=-1, per_device_eval_batch_size=8, per_device_train_batch_size=8, 
per_gpu_eval_batch_size="None", per_gpu_train_batch_size="None", prediction_loss_only=false, ray_scope="last", remove_unused_columns=true, report_to="[]", restore_callback_states_from_checkpoint=false, resume_from_checkpoint="None", seed=42, skip_memory_metrics=true, split_batches="None", tf32="None", torch_compile=false, torch_compile_backend="None", torch_compile_mode="None", torchdynamo="None", tpu_num_cores="None", train_batch_size=8, use_cpu=false, use_ipex=false, use_legacy_prediction_loop=false, use_mps_device=false, warmup_ratio=0.0, warmup_steps=0, weight_decay=0.001 <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
290
 
291
  #### Speeds, Sizes, Times [optional]
292
 
 
322
 
323
  precision recall f1-score support
324
 
325
+ age 0.72 0.60 0.65 80
326
+ disability 0.95 0.50 0.66 80
327
+ feminine 0.99 0.91 0.95 80
328
+ general 0.84 0.46 0.60 80
329
+ masculine 0.65 0.66 0.66 80
330
+ neutral 0.34 0.86 0.49 80
331
+ racial 0.90 0.82 0.86 80
332
+ sexuality 0.97 0.75 0.85 80
333
 
334
+ micro avg 0.69 0.70 0.69 640
335
+ macro avg 0.80 0.70 0.71 640
336
+ weighted avg 0.80 0.70 0.71 640
337
+ samples avg 0.71 0.74 0.72 640
338
 
339
 
340
  #### Summary
 
354
  Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
355
 
356
  - **Hardware Type:** 1 X NVIDIA L40S
357
+ - **Hours used:** 4.18
358
  - **Cloud Provider:** N/A
359
  - **Compute Region:** N/A
360
  - **Carbon Emitted:** N/A
 
367
 
368
  ### Compute Infrastructure
369
 
370
+ - Linux 6.5.0-28-generic x86_64
371
+ - MemTotal: 527988292 kB
372
+ - 64 X Intel(R) Xeon(R) Silver 4314 CPU @ 2.40GHz
373
  - GPU_0: NVIDIA L40S
374
 
375
  #### Hardware