lomahony
/

eleuther-pythia410m-hh-sft

Text Generation

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

lomahony committed on Jul 21, 2023

Commit

3f2d1c9

•

1 Parent(s): 98e817d

First model version

Files changed (4) hide show

config.yaml +44 -0
optimizer.pt +3 -0
policy.pt +3 -0
scheduler.pt +3 -0

config.yaml ADDED Viewed

	@@ -0,0 +1,44 @@

+seed: 0
+exp_name: pythia410m_hh_ga4_dpo
+batch_size: 64
+eval_batch_size: 32
+debug: false
+fsdp_port: 12355
+datasets:
+- hh
+wandb:
+  enabled: true
+  entity: pythia_dpo
+  project: Pythia_LOM
+local_dirs:
+- /scr-ssd
+- /scr
+- .cache
+sample_during_eval: false
+n_eval_model_samples: 16
+do_first_eval: true
+local_run_dir: .cache/laura/pythia410m_hh_ga4_dpo_2023-07-19_13-02-35_532776
+lr: 1.0e-06
+gradient_accumulation_steps: 4
+max_grad_norm: 10.0
+max_length: 512
+max_prompt_length: 256
+n_epochs: 1
+n_examples: null
+n_eval_examples: 256
+trainer: FSDPTrainer
+optimizer: RMSprop
+warmup_steps: 150
+activation_checkpointing: false
+eval_every: 19968
+minimum_log_interval_secs: 1.0
+model:
+  name_or_path: EleutherAI/pythia-410m
+  tokenizer_name_or_path: null
+  archive: null
+  block_name: GPTNeoXLayer
+  policy_dtype: float32
+  fsdp_policy_mp: bfloat16
+  reference_dtype: float16
+loss:
+  name: sft

optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d61e9f7ae162b6ca0f3e6f4310f307a45d8d5f0718a757228d7f9e8d877108df
+size 1621435717

policy.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7d5342d3950db163bc8bacb6d0a7eac25502526a3066e30cfd134a6f9da6d9a
+size 1722144187

scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef3bb892ec5f85ebcd911ec0358781fc843702c92bef54eec6bc38b127a23878
+size 627