exdysa's picture
Update README.md
8447d1e verified
metadata
# Model-card metadata for the suzume-llama-3-8B multilingual ORPO model.
name: suzume-llama-3-8B-multilingual-orpo-borda-top25
license: cc-by-nc-4.0
tags:
  - lightblue
  - multilingual
  - text-generation
  - text2text-generation
  - natural language
  - translate
  - orpo
  - Meta
  - Llama
  - RichardErkhov
type:
  - 6GB
  - 8GB
  - llm
  - chat
  - multilingual
  - subsume
  - llama-3
config:
  - ctx=8192
  - 5bit
  - temp=0
resolutions: null
datasets:
  - lightblue/mitsu_full_borda
  - lightblue/tagengo-gpt4
  - megagonlabs/instruction_ja
  - openchat/openchat_sharegpt4_dataset
# ISO 639-1 language codes; Japanese is `ja` (`jp` is not a valid code).
language:
  - zh
  - fr
  - de
  - ja
  - ru
  - en
# NOTE(review): presumably file sizes in bytes — confirm against the repo files.
size:
  - 4920734016
  - 5732987200
use: null
shortcomings: null
sources:
  - https://arxiv.org/abs/2405.12612
  - https://arxiv.org/abs/2405.18952
funded_by: null
train_hardware: 4 x A100 (80GB)
pipeline_tag: text-generation
examples: Bonjour!

repo_clone_081924

# Model-card metadata for the suzume-llama-3-8B multilingual ORPO model.
name: suzume-llama-3-8B-multilingual-orpo-borda-top25
license: cc-by-nc-4.0
tags:
  - lightblue
  - multilingual
  - text-generation
  - text2text-generation
  - natural language
  - translate
  - orpo
  - Meta
  - Llama
  - RichardErkhov
type:
  - 6GB
  - 8GB
  - llm
  - chat
  - multilingual
  - subsume
  - llama-3
config:
  - ctx=8192
  - 5bit
  - temp=0
# Fields without a value are written as explicit null rather than left bare.
resolutions: null
datasets:
  - lightblue/mitsu_full_borda
  - lightblue/tagengo-gpt4
  - megagonlabs/instruction_ja
  - openchat/openchat_sharegpt4_dataset
# ISO 639-1 language codes; Japanese is `ja` (`jp` is not a valid code).
language:
  - zh
  - fr
  - de
  - ja
  - ru
  - en
# NOTE(review): presumably file sizes in bytes — confirm against the repo files.
size:
  - 4920734016
  - 5732987200
use: null
shortcomings: null
sources:
  - https://arxiv.org/abs/2405.12612
  - https://arxiv.org/abs/2405.18952
funded_by: null
train_hardware: 4 x A100 (80GB)
pipeline_tag: text-generation
examples: "Bonjour!"