Update README.md
Browse files
README.md
CHANGED
@@ -54,14 +54,14 @@ The model is pre-trained by [UER-py](https://github.com/dbiir/UER-py/) on [Tence
|
|
54 |
|
55 |
```
|
56 |
python3 preprocess.py --corpus_path corpora/poem.txt \
|
57 |
-
--vocab_path models/
|
58 |
--dataset_path poem_dataset.pt --processes_num 16 \
|
59 |
--seq_length 128 --data_processor lm
|
60 |
```
|
61 |
|
62 |
```
|
63 |
python3 pretrain.py --dataset_path poem_dataset.pt \
|
64 |
-
--vocab_path models/
|
65 |
--config_path models/gpt2/config.json \
|
66 |
--output_model_path models/poem_gpt2_model.bin \
|
67 |
--world_size 8 --gpu_ranks 0 1 2 3 4 5 6 7 \
|
|
|
54 |
|
55 |
```
|
56 |
python3 preprocess.py --corpus_path corpora/poem.txt \
|
57 |
+
--vocab_path models/google_zh_poem_vocab.txt \
|
58 |
--dataset_path poem_dataset.pt --processes_num 16 \
|
59 |
--seq_length 128 --data_processor lm
|
60 |
```
|
61 |
|
62 |
```
|
63 |
python3 pretrain.py --dataset_path poem_dataset.pt \
|
64 |
+
--vocab_path models/google_zh_poem_vocab.txt \
|
65 |
--config_path models/gpt2/config.json \
|
66 |
--output_model_path models/poem_gpt2_model.bin \
|
67 |
--world_size 8 --gpu_ranks 0 1 2 3 4 5 6 7 \
|