Update README.md
Browse files
README.md
CHANGED
|
@@ -91,7 +91,7 @@ Taking the case of ALBERT-Base
|
|
| 91 |
Stage1:
|
| 92 |
|
| 93 |
```
|
| 94 |
-
python3 preprocess.py --corpus_path corpora/
|
| 95 |
--vocab_path models/google_zh_vocab.txt \
|
| 96 |
--dataset_path cluecorpussmall_albert_seq128_dataset.pt \
|
| 97 |
--seq_length 128 --processes_num 32 --data_processor albert
|
|
@@ -110,7 +110,7 @@ python3 pretrain.py --dataset_path cluecorpussmall_albert_seq128_dataset.pt \
|
|
| 110 |
Stage2:
|
| 111 |
|
| 112 |
```
|
| 113 |
-
python3 preprocess.py --corpus_path corpora/
|
| 114 |
--vocab_path models/google_zh_vocab.txt \
|
| 115 |
--dataset_path cluecorpussmall_albert_seq512_dataset.pt \
|
| 116 |
--seq_length 512 --processes_num 32 --data_processor albert
|
|
|
|
| 91 |
Stage1:
|
| 92 |
|
| 93 |
```
|
| 94 |
+
python3 preprocess.py --corpus_path corpora/cluecorpussmall_bert.txt \
|
| 95 |
--vocab_path models/google_zh_vocab.txt \
|
| 96 |
--dataset_path cluecorpussmall_albert_seq128_dataset.pt \
|
| 97 |
--seq_length 128 --processes_num 32 --data_processor albert
|
|
|
|
| 110 |
Stage2:
|
| 111 |
|
| 112 |
```
|
| 113 |
+
python3 preprocess.py --corpus_path corpora/cluecorpussmall_bert.txt \
|
| 114 |
--vocab_path models/google_zh_vocab.txt \
|
| 115 |
--dataset_path cluecorpussmall_albert_seq512_dataset.pt \
|
| 116 |
--seq_length 512 --processes_num 32 --data_processor albert
|