Skip to content

Commit fc6f064

Browse files
hehesimida, Lin-Bert
authored and committed
gpt 13b ckpt
1 parent 9274e08 commit fc6f064

File tree

2 files changed

+20
-4
lines changed

2 files changed

+20
-4
lines changed

docs/model_cards/gpt2.md

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -321,7 +321,8 @@ GPT2支持文本生成和文本分类两个任务的评测。
321321
--eval_dataset_dir {your_path/wikitext-2.mindrecord} \
322322
--run_mode eval \
323323
--epochs 1
324-
# PerplexityMetric: {'PerplexityMetric': {'loss': 3.24, 'PPL': 25.55}
324+
# gpt2: PerplexityMetric: {'PerplexityMetric': {'loss': 3.24, 'PPL': 25.55}
325+
# gpt2_13b(需替换yaml文件): PerplexityMetric: {'PerplexityMetric': {'loss': 2.35, 'PPL': 10.49}
325326
```
326327

327328
- 文本分类:

mindformers/mindformer_book.py

Lines changed: 18 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -324,6 +324,8 @@ class MindFormerBook:
324324
_PROJECT_PATH, "configs/gpt2/run_gpt2_xl.yaml")),
325325
("gpt2_xl_lora", os.path.join(
326326
_PROJECT_PATH, "configs/gpt2/run_gpt2_xl_lora.yaml")),
327+
("gpt2_13b", os.path.join(
328+
_PROJECT_PATH, "configs/gpt2/run_gpt2_13b.yaml")),
327329
("llama_7b", os.path.join(
328330
_PROJECT_PATH, "configs/llama/run_llama_7b.yaml")),
329331
("llama_13b", os.path.join(
@@ -421,7 +423,8 @@ class MindFormerBook:
421423
'gpt2',
422424
'gpt2_lora',
423425
'gpt2_xl',
424-
'gpt2_xl_lora'
426+
'gpt2_xl_lora',
427+
'gpt2_13b'
425428
]),
426429
('llama', [
427430
'llama_7b',
@@ -510,7 +513,8 @@ class MindFormerBook:
510513
'gpt2',
511514
'gpt2_lora',
512515
'gpt2_xl',
513-
'gpt2_xl_lora'
516+
'gpt2_xl_lora',
517+
'gpt2_13b'
514518
]),
515519
('llama', [
516520
'llama_7b',
@@ -590,7 +594,8 @@ class MindFormerBook:
590594
'gpt2',
591595
'gpt2_lora',
592596
'gpt2_xl',
593-
'gpt2_xl_lora'
597+
'gpt2_xl_lora',
598+
'gpt2_13b'
594599
]),
595600
('llama', [
596601
'llama',
@@ -785,6 +790,10 @@ class MindFormerBook:
785790
['https://ascend-repo-modelzoo.obs.cn-east-2.myhuaweicloud.com'
786791
'/XFormer_for_mindspore/gpt2/gpt2_xl_lora.ckpt'
787792
]),
793+
('gpt2_13b',
794+
['https://ascend-repo-modelzoo.obs.cn-east-2.myhuaweicloud.com'
795+
'/XFormer_for_mindspore/gpt2/gpt2_13b.ckpt'
796+
]),
788797
('pangualpha_2_6b',
789798
['https://ascend-repo-modelzoo.obs.cn-east-2.myhuaweicloud.com'
790799
'/XFormer_for_mindspore/pangualpha/pangualpha_2_6b.ckpt'
@@ -1017,6 +1026,12 @@ class MindFormerBook:
10171026
'https://ascend-repo-modelzoo.obs.cn-east-2.myhuaweicloud.com'
10181027
'/XFormer_for_mindspore/gpt2/merges.txt'
10191028
]),
1029+
('gpt2_13b',
1030+
['https://ascend-repo-modelzoo.obs.cn-east-2.myhuaweicloud.com'
1031+
'/XFormer_for_mindspore/gpt2/vocab.json',
1032+
'https://ascend-repo-modelzoo.obs.cn-east-2.myhuaweicloud.com'
1033+
'/XFormer_for_mindspore/gpt2/merges.txt'
1034+
]),
10201035
('pangualpha_2_6b',
10211036
['https://ascend-repo-modelzoo.obs.cn-east-2.myhuaweicloud.com'
10221037
'/XFormer_for_mindspore/pangualpha/vocab.model'

0 commit comments

Comments
 (0)