Bladeren bron

Add GLM-Base model

duzx16 2 jaar geleden
bovenliggende
commit
6615fdd072
2 gewijzigde bestanden met 12 toevoegingen en 1 verwijdering
  1. 12 0
      configs/model_glm_base.sh
  2. 0 1
      configs/model_glm_large_generation.sh

+ 12 - 0
configs/model_glm_base.sh

@@ -0,0 +1,12 @@
+MODEL_TYPE="glm-large-generation"  # NOTE(review): says "large-generation" but this file is configs/model_glm_base.sh; confirm this is intended
+CHECKPOINT_PATH="/zhangpai21/checkpoints/glm-base-en-blank"  # checkpoint location; passed to --load at the end of MODEL_ARGS
+MP_SIZE=1  # substituted into --model-parallel-size in MODEL_ARGS
+MODEL_ARGS="--model-parallel-size ${MP_SIZE} \
+            --vocab 30592 \
+            --num-layers 12 \
+            --hidden-size 768 \
+            --num-attention-heads 12 \
+            --max-sequence-length 513 \
+            --tokenizer-type glm_BertWordPieceTokenizer \
+            --tokenizer-model-type bert-base-uncased \
+            --load ${CHECKPOINT_PATH}"

+ 0 - 1
configs/model_glm_large_generation.sh

@@ -9,5 +9,4 @@ MODEL_ARGS="--model-parallel-size ${MP_SIZE} \
             --max-sequence-length 513 \
             --tokenizer-type glm_BertWordPieceTokenizer \
             --tokenizer-model-type bert-large-uncased \
-            --task-mask \
             --load ${CHECKPOINT_PATH}"