2
0

model_glm_130b_v100.sh 567 B

1234567891011121314151617
  # Model configuration fragment for the "glm-130b" model type.
  #
  # Defines four shell variables and runs no commands:
  #   MODEL_TYPE       - model identifier string.
  #   CHECKPOINT_PATH  - value substituted after --load; ships as a placeholder
  #                      and must be edited before use.
  #   MP_SIZE          - value substituted after --model-parallel-size.
  #   MODEL_ARGS       - single space-separated string of command-line flags.
  #
  # NOTE(review): presumably this file is sourced by a launcher script that
  # expands $MODEL_ARGS unquoted so it word-splits into separate arguments --
  # confirm against the caller. Flag semantics are defined by whatever program
  # receives them; they are passed through verbatim here.
  MODEL_TYPE="glm-130b"

  # Placeholder: replace with the real checkpoint location.
  # Because the value is embedded in MODEL_ARGS as plain text, a path containing
  # whitespace will break into several words if MODEL_ARGS is expanded unquoted.
  CHECKPOINT_PATH="<your checkpoint path>"

  MP_SIZE=8

  # MODEL_ARGS is assembled piece by piece instead of with backslash-newline
  # continuations so that the resulting string has exactly one space between
  # flags no matter how these source lines are indented.
  MODEL_ARGS="--model-parallel-size ${MP_SIZE}"

  # Model dimensions.
  MODEL_ARGS="${MODEL_ARGS} --num-layers 70 --hidden-size 12288 --inner-hidden-size 32768"
  MODEL_ARGS="${MODEL_ARGS} --vocab-size 150528 --num-attention-heads 96"
  MODEL_ARGS="${MODEL_ARGS} --max-sequence-length 2048"

  # Tokenizer and layer-norm placement.
  MODEL_ARGS="${MODEL_ARGS} --tokenizer-type icetk-glm-130B --layernorm-order post"

  # Checkpoint loading; CHECKPOINT_PATH is expanded now, at assignment time.
  MODEL_ARGS="${MODEL_ARGS} --load ${CHECKPOINT_PATH} --skip-init"

  # Precision and BMInf options.
  # NOTE(review): the unit of --bminf-memory-limit (25) is not stated in this
  # file -- confirm against the consumer's documentation.
  MODEL_ARGS="${MODEL_ARGS} --fp16 --bminf --bminf-memory-limit 25"