#!/bin/bash
# generate.sh
#
# Launches generate.py under torchrun with a fixed set of generation options.
#
# Usage: generate.sh [extra generate.py arguments...]
#
# Any arguments given to this script are forwarded verbatim to generate.py,
# after the options set below.
#
# The script sources configs/model_glm_130b.sh, located relative to the parent
# of the directory containing this script. That config is presumably where
# MODEL_ARGS and MP_SIZE are defined (they are not set here) — verify against
# the config file.

# Resolve paths from the script's own location so it works from any cwd.
script_path=$(realpath "$0") || {
  printf 'error: cannot resolve script path: %s\n' "$0" >&2
  exit 1
}
script_dir=$(dirname "$script_path")
main_dir=$(dirname "$script_dir")

config_file="${main_dir}/configs/model_glm_130b.sh"
# shellcheck source=/dev/null
source "$config_file" || {
  printf 'error: failed to source config: %s\n' "$config_file" >&2
  exit 1
}

# Without MP_SIZE the torchrun command line would be malformed; fail early.
: "${MP_SIZE:?MP_SIZE must be set (expected from ${config_file})}"

SEED=1234
MAX_OUTPUT_LENGTH=256
MIN_GEN_LENGTH=0

# BeamSearchStrategy args
NUM_BEAMS=4
LENGTH_PENALTY=1.0
NO_REPEAT_NGRAM=3

# BaseStrategy args
TEMP=1.0
TOPK=0
TOPP=0.7

# MODEL_ARGS is a single shell-syntax string owned by the sourced config,
# which has already been executed as trusted code. It is re-parsed with eval
# (as the script always did) so quoting inside it keeps working. Arguments
# supplied by the caller are never passed through eval.
model_args=()
eval "model_args=( ${MODEL_ARGS:-} )"

# Build the command as an array so every argument keeps its word boundaries.
cmd=(
  torchrun --nproc_per_node "$MP_SIZE"
  "${main_dir}/generate.py"
  --seed "$SEED"
  --mode inference
  --sampling-strategy BaseStrategy
  --out-seq-length "$MAX_OUTPUT_LENGTH"
  --min-gen-length "$MIN_GEN_LENGTH"
  --num-beams "$NUM_BEAMS"
  --length-penalty "$LENGTH_PENALTY"
  --no-repeat-ngram-size "$NO_REPEAT_NGRAM"
  --temperature "$TEMP"
  --top_k "$TOPK"
  --top_p "$TOPP"
  --output-path samples
  "${model_args[@]}"
  "$@"
)

# Last command: the script's exit status is torchrun's exit status.
"${cmd[@]}"