Skip to content

Modify the environment variables and model configuration of the bench… #9725

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -127,6 +127,8 @@ function _train(){

# Environment setup performed before handing control to the shared benchmark
# runner script and parsing this script's arguments.
# Sets FLAGS_selected_gpus to device indices 0 through 7.
export FLAGS_selected_gpus="0,1,2,3,4,5,6,7"
# Prepend the parent directory of the current working directory to PYTHONPATH.
export PYTHONPATH=$(dirname "$PWD"):$PYTHONPATH
# The benchmark framework sets CUDA_MODULE_LOADING=LAZY by default, which
# affects case execution; drop this workaround once the framework is fixed.
unset CUDA_MODULE_LOADING

source ${BENCHMARK_ROOT}/scripts/run_model.sh # This script parses performance data from benchmark-compliant logs using analysis.py; if you only want training logs and are not doing integration testing you may comment this line out, but it must be enabled when submitting
# Forward this script's arguments to _set_params (defined outside this excerpt).
_set_params $@
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@
# See the License for the specific language governing permissions and
# limitations under the License.

# Benchmark case parameters, accumulated in `param` as space-separated
# key=value pairs.
# NOTE(review): model_item is assigned twice in a row; the second assignment
# overwrites the first, so only the "_dy2st" value takes effect. The first
# line looks like the pre-change side of a diff -- confirm and remove it.
param="model_item=baichuan-inc-baichuan-2-13b_pretrain "
param="model_item=baichuan-inc-baichuan-2-13b_pretrain_dy2st "
param+="run_mode=DP1_MP4_PP2_1F1B_Sharding4_Stage1 "
param+="device_num=N4C32 "
param+="global_batch_size=128 "
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -242,6 +242,8 @@ export FLAGS_enable_sharding_stage1_tensor_fusion=1
# Original note: only the 13b tasks need CUDA_DEVICE_MAX_CONNECTIONS enabled;
# "7b and 13b" have it disabled.
# NOTE(review): the original comment lists 13b in both the enabled and the
# disabled group -- confirm which model sizes actually require this setting.
export CUDA_DEVICE_MAX_CONNECTIONS=1
export PARALLEL_CROSS_ENTROPY=true
# The benchmark framework sets CUDA_MODULE_LOADING=LAZY by default, which
# affects case execution; drop this workaround once the framework is fixed.
unset CUDA_MODULE_LOADING

source ${BENCHMARK_ROOT}/scripts/run_model.sh # This script parses performance data from benchmark-compliant logs using analysis.py; if you only want training logs and are not doing integration testing you may comment this line out, but it must be enabled when submitting
# Forward this script's arguments to _set_params (defined outside this excerpt).
_set_params $@
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -246,6 +246,8 @@ export FLAGS_enable_sharding_stage1_tensor_fusion=1
# Original note: only the 13b tasks need CUDA_DEVICE_MAX_CONNECTIONS enabled;
# "7b and 13b" have it disabled.
# NOTE(review): the original comment lists 13b in both the enabled and the
# disabled group -- confirm which model sizes actually require this setting.
export CUDA_DEVICE_MAX_CONNECTIONS=1
export PARALLEL_CROSS_ENTROPY=true
# The benchmark framework sets CUDA_MODULE_LOADING=LAZY by default, which
# affects case execution; drop this workaround once the framework is fixed.
unset CUDA_MODULE_LOADING

source ${BENCHMARK_ROOT}/scripts/run_model.sh # This script parses performance data from benchmark-compliant logs using analysis.py; if you only want training logs and are not doing integration testing you may comment this line out, but it must be enabled when submitting
# Forward this script's arguments to _set_params (defined outside this excerpt).
_set_params $@
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -246,6 +246,8 @@ export FLAGS_enable_sharding_stage1_tensor_fusion=1
# Original note: only the 13b tasks need CUDA_DEVICE_MAX_CONNECTIONS enabled;
# "7b and 13b" have it disabled.
# NOTE(review): the original comment lists 13b in both the enabled and the
# disabled group -- confirm which model sizes actually require this setting.
export CUDA_DEVICE_MAX_CONNECTIONS=1
export PARALLEL_CROSS_ENTROPY=true
# The benchmark framework sets CUDA_MODULE_LOADING=LAZY by default, which
# affects case execution; drop this workaround once the framework is fixed.
unset CUDA_MODULE_LOADING

source ${BENCHMARK_ROOT}/scripts/run_model.sh # This script parses performance data from benchmark-compliant logs using analysis.py; if you only want training logs and are not doing integration testing you may comment this line out, but it must be enabled when submitting
# Forward this script's arguments to _set_params (defined outside this excerpt).
_set_params $@
Expand Down