mirror of
https://github.com/tencentmusic/cube-studio.git
synced 2024-12-15 06:09:57 +08:00
.. | ||
build.sh | ||
demo.py | ||
Dockerfile | ||
launcher.py | ||
README.md | ||
tensorflow-mnist.yaml |
horovod 模板
镜像:ccr.ccs.tencentyun.com/cube-studio/horovod:20210401
k8s账号:kubeflow-pipeline
启动参数:
{
"参数": {
"--work_images": {
"type": "str",
"item_type": "str",
"label": "worker的运行镜像,直接运行你代码的环境镜像 <a target='_blank' href='https://github.com/tencentmusic/cube-studio/tree/master/images'>基础镜像</a>",
"require": 1,
"choice": [],
"range": "",
"default": "ccr.ccs.tencentyun.com/cube-studio/horovod:20210401",
"placeholder": "",
"describe": "worker的运行镜像",
"editable": 1,
"condition": "",
"sub_args": {}
},
"--working_dir": {
"type": "str",
"item_type": "str",
"label": "命令的启动目录",
"require": 1,
"choice": [],
"range": "",
"default": "/mnt/xxx/horovod/",
"placeholder": "",
"describe": "命令的启动目录",
"editable": 1,
"condition": "",
"sub_args": {}
},
"--command": {
"type": "str",
"item_type": "str",
"label": "训练启动命令",
"require": 1,
"choice": [],
"range": "",
"default": "python /mnt/admin/demo.py",
"placeholder": "",
"describe": "训练启动命令",
"editable": 1,
"condition": "",
"sub_args": {}
},
"--num_worker": {
"type": "str",
"item_type": "str",
"label": "分布式worker的数目",
"require": 1,
"choice": [],
"range": "",
"default": "2",
"placeholder": "",
"describe": "分布式worker的数目",
"editable": 1,
"condition": "",
"sub_args": {}
}
}
}