修复模板启动

This commit is contained in:
pengluan 2022-08-02 16:00:01 +08:00
parent 6cae3236c9
commit 85b8906384
6 changed files with 9 additions and 8 deletions

View File

@@ -78,6 +78,10 @@ https://github.com/tencentmusic/cube-studio/wiki
<br>
<br>
[![Stargazers repo roster for @tencentmusic/cube-studio](https://reporoster.com/stars/tencentmusic/cube-studio)](https://github.com/tencentmusic/cube-studio/stargazers)
[![Forkers repo roster for @tencentmusic/cube-studio](https://reporoster.com/forks/tencentmusic/cube-studio)](https://github.com/tencentmusic/cube-studio/network/members)
# 落地公司
![image](https://user-images.githubusercontent.com/20157705/176909239-f24cbf8d-8fb5-4326-abed-6fbc3f5a2d1f.png)

View File

@@ -41,7 +41,7 @@ KFJ_TASK_RESOURCE_CPU = os.getenv('KFJ_TASK_RESOURCE_CPU', '')
KFJ_TASK_RESOURCE_MEMORY = os.getenv('KFJ_TASK_RESOURCE_MEMORY', '')
NUM_WORKER = 3
COMMAND=''
WORK_IMAGES='csighub.tencentyun.com/tme-kubeflow/horovod:cpu-20210401'
WORK_IMAGES='ccr.ccs.tencentyun.com/cube-studio/horovod:20210401'
WORKIMG_DIR ='/mnt/admin'
k8s_volumes, k8s_volume_mounts = k8s_client.get_volume_mounts(KFJ_TASK_VOLUME_MOUNT,KFJ_CREATOR)

View File

@@ -284,7 +284,7 @@ if __name__ == "__main__":
arg_parser.add_argument('--working_dir', type=str, help="运行job的工作目录,需要分布式存储", default='')
arg_parser.add_argument('--num_worker', type=int, help="workder数量", default=3)
arg_parser.add_argument('--user_cmd', type=str, help="执行命令", default='./run.sh')
arg_parser.add_argument('--image', type=str, help="worker的镜像", default='mirrors.tencent.com/raw-kaldi/liutaozhang_kaldi_gpu:latest')
arg_parser.add_argument('--image', type=str, help="worker的镜像", default='ccr.ccs.tencentyun.com/cube-studio/kaldi_distributed_worker:v1')
args = arg_parser.parse_args()
logging.info("{} args: {}".format(__file__, args))

View File

@@ -5,9 +5,8 @@ RUN git clone https://github.com/pjreddie/darknet.git
RUN cd darknet && sed -i 's@OPENMP=0@OPENMP=1@g' Makefile && make
COPY setup_args.py /app
COPY launcher.sh /app
RUN wget https://pengluan-76009.sz.gfp.tencent-cloud.com/github/yolov3.weights
RUN wget https://pengluan-76009.sz.gfp.tencent-cloud.com/github/coco_data_sample.zip
RUN wget https://docker-76009.sz.gfp.tencent-cloud.com/github/cube-studio/service/yolov3.weights
RUN wget https://docker-76009.sz.gfp.tencent-cloud.com/github/cube-studio/pipeline/coco_data_sample.zip
RUN unzip coco_data_sample.zip && cd coco_data_sample && bash reset_list.sh
RUN apt install -y python3.6-dev python3-pip libsasl2-dev libpq-dev \

View File

@@ -1,2 +0,0 @@
from .tdw_exceptions import TDWFailedException
from .tdw_exceptions import TDWNoResException

View File

@@ -7,7 +7,7 @@ from ..constants import ModelStatus
from ..exceptions.model_repo_exception import *
from ..context import KFJobContext
API_BASE_URL = "http://kubeflow.music.woa.com"
API_BASE_URL = "http://kubeflow-dashboard.infra"
INNER_API_BASE_URL = "http://kubeflow-dashboard.infra"
MODEL_API_URI = "training_model_modelview/api"
DEPLOY_API_URI = "training_model_deploy_modelview/api"