mirror of
https://github.com/tencentmusic/cube-studio.git
synced 2025-03-07 15:08:51 +08:00
fix pipeline bug
This commit is contained in:
parent
17f52ff74e
commit
af56a4e486
19
install/kubernetes/config
Normal file
19
install/kubernetes/config
Normal file
@ -0,0 +1,19 @@
|
||||
apiVersion: v1
|
||||
clusters:
|
||||
- cluster:
|
||||
certificate-authority-data: LS0tLS1CRUdJTiBDRVJUSUZJQ0FURS0tLS0tCk1JSUMvakNDQWVhZ0F3SUJBZ0lCQURBTkJna3Foa2lHOXcwQkFRc0ZBREFWTVJNd0VRWURWUVFERXdwcmRXSmwKY201bGRHVnpNQjRYRFRJME1EUXdOVEF5TXpReU0xb1hEVE0wTURRd016QXlNelF5TTFvd0ZURVRNQkVHQTFVRQpBeE1LYTNWaVpYSnVaWFJsY3pDQ0FTSXdEUVlKS29aSWh2Y05BUUVCQlFBRGdnRVBBRENDQVFvQ2dnRUJBTVpuClcyZ3J0Z3VNQzFNWGVXQTN1TlNCb3lSQXhqbkVBaUVaV1gxMVlBNTBMeVBHZlVjaGVEdVVkVG9UZTJaSXJ0ZXUKK1JlSnNSbitVOUtxNXVWeFcxZUxWNVR2QnFINXNlU1ROL3ZuV0U4L3ZzREl3SFlUK2c2RDA2ZWpVWk44OG1kOQpxQTEwditTYWlQU29DT2tqWjhIU2lVZDZJRWg0M2sxNm9QRnRNOHFyd2E4REhRZkxPQlEvbmFXeVNUWnF6VWVpCmhVdWFVZnZ1UW9mMmJZQWMrekRycnBLZlNWSExBQUE1SThwZnZYUjRxVk5HZVJoalhpbzRrcUxTSWZ0cEV3b3MKUENUek9mUklaMHk1blo3elh6dXA0ZzZaVDBLeCtkTFZkY25lc01McDlBU2VrVzJvTG5sRUZNNTBGR3BvSitkYgpjMWYxejFrVkt5Qk9CeFJuc1hjQ0F3RUFBYU5aTUZjd0RnWURWUjBQQVFIL0JBUURBZ0trTUE4R0ExVWRFd0VCCi93UUZNQU1CQWY4d0hRWURWUjBPQkJZRUZFMVZOOGRsVVJGdHQvbG5sY3lnV1FWTFlhTXVNQlVHQTFVZEVRUU8KTUF5Q0NtdDFZbVZ5Ym1WMFpYTXdEUVlKS29aSWh2Y05BUUVMQlFBRGdnRUJBRnRmR24ycVpyN1dZUzlHTjZzbwpuZDdhVjlISExmaXpLRGt0SUo3NEdpRVBqbm1tQitxRDQwR1ZYNklTY3dtRGV6SVY2RzRXNU15b1JRTTBpRTczCkNuWEMxNURZSG50V2NXeXg3QWg5eVVCdzNaYW1HWE9qUUpHdWxZem1GbzQ5MjhjUEF6NVhyMFFyYUlJWG1VczgKSkZQWGpkYVVBVDVuVnQyNUtCSTBCK3JUaVVNTm9XMkRWRUJWODRUcWpOa05GM2RhRHB6dVpNZWZYOUpqeVcvVAp6Zzc5ZU1abnhSaHhZQlFpZHV4aXJlK2E0Ynl0UW5iN2JDVjBYZGtMdEI3L1RhT1R2U3NuUzMxTkpZa3pkeS90CkZiNGpGM3hSUkFlbi8xaTNFSHhqelA2QnlkVENaS2hoT1IxcWR0WkNiUldvd0V2ZEUrd0RZU3lNVmZyS05LRnUKZWFVPQotLS0tLUVORCBDRVJUSUZJQ0FURS0tLS0tCg==
|
||||
server: https://172.16.210.4:6443
|
||||
name: kubernetes
|
||||
contexts:
|
||||
- context:
|
||||
cluster: kubernetes
|
||||
user: kubernetes-admin
|
||||
name: kubernetes-admin@kubernetes
|
||||
current-context: kubernetes-admin@kubernetes
|
||||
kind: Config
|
||||
preferences: {}
|
||||
users:
|
||||
- name: kubernetes-admin
|
||||
user:
|
||||
client-certificate-data: LS0tLS1CRUdJTiBDRVJUSUZJQ0FURS0tLS0tCk1JSURJVENDQWdtZ0F3SUJBZ0lJYy9KM0VyM21lS3N3RFFZSktvWklodmNOQVFFTEJRQXdGVEVUTUJFR0ExVUUKQXhNS2EzVmlaWEp1WlhSbGN6QWVGdzB5TkRBME1EVXdNak0wTWpOYUZ3MHlOVEEwTURVd01qTTBNalphTURReApGekFWQmdOVkJBb1REbk41YzNSbGJUcHRZWE4wWlhKek1Sa3dGd1lEVlFRREV4QnJkV0psY201bGRHVnpMV0ZrCmJXbHVNSUlCSWpBTkJna3Foa2lHOXcwQkFRRUZBQU9DQVE4QU1JSUJDZ0tDQVFFQXhpZTVUeU9zN0ozTG1FWjAKZmVqd3pVU2UvSkd0a3k2STBnb0t1SDJQNW16bDY0RUwrbnk3ak1PTjRnNUdsNzFTbnAwWDd3SDZ6QThBRC91eApZcENaeGR6WCtoWXBpdVdkWDY4WFNhS1pNQThaMllMVHg5dmxFNEJPQTg0alRBWGVMeVF6RTJ3UnJKNkNtSHNtCnRiMDN3d1BGNlFxRkE3aDIzbE0ydXljMkxwUDhXWDJrY3pRR1B1MHQySmlmZGhMYnJ1UGRNSjRCKzg3YlNWWVoKS0NFL01VdVVBcDJIeEZUNVI3N29YN1hLTk5rbmhyOXh4ZExyem9wc0kxWEdGSmUyc0dsWkJ1YUg4enZPdVhuZApFZ3Y1ZkNnV0g4VnhIRFh4TE5sQ2lZWEl3ZU1melRjckVVQTNrV2Y5bEhVUDdrQjVLdzlRbUpmejVEaHRvOHpTClp0cDB3UUlEQVFBQm8xWXdWREFPQmdOVkhROEJBZjhFQkFNQ0JhQXdFd1lEVlIwbEJBd3dDZ1lJS3dZQkJRVUgKQXdJd0RBWURWUjBUQVFIL0JBSXdBREFmQmdOVkhTTUVHREFXZ0JSTlZUZkhaVkVSYmJmNVo1WE1vRmtGUzJHagpMakFOQmdrcWhraUc5dzBCQVFzRkFBT0NBUUVBY2dhNGxsWk5TcW9uOUkvcTd5cGp1UHdQRFFHci9ZNGlqMGRwCnFKdlpRR053SzFrVTQxZHEzZ1VTWlRKenBvbTVnempZNTI4ZjRNMFhaUnM1WFdlSDhLWm9sQ0FmMGVNQ2o5eE8KWFprT2wwUmc5aVRoTzdlUUEzbmVmZXgweFZKNGZsVExXTnErNW8xdjVKT3dmMk80M1U2aldJSmxqVWFxSi8ySgpNbzlZblBRMGhacFE1Q1h3eTZ2c3JsY3lvTUwxQkN0djY5SkwvNmVqVUtweUlYREwzbzEvdGR6dytGbVFwNGNYCkU4TWNLQ2JRZHJmQzJUOS9YM0lyTHhXODZhNlhZcUc5R1REbXJ3andrekp2bEVSa00zV21Nditnd09KVnR6MEEKbEUvdWlmRjFvK0VBQlpIdkpiNXBobG8xOGNucVB1RmZzVjdKSTk0cE1KTmUzWmsralE9PQotLS0tLUVORCBDRVJUSUZJQ0FURS0tLS0tCg==
|
||||
client-key-data: LS0tLS1CRUdJTiBSU0EgUFJJVkFURSBLRVktLS0tLQpNSUlFcFFJQkFBS0NBUUVBeGllNVR5T3M3SjNMbUVaMGZland6VVNlL0pHdGt5NkkwZ29LdUgyUDVtemw2NEVMCitueTdqTU9ONGc1R2w3MVNucDBYN3dINnpBOEFEL3V4WXBDWnhkelgraFlwaXVXZFg2OFhTYUtaTUE4WjJZTFQKeDl2bEU0Qk9BODRqVEFYZUx5UXpFMndScko2Q21Ic210YjAzd3dQRjZRcUZBN2gyM2xNMnV5YzJMcFA4V1gyawpjelFHUHUwdDJKaWZkaExicnVQZE1KNEIrODdiU1ZZWktDRS9NVXVVQXAySHhGVDVSNzdvWDdYS05Oa25ocjl4CnhkTHJ6b3BzSTFYR0ZKZTJzR2xaQnVhSDh6dk91WG5kRWd2NWZDZ1dIOFZ4SERYeExObENpWVhJd2VNZnpUY3IKRVVBM2tXZjlsSFVQN2tCNUt3OVFtSmZ6NURodG84elNadHAwd1FJREFRQUJBb0lCQVFDTW5xd1d5VTV5TEJqTApXMVJYOWZMTStLR0t3eWJXaC9ONGVyL1k1T0kxdDVvQ1luWEpzTEszMWg3ZUNSdDNtMWNDVUtFbmI5UTI4MzRyCjJZV3NXTW1IYkkyb1lBbmpFOGQybTU1L0Z2QjI5b0IxcHkzN2FzVko3WWR2azkzZ21WbHZRdFVzTjBqam95a3kKWkZLNExpdGdMVkZKYTdteFJqcTAwNERIbDdBUHBKMTZXeVZEcmt6UkwrM2FWeFNuZEo1RjM5TU1jbE0vTG5LMQo5TEtvVjVKK01KaHE2Y2w1akZVVlkyV0c3VVJOZFB0NkNEa3ZJaDR6Sy9CTHJZbUozM0R6YlpwWUdkSGttTStTCkpYYktLUmNVNys5UTBUQ2lTOWs4Szd1WDZTaCtqNkorVXBaQXRwblVlK0dxcHFnTjNhOFFMOW1mQmZkc3lEczcKdjNWUkdGVUJBb0dCQU4wRFZCVUV5S3M0aDNaVWd0UXpDZHdrUFJQazVwMmxFRGoxZmp1RFdwR1lUMmFrckdmdQp6Vjhxa3gvMEdwMzNUMS9zTWM4M01xZ3pLdXp1Q1dzaGQwV2VKRUZQbnRrcnFBcHpPdkdrSkozeUx3SzluOUlTCjRXZFZOeFFKRWN6NnZGZWxGNjByYWVnMGpieno4TjNWUVlaYVNXTC9Zb0tEelBUWXZCQy9sSFdKQW9HQkFPV0cKRWNpQitUYUZ2bU15bDZqM1lCR2F2Q052VDd2MkNKVEl6Zm41aURMQVJRcWdMbHArTW80YTFhSXZUbWE1K2FzcAppYmhicy9ES2k1Uk5vOGZyTEVXTWJxRmNnQVBkWWNOM0tkZnlHVWx6aFRId21VdFpsUWZxYU1oaXMvYjZ5RWFvCjVoRUFoSmFZVmNLUHgva3QwS21DSEI0V2NxTis4REhPNTF0M1ZPOTVBb0dBVEVJNnYrbmZwNXlndVFhZUFjUCsKa2ZQN0V5TTNJNHZ4MWdWMjRlZ0gxeGJieHNucEp3OXgwM1ZvUUcxRXhkNndoNk9DNkVIZWU4VHorYjZFaDIrTApyUHpNKzdBU1dsTEM3NkFrNVgzQ21MRVk0WFEyY2hETHI1RHFxVUliMzBOZ3Uwa2VxMFRBalR1YzhHYW5aSk9SCndWN2oxWUhUSnI5OWQ3cFU0ZDZJeGlrQ2dZRUFxRXFPZlhzM2RNL0owa2hGUldIa3NlUEg4UjlyMGtESzkvVG8KZWxLSmw5UzhpdGI2UmVYa1FhZlJYckxiQkoxMlFCY2I0TzUwV0tqYWdTb1FYY1RFMkZYb3hDM2p1M0cyZmpEQQpvSkxtRWFJL1ZtZTRyclFIZng5VUp5R2dIUWF5bElUQTlGUng0MDNkQytTSzF0ek44NHZ2Kyt1dnNNdWhhSlB4CnRYSWc5OWtDZ1lFQWh5eG44YUwreTdtZWZ
UeWx1SFg3Z0duQVNRVGRJQUp0TnU3L2lGSURQVVR0RTEwenRXazcKZmNSNFpGdmt6c2p6VkVRcjgxZnhiVDBHWjBzOCtXaTNWcy93RXhrSCtkUXRlTlBGT2pkaEJPWUh6U1QyQnNJNApMUUtDeFJ2ODVCNVJFaXJLREhxTE8zSHo0SElxWUVjeHNkVUpwQUpzZ3J4TUh4ZkkvdkFsTGRVPQotLS0tLUVORCBSU0EgUFJJVkFURSBLRVktLS0tLQo=
|
@ -0,0 +1,29 @@
|
||||
# Helm post-install hook Job that installs Istio into the cluster.
# It applies the Istio CRDs, waits for them to be established, applies the
# Istio 1.15.0 install manifest plus the gateway / virtual-service manifests,
# and finally sets the node IP taken from .Values.nodeLabels.nodeIP as an
# externalIP on the istio-ingressgateway Service.
apiVersion: batch/v1
kind: Job
metadata:
  name: istio-setup
  annotations:
    "helm.sh/hook": post-install
    "helm.sh/hook-weight": "1"
    # Remove the Job left over from a previous release before creating this one.
    "helm.sh/hook-delete-policy": before-hook-creation
spec:
  template:
    spec:
      serviceAccountName: istio-installer
      containers:
        - name: setup
          # Custom kubectl image. This pod mounts no volumes, so the /istio
          # manifests referenced below are expected to be baked into the image.
          # NOTE(review): the tag is a floating `latest` - consider pinning it.
          image: gaoxin2020/kubectl-cube:latest
          command: ["/bin/sh"]
          # `set -e` aborts on the first failing step. Without it only the exit
          # status of the final `kubectl patch` decided whether the hook
          # succeeded, so a failed apply or a timed-out wait went unnoticed.
          args:
            - -c
            - |
              set -e
              kubectl apply -f /istio/install-crd.yaml
              kubectl wait crd/envoyfilters.networking.istio.io --for condition=established --timeout=60s
              kubectl apply -f /istio/install-1.15.0.yaml
              kubectl wait crd/virtualservices.networking.istio.io --for condition=established --timeout=60s
              kubectl wait crd/gateways.networking.istio.io --for condition=established --timeout=60s
              kubectl apply -f /istio/gateway.yaml
              kubectl apply -f /istio/virtual.yaml
              kubectl patch svc istio-ingressgateway -n istio-system -p '{"spec":{"externalIPs":["'"{{ .Values.nodeLabels.nodeIP }}"'"]}}'
      restartPolicy: Never
|
@ -0,0 +1,23 @@
|
||||
# Helm post-install hook Job that applies every manifest found under
# /training-crd/ with kubectl.
apiVersion: batch/v1
kind: Job
metadata:
  name: kubeflow-crd-job
  annotations:
    helm.sh/hook: post-install
    helm.sh/hook-weight: "1"
    # Delete the Job from a previous release before this one is created.
    helm.sh/hook-delete-policy: before-hook-creation
spec:
  template:
    spec:
      restartPolicy: Never
      serviceAccountName: istio-installer
      containers:
        - name: setup
          # Custom kubectl image. No volumes are mounted in this pod, so the
          # /training-crd/ directory is expected to be part of the image.
          image: gaoxin2020/kubectl-cube:latest
          command:
            - /bin/sh
          args:
            - -c
            - |
              kubectl apply -f /training-crd/
|
||||
|
@ -668,24 +668,23 @@ data:
|
||||
}
|
||||
}
|
||||
|
||||
GLOBAL_ENV={
|
||||
"KFJ_PIPELINE_ID":"\{\{pipeline_id\}\}",
|
||||
"KFJ_RUN_ID":"\{\{uuid.uuid4().hex\}\}",
|
||||
"KFJ_CREATOR":"\{\{creator\}\}",
|
||||
"KFJ_RUNNER":"\{\{runner\}\}",
|
||||
"KFJ_MODEL_REPO_API_URL":"http://kubeflow-dashboard.infra",
|
||||
"KFJ_ARCHIVE_BASE_PATH":"/archives",
|
||||
"KFJ_PIPELINE_NAME":"\{\{pipeline_name\}\}",
|
||||
"KFJ_NAMESPACE":"pipeline",
|
||||
"KFJ_GPU_MEM_MIN":"13G",
|
||||
"KFJ_GPU_MEM_MAX":"13G",
|
||||
"KFJ_ENVIRONMENT":"\{\{cluster_name\}\}",
|
||||
}
|
||||
|
||||
GLOBAL_ENV={
|
||||
"KFJ_PIPELINE_ID": "{{ "{{" }}pipeline_id{{ "}}" }}",
|
||||
"KFJ_RUN_ID": "{{ "{{" }}uuid.uuid4().hex{{ "}}" }}",
|
||||
"KFJ_CREATOR": "{{ "{{" }}creator{{ "}}" }}",
|
||||
"KFJ_RUNNER": "{{ "{{" }}runner{{ "}}" }}",
|
||||
"KFJ_MODEL_REPO_API_URL": "http://kubeflow-dashboard.infra",
|
||||
"KFJ_ARCHIVE_BASE_PATH": "/archives",
|
||||
"KFJ_PIPELINE_NAME": "{{ "{{" }}pipeline_name{{ "}}" }}",
|
||||
"KFJ_NAMESPACE": "pipeline",
|
||||
"KFJ_GPU_MEM_MIN": "13G",
|
||||
"KFJ_GPU_MEM_MAX": "13G",
|
||||
"KFJ_ENVIRONMENT": "{{ "{{" }}cluster_name{{ "}}" }}",
|
||||
}
|
||||
GPU_RESOURCE={
|
||||
"gpu":"nvidia.com/gpu"
|
||||
}
|
||||
|
||||
DEFAULT_GPU_RESOURCE_NAME='nvidia.com/gpu'
|
||||
|
||||
# 配置禁用gpu的方法,不然对复合共用型机器,gpu会被共享使用
|
||||
@ -737,8 +736,8 @@ data:
|
||||
# 用户常用默认镜像
|
||||
USER_IMAGE = 'ccr.ccs.tencentyun.com/cube-studio/ubuntu-gpu:cuda11.8.0-cudnn8-python3.9'
|
||||
# notebook每个pod使用的用户账号
|
||||
JUPYTER_ACCOUNTS='jupyter-user'
|
||||
HUBSECRET_NAMESPACE=[PIPELINE_NAMESPACE,AUTOML_NAMESPACE,NOTEBOOK_NAMESPACE,SERVICE_NAMESPACE]
|
||||
JUPYTER_ACCOUNTS=''
|
||||
HUBSECRET_NAMESPACE=[PIPELINE_NAMESPACE,AUTOML_NAMESPACE,NOTEBOOK_NAMESPACE,SERVICE_NAMESPACE,AIHUB_NAMESPACE]
|
||||
|
||||
# notebook使用的镜像
|
||||
NOTEBOOK_IMAGES=[
|
||||
@ -749,6 +748,9 @@ data:
|
||||
['ccr.ccs.tencentyun.com/cube-studio/notebook:jupyter-ubuntu-bigdata', 'jupyter(bigdata)'],
|
||||
['ccr.ccs.tencentyun.com/cube-studio/notebook:jupyter-ubuntu-machinelearning', 'jupyter(machinelearning)'],
|
||||
['ccr.ccs.tencentyun.com/cube-studio/notebook:jupyter-ubuntu-deeplearning', 'jupyter(deeplearning)'],
|
||||
['ccr.ccs.tencentyun.com/cube-studio/notebook:enterprise-jupyter-ubuntu-cpu-pro', 'jupyter-conda-pro(企业版)'],
|
||||
['ccr.ccs.tencentyun.com/cube-studio/notebook:enterprise-matlab-ubuntu-deeplearning', 'matlab(企业版)'],
|
||||
['ccr.ccs.tencentyun.com/cube-studio/notebook:enterprise-rstudio-ubuntu-bigdata', 'rstudio(企业版)'],
|
||||
]
|
||||
|
||||
# 定时检查大小的目录列表。需要再celery中启动检查任务
|
||||
@ -773,7 +775,7 @@ data:
|
||||
|
||||
# 数据集的存储地址
|
||||
DATASET_SAVEPATH = '/dataset/'
|
||||
STORE_TYPE="cos"
|
||||
STORE_TYPE="" # 目前不支持备份到云上
|
||||
STORE_CONFIG = {
|
||||
"appid": "xx",
|
||||
"secret_id": "xx",
|
||||
@ -785,6 +787,8 @@ data:
|
||||
}
|
||||
|
||||
K8S_DASHBOARD_CLUSTER = '/k8s/dashboard/cluster/' #
|
||||
BLACK_PORT = [10250] # 黑名单端口,cube-studio将不会占用这些端口,10250是kubelet的端口。
|
||||
|
||||
K8S_NETWORK_MODE = 'iptables' # iptables ipvs
|
||||
NOTEBOOK_EXCLUSIVE = False # notebook 启动是否独占资源
|
||||
SERVICE_EXCLUSIVE = False # 内部服务 启动是否独占资源
|
||||
@ -815,10 +819,10 @@ data:
|
||||
]
|
||||
|
||||
# 推理服务的各种配置
|
||||
TFSERVING_IMAGES=['ccr.ccs.tencentyun.com/cube-studio/tfserving:1.14.0','ccr.ccs.tencentyun.com/cube-studio/tfserving:1.14.0-gpu','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.0.0','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.0.0-gpu','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.1.4','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.1.4-gpu','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.2.3','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.2.3-gpu','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.3.4','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.3.4-gpu','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.4.3','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.4.3-gpu','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.5.2','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.5.2-gpu','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.6.0','ccr.ccs.tencentyun.com/cube-studio/tfserving:2.6.0-gpu']
|
||||
TORCHSERVER_IMAGES=['ccr.ccs.tencentyun.com/cube-studio/torchserve:0.6.0-cpu','ccr.ccs.tencentyun.com/cube-studio/torchserve:0.6.0-gpu','ccr.ccs.tencentyun.com/cube-studio/torchserve:0.5.3-cpu','ccr.ccs.tencentyun.com/cube-studio/torchserve:0.5.3-gpu','ccr.ccs.tencentyun.com/cube-studio/torchserve:0.4.2-cpu','ccr.ccs.tencentyun.com/cube-studio/torchserve:0.4.2-gpu']
|
||||
TFSERVING_IMAGES=['tensorflow/serving:2.14.1-gpu','tensorflow/serving:2.14.1','tensorflow/serving:2.13.1-gpu','tensorflow/serving:2.13.1','tensorflow/serving:2.12.2-gpu','tensorflow/serving:2.12.2','tensorflow/serving:2.11.1-gpu','tensorflow/serving:2.11.1','tensorflow/serving:2.10.1-gpu','tensorflow/serving:2.10.1','tensorflow/serving:2.9.3-gpu','tensorflow/serving:2.9.3','tensorflow/serving:2.8.4-gpu','tensorflow/serving:2.8.4','tensorflow/serving:2.7.4-gpu','tensorflow/serving:2.7.4','tensorflow/serving:2.6.5-gpu','tensorflow/serving:2.6.5','tensorflow/serving:2.5.4-gpu','tensorflow/serving:2.5.4']
|
||||
TORCHSERVER_IMAGES=['pytorch/torchserve:0.9.0-gpu','pytorch/torchserve:0.9.0-cpu','pytorch/torchserve:0.8.2-gpu','pytorch/torchserve:0.8.2-cpu','pytorch/torchserve:0.7.1-gpu','pytorch/torchserve:0.7.1-cpu']
|
||||
ONNXRUNTIME_IMAGES=['ccr.ccs.tencentyun.com/cube-studio/onnxruntime:latest','ccr.ccs.tencentyun.com/cube-studio/onnxruntime:latest-cuda']
|
||||
TRITONSERVER_IMAGES=['ccr.ccs.tencentyun.com/cube-studio/tritonserver:22.07-py3','ccr.ccs.tencentyun.com/cube-studio/tritonserver:21.12-py3','ccr.ccs.tencentyun.com/cube-studio/tritonserver:21.09-py3']
|
||||
TRITONSERVER_IMAGES=['ccr.ccs.tencentyun.com/cube-studio/tritonserver:24.01-py3','ccr.ccs.tencentyun.com/cube-studio/tritonserver:23.12-py3','ccr.ccs.tencentyun.com/cube-studio/tritonserver:22.12-py3','ccr.ccs.tencentyun.com/cube-studio/tritonserver:21.12-py3','ccr.ccs.tencentyun.com/cube-studio/tritonserver:20.12-py3']
|
||||
|
||||
INFERNENCE_IMAGES={
|
||||
"tfserving":TFSERVING_IMAGES,
|
||||
@ -895,7 +899,7 @@ data:
|
||||
"pipeline": "/frontend/train/train_task/pipeline",
|
||||
"runhistory": "/frontend/train/train_task/runhistory",
|
||||
"workflow": "/frontend/train/train_task/workflow",
|
||||
"nni": "/frontend/train/train_hyperparameter/nni",
|
||||
"nni": "/frontend/train/automl/hyperparameter_search",
|
||||
|
||||
"total_resource": "/frontend/service/total_resource",
|
||||
"service": "/frontend/service/k8s_service",
|
||||
@ -923,25 +927,32 @@ data:
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
|
||||
HOST = CLUSTERS[ENVIRONMENT].get('HOST',None)
|
||||
entrypoint.sh: |+
|
||||
#!/bin/bash
|
||||
|
||||
set -ex
|
||||
|
||||
rm -rf /home/myapp/myapp/static/assets
|
||||
rm -f /home/myapp/myapp/static/assets
|
||||
ln -s /home/myapp/myapp/assets /home/myapp/myapp/static/
|
||||
rm -rf /home/myapp/myapp/static/mnt
|
||||
rm -f /home/myapp/myapp/static/mnt
|
||||
mkdir -p /data/k8s/kubeflow/pipeline/workspace
|
||||
ln -s /data/k8s/kubeflow/pipeline/workspace /home/myapp/myapp/static/mnt
|
||||
rm -f /home/myapp/myapp/static/dataset
|
||||
mkdir -p /data/k8s/kubeflow/dataset
|
||||
ln -s /data/k8s/kubeflow/dataset /home/myapp/myapp/static/
|
||||
rm -f /home/myapp/myapp/static/aihub
|
||||
ln -s /cube-studio/aihub /home/myapp/myapp/static/
|
||||
|
||||
rm -f /home/myapp/myapp/static/global
|
||||
ln -s /data/k8s/kubeflow/global /home/myapp/myapp/static/
|
||||
|
||||
export FLASK_APP=myapp:app
|
||||
python myapp/create_db.py
|
||||
myapp fab create-admin --username admin --firstname admin --lastname admin --email admin@tencent.com --password admin
|
||||
# myapp db init # 生成migrations文件夹
|
||||
# myapp db migrate # 生成对应版本数据库表的升级文件到versions文件夹下,需要你的数据库是已经upgrade的
|
||||
myapp db upgrade # 数据库表同步更新到mysql
|
||||
myapp fab create-admin --username admin --firstname admin --lastname admin --email admin@tencent.com --password admin
|
||||
# 会创建默认的角色和权限。会创建自定义的menu权限,也才能显示自定义menu。
|
||||
myapp init
|
||||
|
||||
@ -1101,6 +1112,8 @@ data:
|
||||
|
||||
kind: ConfigMap
|
||||
metadata:
|
||||
creationTimestamp: null
|
||||
creationTimestamp: "2024-04-06T07:16:21Z"
|
||||
name: kubeflow-dashboard-config
|
||||
namespace: infra
|
||||
resourceVersion: "200718"
|
||||
uid: ec80f20c-0e19-45ab-a213-50e96fbfba0f
|
||||
|
39
install/kubernetes/helm-install/templates/pull_image.yaml
Normal file
39
install/kubernetes/helm-install/templates/pull_image.yaml
Normal file
@ -0,0 +1,39 @@
|
||||
# Helm pre-install hook Job that pre-pulls container images on one node.
# It runs the docker CLI against the node's Docker daemon through the
# host's /var/run/docker.sock, so the pulled images land in that node's cache.
apiVersion: batch/v1
kind: Job
metadata:
  name: image-pull
  annotations:
    "helm.sh/hook": pre-install
    "helm.sh/hook-weight": "5"
    # Remove the Job left over from a previous release before creating this one.
    "helm.sh/hook-delete-policy": before-hook-creation
spec:
  template:
    spec:
      nodeSelector:
        # Quoted so that an empty, numeric-looking or boolean-looking node name
        # still renders as a YAML string (label values must be strings).
        kubernetes.io/hostname: {{ .Values.nodeLabels.nodeNames | quote }}
      # NOTE(review): hostPID, hostNetwork and privileged look broader than the
      # socket mount alone requires - confirm whether they can be dropped.
      hostPID: true
      hostNetwork: true
      containers:
        - name: image-pull
          # NOTE(review): untagged image resolves to `docker:latest` - consider
          # pinning a version.
          image: docker
          securityContext:
            privileged: true
          volumeMounts:
            - name: docker-socket
              mountPath: /var/run/docker.sock
          command: ["/bin/sh", "-c"]
          # `set -e` makes the container fail as soon as one pull fails, so
          # restartPolicy OnFailure retries it. Previously a failed first pull
          # was masked whenever the last pull succeeded.
          args:
            - |
              set -e
              docker pull busybox:1.36.0
              docker pull mysql:8.0.32
      restartPolicy: OnFailure
      volumes:
        - name: docker-socket
          hostPath:
            path: /var/run/docker.sock
            type: Socket
|
||||
|
||||
|
||||
|
1
install/kubernetes/kubeconfig/dev-kubeconfig
Normal file
1
install/kubernetes/kubeconfig/dev-kubeconfig
Normal file
@ -0,0 +1 @@
|
||||
|
Loading…
Reference in New Issue
Block a user