|
|
|
@@ -1,4 +1,64 @@ |
|
|
|
[ |
|
|
|
{ |
|
|
|
"Name": "两卡GPU并行训练-调试任务", |
|
|
|
"Description": "", |
|
|
|
"JobType": "DEBUG", |
|
|
|
"Cluster": "C2Net", |
|
|
|
"ComputeSource": "GPU", |
|
|
|
"HasInternet": 2, |
|
|
|
"VisualizeRequired": false, |
|
|
|
"AccCardsNum": 2, |
|
|
|
"AccCardType": "V100", |
|
|
|
"CpuCores": 16, |
|
|
|
"MemGiB": 100, |
|
|
|
"GPUMemGiB": 32, |
|
|
|
"ShareMemGiB": 0, |
|
|
|
"Image": { |
|
|
|
"ImageID": "", |
|
|
|
"ImageName": "", |
|
|
|
"ImageUrl": "192.168.242.22:443/default-workspace/fccb038c23234b9e80105d4ccd152117/image:ChatGLM3-6B" |
|
|
|
}, |
|
|
|
"PretrainModelList": [], |
|
|
|
"DatasetList": [ |
|
|
|
{ |
|
|
|
"ID": "8d5178b2-eb56-4c0d-b532-be8c685b1e61", |
|
|
|
"DatasetName": "MnistDataset_torch.zip" |
|
|
|
} |
|
|
|
], |
|
|
|
"BranchName": "master", |
|
|
|
"BootFile": "", |
|
|
|
"Parameters": [] |
|
|
|
}, |
|
|
|
{ |
|
|
|
"Name": "两卡GPU并行训练-训练任务", |
|
|
|
"Description": "", |
|
|
|
"JobType": "TRAIN", |
|
|
|
"Cluster": "C2Net", |
|
|
|
"ComputeSource": "GPU", |
|
|
|
"HasInternet": 2, |
|
|
|
"VisualizeRequired": false, |
|
|
|
"AccCardsNum": 2, |
|
|
|
"AccCardType": "V100", |
|
|
|
"CpuCores": 16, |
|
|
|
"MemGiB": 100, |
|
|
|
"GPUMemGiB": 32, |
|
|
|
"ShareMemGiB": 0, |
|
|
|
"Image": { |
|
|
|
"ImageID": "", |
|
|
|
"ImageName": "", |
|
|
|
"ImageUrl": "192.168.242.22:443/default-workspace/fccb038c23234b9e80105d4ccd152117/image:ChatGLM3-6B" |
|
|
|
}, |
|
|
|
"PretrainModelList": [], |
|
|
|
"DatasetList": [ |
|
|
|
{ |
|
|
|
"ID": "8d5178b2-eb56-4c0d-b532-be8c685b1e61", |
|
|
|
"DatasetName": "MnistDataset_torch.zip" |
|
|
|
} |
|
|
|
], |
|
|
|
"BranchName": "master", |
|
|
|
"BootFile": "gpu_mnist_example/parallel_train.py", |
|
|
|
"Parameters": [] |
|
|
|
}, |
|
|
|
{ |
|
|
|
"Name": "NPU调试任务", |
|
|
|
"Description": "", |
|
|
|
@@ -338,65 +398,5 @@ |
|
|
|
"Value": "8" |
|
|
|
} |
|
|
|
] |
|
|
|
}, |
|
|
|
{ |
|
|
|
"Name": "两卡GPU并行训练", |
|
|
|
"Description": "", |
|
|
|
"JobType": "TRAIN", |
|
|
|
"Cluster": "C2Net", |
|
|
|
"ComputeSource": "GPU", |
|
|
|
"HasInternet": 2, |
|
|
|
"VisualizeRequired": false, |
|
|
|
"AccCardsNum": 2, |
|
|
|
"AccCardType": "V100", |
|
|
|
"CpuCores": 16, |
|
|
|
"MemGiB": 100, |
|
|
|
"GPUMemGiB": 32, |
|
|
|
"ShareMemGiB": 0, |
|
|
|
"Image": { |
|
|
|
"ImageID": "", |
|
|
|
"ImageName": "", |
|
|
|
"ImageUrl": "192.168.242.22:443/default-workspace/fccb038c23234b9e80105d4ccd152117/image:ChatGLM3-6B" |
|
|
|
}, |
|
|
|
"PretrainModelList": [], |
|
|
|
"DatasetList": [ |
|
|
|
{ |
|
|
|
"ID": "8d5178b2-eb56-4c0d-b532-be8c685b1e61", |
|
|
|
"DatasetName": "MnistDataset_torch.zip" |
|
|
|
} |
|
|
|
], |
|
|
|
"BranchName": "master", |
|
|
|
"BootFile": "gpu_mnist_example/parallel_train.py", |
|
|
|
"Parameters": [] |
|
|
|
}, |
|
|
|
{ |
|
|
|
"Name": "两卡GPU并行训练-调试任务", |
|
|
|
"Description": "", |
|
|
|
"JobType": "DEBUG", |
|
|
|
"Cluster": "C2Net", |
|
|
|
"ComputeSource": "GPU", |
|
|
|
"HasInternet": 2, |
|
|
|
"VisualizeRequired": false, |
|
|
|
"AccCardsNum": 2, |
|
|
|
"AccCardType": "V100", |
|
|
|
"CpuCores": 16, |
|
|
|
"MemGiB": 100, |
|
|
|
"GPUMemGiB": 32, |
|
|
|
"ShareMemGiB": 0, |
|
|
|
"Image": { |
|
|
|
"ImageID": "", |
|
|
|
"ImageName": "", |
|
|
|
"ImageUrl": "192.168.242.22:443/default-workspace/fccb038c23234b9e80105d4ccd152117/image:ChatGLM3-6B" |
|
|
|
}, |
|
|
|
"PretrainModelList": [], |
|
|
|
"DatasetList": [ |
|
|
|
{ |
|
|
|
"ID": "8d5178b2-eb56-4c0d-b532-be8c685b1e61", |
|
|
|
"DatasetName": "MnistDataset_torch.zip" |
|
|
|
} |
|
|
|
], |
|
|
|
"BranchName": "master", |
|
|
|
"BootFile": "", |
|
|
|
"Parameters": [] |
|
|
|
} |
|
|
|
] |