Skip to content

Commit 5af1fd5

Browse files
authored
Add a local submission json file with 4-GPU. (#400)
* Add a local submission json file with 4-GPU. * Update machine-local-4GPU.json Added some comments. Thanks Yinan for checking.
1 parent 0aa1b4f commit 5af1fd5

File tree

1 file changed

+89
-0
lines changed

1 file changed

+89
-0
lines changed
Lines changed: 89 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,89 @@
1+
{
2+
"_comment" : "This is an example of DP-GEN on Local device running with 4 GPUs",
3+
"_comment" : "Last updated on 2021.5.9 for DP-GEN 0.9.2 by Ke XU",
4+
"train": [
5+
{
6+
"_comment" : "Specify the installed path of DeePMD-kit",
7+
"_comment" : "The version of DeePMD-kit should be 1.*",
8+
"command": "/home/user/anaconda3/bin/dp",
9+
"_comment" : "Specify machine settings",
10+
"machine": {
11+
"_comment" : "Supported batches include slurm, pbs, shell, lsf.",
12+
"batch": "shell",
13+
"work_path": "/tmp/dpwork",
14+
"_comment": "that's all"
15+
},
16+
"resources":{
17+
"_comment" : "The number of nodes.",
18+
"numb_node": 1,
19+
"_comment" : "The number of GPUs.",
20+
"numb_gpu": 1,
21+
"_comment" : "The number of CPUs.",
22+
"task_per_node": 4,
23+
"_comment" : "The number of GPUs that can be used for each task.",
24+
"manual_cuda_devices": 4,
25+
"_comment" : "The number of tasks that can be run in each GPU.",
26+
"manual_cuda_multiplicity":1,
27+
"_comment" : "Allow the multi-GPU task running.",
28+
"cuda_multi_task": true,
29+
"_comment" : "Partition.",
30+
"partition": "gpu",
31+
"_comment" : "Memory limit.",
32+
"mem_limit": 64,
33+
"_comment" : "None for local device",
34+
"exclude_list": [],
35+
"module_list": [],
36+
"source_list": ["/opt/intel/parallel_studio_xe_2020/psxevars.sh"],
37+
"_comment" : "Time limit.",
38+
"time_limit": "23:0:0"
39+
},
40+
"_comment" : "DP-GEN will put 4 tasks together in one submitting script.",
41+
"group_size": 4
42+
}
43+
],
44+
45+
"model_devi": [
46+
{
47+
"machine": {
48+
"batch": "shell",
49+
"work_path": "/tmp/dpwork"
50+
},
51+
"resources": {
52+
"numb_node": 1,
53+
"numb_gpu": 4,
54+
"task_per_node": 4,
55+
"manual_cuda_devices": 4,
56+
"manual_cuda_multiplicity":1,
57+
"cuda_multi_task": true,
58+
"partition": "gpu",
59+
"exclude_list": [],
60+
"mem_limit": 64,
61+
"source_list": [],
62+
"module_list": [],
63+
"time_limit": "23:0:0"
64+
},
65+
"command": "/home/user/Soft/Deepmd/lammps-stable_29Oct2020/src/lmp_mpi",
66+
"group_size": 4
67+
}
68+
],
69+
70+
"fp": [
71+
{
72+
"machine": {
73+
"batch": "shell",
74+
"work_path": "/tmp/dpwork"
75+
},
76+
"resources": {
77+
"allow_failure": true,
78+
"ratio_failue": 0.05,
79+
"task_per_node": 16,
80+
"with_mpi": true,
81+
"_comment" : "Load the intel compiler.",
82+
"source_list": ["/opt/intel/parallel_studio_xe_2020/psxevars.sh"],
83+
"envs": {"PATH" : "/home/user/Soft/VASP/vasp.5.4.4-allbak/bin:$PATH"}
84+
},
85+
"command": "vasp_std",
86+
"group_size": 1
87+
}
88+
]
89+
}

0 commit comments

Comments
 (0)