结合 DP还能干这个?——transfer learning应用之D3修正 - 知乎 (zhihu.com)
/work/qan/kluo/Mg/dpgen/TransLnt50/simplify.json
{
"type_map": ["Mg"],
"mass_map": [24.305],
"init_data_prefix": "",
"init_data_sys": [],
"pick_data": "/work/qan/kluo/Mg/dpgen/TLRun/collect",
"labeled": false,
"init_pick_number":100,
"iter_pick_number":2000,
"model_devi_f_trust_lo":0.05,
"model_devi_f_trust_hi":0.2,
"sys_configs": [],
"sys_batch_size": ["auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto"],
"_sys_batch_size": [1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1],
"training_iter0_model_path": ["/work/qan/kluo/Mg/dpgen/TLRun/iter.000087/00.train/00[0-3]"],
"training_init_model": true,
"numb_models": 4,
"dp_compress": true,
"default_training_param": {
"model": {
"type_map": ["Mg"],
"descriptor": {
"type": "se_e2_a",
"sel": [80],
"_sel_comment": "也可写成 \"sel\": \"auto:1.01\";但如果需要用旧模型初始化(迁移学习,transfer learning),sel 必须填写旧模型中的确定值,不能使用 auto 自动确定。",
"rcut_smth": 2.0,
"rcut": 6.0,
"neuron": [20,40,80],
"resnet_dt": false,
"axis_neuron": 12,
"trainable": false,
"seed": 0
},
"fitting_net": {
"neuron": [120,120,120],
"resnet_dt": true,
"trainable": [false, false, false, true],
"seed": 1
}
},
"learning_rate": {
"type": "exp",
"start_lr": 0.001,
"stop_lr": 3.51e-8,
"decay_steps": 10000
},
"loss": {
"type": "ener",
"start_pref_e": 0.02,
"limit_pref_e": 1,
"start_pref_f": 1000,
"limit_pref_f": 1,
"start_pref_v": 0.02,
"limit_pref_v": 1
},
"training": {
"_validation_data":{
"systems": [
"/work/qan/kluo/Mg/dpgen/iter.000059/02.fp/data.029"],
"batch_size": "auto",
"numb_btch": 4,
"_comment": "that's all"
},
"stop_batch": 2000000,
"_seed": 1,
"disp_file": "lcurve.out",
"disp_freq": 5000,
"numb_test": 2,
"save_freq": 100000,
"save_ckpt": "model.ckpt",
"disp_training": true,
"time_training": true,
"profiling": false,
"profiling_file": "timeline.json",
"_comment": "that's all"
}
},
"fp_style": "vasp",
"_fp_skip_bad_box": "true",
"fp_task_max": 2000,
"fp_task_min": 0,
"ratio_failed": 1.0,
"_fp_accurate_threshold": 0.99,
"_fp_accurate_soft_threshold": 0.01,
"fp_pp_path": "./",
"fp_pp_files": ["POTCAR_Mg"],
"fp_incar": "./INCAR_Mg",
"_comment": "that's all"
}
/work/qan/kluo/Mg/dpgen/TransLnt50/machine.json
{
"api_version": "1.0",
"_deepmd_version": "2.0.3",
"train" :[
{
"command": "dp",
"machine": {
"batch_type": "slurm",
"context_type": "local",
"local_root" : "./",
"remote_root": "./work"
},
"resources": {
"number_node": 1,
"cpu_per_node": 64,
"gpu_per_node": 0,
"queue_name": "nova,reserved,instruction,interactive,scavenger",
"custom_flags": ["###SBATCH --account=cpu-s1-matersimul-0",
"#SBATCH --job-name='dptrain'",
"#SBATCH --cpus-per-task=1",
"#SBATCH --hint=compute_bound",
"#SBATCH --ntasks=64",
"#SBATCH --mail-type=ALL",
"#SBATCH --time=24:00:00",
"#SBATCH --exclusive",
"#SBATCH --mem=0",
"#SBATCH --exclude=nova18-gpu-[1-5],nova21-gpu-[1-15],nova22-gpu-[1-5]",
"#SBATCH --mail-user=kluo@iastate.edu"],
"source_list": ["/work/qan/kluo/TiCdpgen/Run/dp221.sh"],
"_module_list": ["intel/mkl/64/2019/5.281", "intel/mpi/64/2019/5.281"],
"_time_limit": "240:0:0",
"group_size": 1
}
}
],
"model_devi":[
{
"command": "dp",
"machine": {
"batch_type": "slurm",
"context_type": "local",
"local_root" : "./",
"remote_root": "./work"
},
"resources": {
"number_node": 1,
"cpu_per_node": 64,
"gpu_per_node": 0,
"queue_name": "nova,reserved,instruction,interactive,scavenger",
"custom_flags": ["###SBATCH --account=cpu-s1-matersimul-0",
"#SBATCH --job-name='dpdevi'",
"#SBATCH --cpus-per-task=1",
"#SBATCH --hint=compute_bound",
"#SBATCH --ntasks=64",
"#SBATCH --exclusive",
"#SBATCH --mem=0",
"##SBATCH --nodelist=nova18-[1-70]",
"#SBATCH --exclude=nova18-gpu-[1-5],nova21-gpu-[1-15],nova22-gpu-[1-5]",
"#SBATCH --time=1:00:00"],
"source_list": ["/work/qan/kluo/TiCdpgen/Run/lmp227.sh"],
"_module_list": ["intel/mkl/64/2019/5.281", "intel/mpi/64/2019/5.281"],
"_time_limit": "240:0:0",
"wait_time": 1,
"group_size": 1
}
}
],
"fp":[
{
"command": "python /work/qan/kluo/Mg/CDFTpython/elect.py ./ --name Mg --count 2 --nt 50 --ncore 18 && srun -n 18 /work/qan/codes/VASP/bin/vasp_std1",
"machine": {
"batch_type": "slurm",
"context_type": "local",
"local_root" : "./",
"remote_root": "./work"
},
"resources": {
"number_node": 1,
"cpu_per_node": 18,
"gpu_per_node": 0,
"queue_name": "nova,reserved,instruction,interactive,scavenger",
"custom_flags": ["#SBATCH --constraint=intel",
"#SBATCH --job-name='fp'",
"#SBATCH --cpus-per-task=1",
"#SBATCH --hint=compute_bound",
"#SBATCH --ntasks=18",
"##SBATCH --exclusive",
"##SBATCH --mem=0",
"#SBATCH --exclude=nova18-gpu-[1-5],nova21-gpu-[1-15],nova22-gpu-[1-5]",
"#SBATCH --time=2:00:00"],
"source_list": ["/home/kluo/shpy/dplmp.sh"],
"_module_list": ["intel/mkl/64/2019/5.281", "intel/mpi/64/2019/5.281"],
"_time_limit": "240:0:0",
"wait_time": 1,
"group_size": 1
}
}
]
}
评论
发表评论