dpgen transfer learning

参考文章：DP还能干这个？——transfer learning应用之D3修正 - 知乎 (zhihu.com)

/work/qan/kluo/Mg/dpgen/TransLnt50/simplify.json

{

     "type_map": ["Mg"],
     "mass_map": [24.305],
     "init_data_prefix": "",
     "init_data_sys":  [],
     "pick_data":  "/work/qan/kluo/Mg/dpgen/TLRun/collect",
     
     "labeled": false,
     "init_pick_number":100,
     "iter_pick_number":2000,
     "model_devi_f_trust_lo":0.05,
     "model_devi_f_trust_hi":0.2,
     
     "sys_configs": [],
     "sys_batch_size": ["auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto","auto"],
     "_sys_batch_size": [1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1],
     "training_iter0_model_path":  ["/work/qan/kluo/Mg/dpgen/TLRun/iter.000087/00.train/00[0-3]"],
     "training_init_model": true, 
     "numb_models": 4,
     "dp_compress": true,
     "default_training_param": {
        "model": {
            "type_map": ["Mg"],
            "descriptor": {
                "type": "se_e2_a",
                "sel": [80], 
# 或者写成 "sel": "auto:1.01"。注意：如果需要用旧模型初始化（transfer learning），sel 必须填写旧模型中的确定数值，不能使用 auto 自动选择。（JSON 不支持注释，实际使用前请删除本行。）
                "rcut_smth": 2.0,
                "rcut": 6.0,
                "neuron": [20,40,80],
                "resnet_dt": false,
                "axis_neuron": 12,
                "trainable":   false,
                "seed": 0
            },
             "fitting_net": {
                "neuron": [120,120,120],
                "resnet_dt": true,
                "trainable":   [false, false, false, true],
                "seed": 1
            }
        },
         "learning_rate": {
             "type": "exp",
             "start_lr": 0.001,
             "stop_lr": 3.51e-8,
             "decay_steps": 10000
         },
         "loss": {
             "type":         "ener",
             "start_pref_e": 0.02,
             "limit_pref_e": 1,
             "start_pref_f": 1000,
             "limit_pref_f": 1,
             "start_pref_v": 0.02,
             "limit_pref_v": 1
         },
         "training": {
             "_validation_data":{
             "systems": [
             "/work/qan/kluo/Mg/dpgen/iter.000059/02.fp/data.029"],

        "batch_size":   "auto",
        "numb_btch":    4,
        "_comment":     "that's all"
    },
         "stop_batch": 2000000,
         "_seed": 1,
         "disp_file": "lcurve.out",
         "disp_freq": 5000,
         "numb_test": 2,
         "save_freq": 100000,
         "save_ckpt": "model.ckpt",
         "disp_training": true,
         "time_training": true,
         "profiling": false,
         "profiling_file": "timeline.json",
         "_comment": "that's all"
         }
     },
 
     "fp_style": "vasp",
     "_fp_skip_bad_box":  "true",
     "fp_task_max": 2000,
     "fp_task_min": 0,
     "ratio_failed": 1.0,
     "_fp_accurate_threshold": 0.99,
     "_fp_accurate_soft_threshold": 0.01,
     "fp_pp_path": "./",
     "fp_pp_files": ["POTCAR_Mg"],
     "fp_incar": "./INCAR_Mg",
     "_comment": "that's all"
}

/work/qan/kluo/Mg/dpgen/TransLnt50/machine.json

{
    "api_version": "1.0",
    "_deepmd_version": "2.0.3",
    "train" :[
        {
            "command": "dp",
            "machine": {
                "batch_type": "slurm",
                "context_type": "local",
                "local_root" : "./",
                "remote_root": "./work"
            },
            "resources": {
                "number_node": 1,
                "cpu_per_node": 64,
                "gpu_per_node": 0,
                                "queue_name": "nova,reserved,instruction,interactive,scavenger",
                                "custom_flags": ["###SBATCH --account=cpu-s1-matersimul-0", 
                                "#SBATCH --job-name='dptrain'", 
                                "#SBATCH --cpus-per-task=1", 
                                "#SBATCH --hint=compute_bound",
                                "#SBATCH --ntasks=64", 
                                "#SBATCH --mail-type=ALL", 
                                "#SBATCH --time=24:00:00",
                                "#SBATCH --exclusive",
                                "#SBATCH --mem=0",
                                "#SBATCH --exclude=nova18-gpu-[1-5],nova21-gpu-[1-15],nova22-gpu-[1-5]",
                                "#SBATCH --mail-user=kluo@iastate.edu"],
                                "source_list": ["/work/qan/kluo/TiCdpgen/Run/dp221.sh"],
                                "_module_list": ["intel/mkl/64/2019/5.281", "intel/mpi/64/2019/5.281"],
                                "_time_limit": "240:0:0",
                                "group_size": 1
            }
        }
    ],
    "model_devi":[
        {
            "command": "dp",
            "machine": {
                "batch_type": "slurm",
                "context_type": "local",
                "local_root" : "./",
                "remote_root": "./work"
            },
            "resources": {
                                "number_node": 1,
                                "cpu_per_node": 64,
                                "gpu_per_node": 0,
                                "queue_name": "nova,reserved,instruction,interactive,scavenger",
                                "custom_flags": ["###SBATCH --account=cpu-s1-matersimul-0", 
                                "#SBATCH --job-name='dpdevi'", 
                                "#SBATCH --cpus-per-task=1", 
                                "#SBATCH --hint=compute_bound",
                                "#SBATCH --ntasks=64", 
                                "#SBATCH --exclusive",
                                "#SBATCH --mem=0",
                                "##SBATCH --nodelist=nova18-[1-70]",
                                "#SBATCH --exclude=nova18-gpu-[1-5],nova21-gpu-[1-15],nova22-gpu-[1-5]",
                                "#SBATCH --time=1:00:00"],
                                "source_list": ["/work/qan/kluo/TiCdpgen/Run/lmp227.sh"],
                                "_module_list": ["intel/mkl/64/2019/5.281", "intel/mpi/64/2019/5.281"],
                                "_time_limit": "240:0:0",
                                "wait_time": 1,
                                "group_size": 1
                        }
        }
    ],
    "fp":[
        {
            "command": "python /work/qan/kluo/Mg/CDFTpython/elect.py ./ --name Mg --count 2 --nt 50 --ncore 18 && srun -n 18 /work/qan/codes/VASP/bin/vasp_std1",
            "machine": {
                                "batch_type": "slurm",
                                "context_type": "local",
                                "local_root" : "./",
                                "remote_root": "./work"
                        },
                        "resources": {
                                "number_node": 1,
                                "cpu_per_node": 18,
                                "gpu_per_node": 0,
                                "queue_name": "nova,reserved,instruction,interactive,scavenger",
                                "custom_flags": ["#SBATCH --constraint=intel", 
                                "#SBATCH --job-name='fp'", 
                                "#SBATCH --cpus-per-task=1", 
                                "#SBATCH --hint=compute_bound",
                                "#SBATCH --ntasks=18",
                                "##SBATCH --exclusive",
                                "##SBATCH --mem=0",
                                "#SBATCH --exclude=nova18-gpu-[1-5],nova21-gpu-[1-15],nova22-gpu-[1-5]",
                                "#SBATCH --time=2:00:00"],
                                "source_list": ["/home/kluo/shpy/dplmp.sh"],
                                "_module_list": ["intel/mkl/64/2019/5.281", "intel/mpi/64/2019/5.281"],
                                "_time_limit": "240:0:0",
                                "wait_time": 1,
                                "group_size": 1
                        }
        }
    ]
}

hikun的地下仓库

搜索此博客

dpgen transfer learning

标签

评论

发表评论

此博客中的热门博文

dpgen数据收集分类续算

dpgen simplify 数据精简二次处理

python相关