70 lines
2.2 KiB
YAML
70 lines
2.2 KiB
YAML
# config/param.yaml
|
|
|
|
# --- 1. 环境与路径配置 ---
|
|
env:
|
|
# 可执行文件绝对路径
|
|
vasp_std: "mpirun -np 1 /cluster/home/koko125/vasp/bin_gpu/vasp_std"
|
|
gpumd: "/cluster/home/koko125/tool/GPUMD/src/gpumd"
|
|
nep: "/cluster/home/koko125/tool/GPUMD/src/nep"
|
|
|
|
# GPUMDKit 脚本库根目录
|
|
gpumdkit_root: "/cluster/home/koko125/tool/GPUMDkit"
|
|
|
|
# 【修改点】HPC 作业提交配置 (用于填充 submit.slurm 模板)
|
|
# 这些变量会被自动替换到 .sh 脚本头部
|
|
# slurm_config:
|
|
# partition: "v100" # 队列分区名
|
|
# account: "def-user" # 账户名 (如果有)
|
|
# gpu_per_node: 1 # 每节点 GPU 数
|
|
# ntasks_per_node: 32 # 每节点 CPU 核数
|
|
# time_limit: "24:00:00" # 墙钟时间限制
|
|
|
|
# --- 2. 流程控制 ---
|
|
# 阶段代号定义 (对应 modules 下的 Python 文件)
|
|
stages_def:
|
|
p: "preheat" # 00.md/preheat
|
|
m: "md" # 00.md/md
|
|
s: "select" # 01.select
|
|
d: "scf" # 02.scf
|
|
t: "train" # 03.train
|
|
pr: "predict" # 04.predict (新增:用于性质预测)
|
|
o: "output" # 05.output (始终默认执行:整理报告)
|
|
|
|
# 自定义流程调度
|
|
# 注意:'o' (output) 不需要显式写在这里,代码逻辑会强制每轮最后执行它
|
|
schedule:
|
|
# 第1轮: 跑完训练,不做预测,看一眼结果
|
|
1: ["p", "m", "s", "d", "t"]
|
|
|
|
# 第2轮: 跑完训练,加入预测步骤 (计算电导/扩散等)
|
|
2: ["p", "m", "s", "d", "t", "pr"]
|
|
|
|
# 默认流程 (如果没有定义轮次)
|
|
default_workflow: ["p", "m", "s", "d", "t", "pr"]
|
|
|
|
# --- 3. 容错与通知 ---
|
|
control:
|
|
max_retries: 3 # 任务失败自动重启次数
|
|
check_interval: 60 # 状态检查间隔 (秒)
|
|
|
|
notification:
|
|
enable_log: true
|
|
log_file: "./logs/sys_runtime.log"
|
|
|
|
enable_hook: true
|
|
hook_script: "python ./hooks/send_alert.py"
|
|
alert_events: ["fail", "finish"]
|
|
|
|
# --- 4. 模块参数 ---
|
|
params:
|
|
preheat:
|
|
temp: 300
|
|
steps: 10000
|
|
select:
|
|
target_min: 60
|
|
target_max: 120
|
|
init_threshold: 0.01
|
|
predict:
|
|
# 预测阶段需要的参数,比如计算电导率的温度范围
|
|
temperatures: [300, 400, 500]
|
|
script_path: "scripts/calc_conductivity.py" # 具体的计算脚本 |