forked from LLNL/scr
-
Notifications
You must be signed in to change notification settings - Fork 0
/
scr.user.conf.template
35 lines (31 loc) · 1.33 KB
/
scr.user.conf.template
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# For convenience, one may specify SCR parameters in a configuration
# file. Set SCR_CONF_FILE to point to the user configuration file.
# This may be easier than specifying a bunch of environment variables.
#
# Also, a user configuration file is the *ONLY* way to specify
# multiple types of checkpoints for a single run.
#
# See the SCR User Manual for more details. This file contains some
# example settings.
# Specify the storage directories, the number of checkpoints to be
# stored in each location, and the group of processes which share
# a device. The first two describe node-local storage and the last
# describes a global parallel file system.
#
STORE=/dev/shm GROUP=NODE COUNT=1
STORE=/ssd GROUP=NODE COUNT=3
STORE=/p/lscratcha GROUP=WORLD
# Specify that checkpoint descriptors should be taken from the CKPT
# entries defined in this file
#
SCR_COPY_TYPE=FILE
# Enable datasets to be stored in cache
#
SCR_CACHE_BYPASS=0
# Specify the different types of checkpoints for a job. The following
# instructs SCR to run with two checkpoint configurations:
# - save every 4th checkpoint to /ssd using XOR with a set size of 8
# - save all other checkpoints (not divisible by 4) to /dev/shm using
# XOR with a set size of 16
#
CKPT=0 INTERVAL=1 GROUP=NODE STORE=/dev/shm TYPE=XOR SET_SIZE=16
CKPT=1 INTERVAL=4 GROUP=NODE STORE=/ssd TYPE=XOR SET_SIZE=8