-
Notifications
You must be signed in to change notification settings - Fork 0
/
law.cfg
169 lines (126 loc) · 4.83 KB
/
law.cfg
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
# Core settings: this file builds on the base configuration referenced below.
# NOTE(review): presumably values set in this file take precedence over inherited ones — confirm
# against the law configuration documentation.
[core]
# inherit from the columnflow configuration file
inherit: $CF_BASE/law.cfg
# Python modules made known to law, one dotted module path per line (keys without values).
# NOTE(review): presumably these are the modules scanned for tasks when the law index is built —
# confirm against the law documentation.
[modules]
columnflow.tasks.cms.inference
columnflow.tasks.cms.external
# NOTE(review): the following module is commented out without a recorded reason; re-enable or
# remove it once its status is clear.
# columnflow.tasks.data_driven_methods
httcp.tasks
# Log level per logger, written as "logger name: LEVEL".
[logging]
law: INFO
luigi-interface: INFO
gfal2: WARNING
columnflow.columnar_util-perf: INFO
# Analysis-wide settings: default analysis/config/dataset, module lists per processing step,
# sandbox and remote workflow defaults, and array I/O checks.
[analysis]
# defaults for the analysis, config and dataset
# NOTE(review): presumably used when a task is run without the corresponding parameter — confirm
default_analysis: httcp.config.analysis_httcp.analysis_httcp
default_config: run2_2017_nano_local_v10
default_dataset: h_ggf_tautau_powheg
# comma-separated lists of module paths, one key per processing step; "{a,b}" groups several
# submodules under a common prefix
# NOTE(review): presumably brace-expanded by the consumer before the modules are imported — confirm
calibration_modules: columnflow.calibration.cms.{jets,met}, httcp.calibration.main
selection_modules: columnflow.selection.{empty}, columnflow.selection.cms.{json_filter, met_filters}, httcp.selection.main
production_modules: columnflow.production.{categories,normalization,processes}, columnflow.production.cms.{btag,electron,mc_weight,muon,pdf,pileup,scale,seeds}, httcp.production.main
categorization_modules: httcp.categorization.main
ml_modules: columnflow.ml, httcp.ml.example
inference_modules: columnflow.inference, httcp.inference.example
weight_production_modules: columnflow.weight.{empty,all_weights}, httcp.weight.main
# namespace of all columnflow tasks
cf_task_namespace: cf
# default sandbox for main tasks with standard packages for columnar processing
default_columnar_sandbox: bash::$CF_BASE/sandboxes/venv_columnar.sh
# whether or not the ensure_proxy decorator should be skipped, even if used by a task's run method
skip_ensure_proxy: False
# some remote workflow parameter defaults (flavors and partition are read from environment variables)
htcondor_flavor: $CF_HTCONDOR_FLAVOR
htcondor_share_software: False
slurm_flavor: $CF_SLURM_FLAVOR
slurm_partition: $CF_SLURM_PARTITION
# ChunkedIOHandler defaults
chunked_io_chunk_size: 100000
chunked_io_pool_size: 2
chunked_io_debug: False
# csv list of task families that inherit from ChunkedReaderMixin and whose output arrays should be
# checked (raising an exception) for non-finite values before saving them to disk
check_finite_output: cf.CalibrateEvents, cf.SelectEvents, cf.ProduceColumns
# csv list of task families that inherit from ChunkedReaderMixin and whose input columns should be
# checked (raising an exception) for overlaps between fields when creating a merged input array
# NOTE(review): "None" presumably disables the check for all task families — confirm
check_overlapping_inputs: None
# whether to log runtimes of array functions by default
log_array_function_runtime: False
# Output configuration: the file systems in use, the lookup order for nano input files, and the
# output location of each task family.
[outputs]
# list of all used file systems
# NOTE(review): the section [wlcg_fs_eoscms_redirector] is defined in this file but is listed
# neither here nor in lfn_sources — add it if it is meant to be used, otherwise consider removing it.
# NOTE(review): "local" in the two lists below appears to name the [local] file system section,
# while "local" as an output location further down selects the local target type — confirm.
wlcg_file_systems: local, wlcg_fs, wlcg_fs_infn_redirector, wlcg_fs_global_redirector
# list of file systems used by columnflow.tasks.external.GetDatasetLFNs.iter_nano_files to
# look for the correct fs per nano input file (in that order)
lfn_sources: local, wlcg_fs_infn_redirector, wlcg_fs_global_redirector
# output locations per task family
# for local targets : "local[, LOCAL_FS_NAME or STORE_PATH]"
# for remote targets: "wlcg[, WLCG_FS_NAME]"
# (when WLCG_FS_NAME is empty, the tasks' "default_wlcg_fs" attribute is used)
# locations configured for this analysis (one "task family: location" entry per line):
cf.BundleRepo: wlcg
cf.BundleSoftware: wlcg
cf.BundleBashSandbox: wlcg
cf.BundleCMSSWSandbox: wlcg
cf.BundleExternalFiles: wlcg
cf.GetDatasetLFNs: wlcg
cf.CalibrateEvents: wlcg
cf.SelectEvents: wlcg
cf.MergeSelectionStats: wlcg
cf.MergeSelectionMasks: wlcg
cf.ReduceEvents: wlcg
cf.MergeReductionStats: wlcg
cf.MergeReducedEvents: wlcg
cf.ProduceColumns: wlcg
cf.CreateHistograms: wlcg
cf.MergeHistograms: wlcg
# plots are the only outputs kept as local targets
cf.PlotVariables1D: local
cf.CreatePileupWeights: wlcg
cf.PrepareMLEvents: wlcg
cf.MergeMLEvents: wlcg
cf.MLTraining: wlcg
cf.MLEvaluation: wlcg
cf.UniteColumns: wlcg
# Job submission settings: job file location, crab storage, and the grid setup for remote jobs.
[job]
# directory for job files (read from an environment variable) and its cleanup switch
# NOTE(review): presumably "False" keeps the job files after submission — confirm
job_file_dir: $CF_JOB_BASE
job_file_dir_cleanup: False
# storage element (SE) and output directory on that SE for crab's internal output
# (crab might not even move files there, but it is strictly required for crab's job submission)
crab_storage_element: $CF_CRAB_STORAGE_ELEMENT
crab_base_directory: $CF_CRAB_BASE_DIRECTORY
# lcg setup file sourced in remote jobs to access gfal tools
remote_lcg_setup: /cvmfs/grid.cern.ch/alma9-ui-test/etc/profile.d/setup-alma9-test.sh
# File system named "local"; it is referenced in wlcg_file_systems and lfn_sources of [outputs].
# NOTE(review): despite its name, the base is a remote xrootd endpoint (eosuser.cern.ch) — confirm
# that this is intended.
[local]
base: root://eosuser.cern.ch
# Local file system whose base is the root directory "/".
[local_fs]
base: /
# Remote file system "wlcg_fs": storage base plus caching options.
# NOTE(review): presumably the file system used for outputs configured as "wlcg" in [outputs] when
# no other file system name is given — confirm.
[wlcg_fs]
# set this to your desired location
# NOTE(review): currently points to a personal EOS user area; other users need to change it
base: root://eosuser.cern.ch//eos/user/j/jmalvaso/higgs_cp_store/
create_file_dir: True
# cache switches and location are read from environment variables; the size limit is fixed here
use_cache: $CF_WLCG_USE_CACHE
cache_root: $CF_WLCG_CACHE_ROOT
cache_cleanup: $CF_WLCG_CACHE_CLEANUP
cache_max_size: 50GB
# File system pointing to the xrootd redirector at xrootd-cms.infn.it; it is listed in
# wlcg_file_systems and lfn_sources of [outputs].
[wlcg_fs_infn_redirector]
base: root://xrootd-cms.infn.it
# cache switches and location are read from environment variables; the size limit is fixed here
use_cache: $CF_WLCG_USE_CACHE
cache_root: $CF_WLCG_CACHE_ROOT
cache_cleanup: $CF_WLCG_CACHE_CLEANUP
cache_max_size: 15GB
cache_global_lock: True
# NOTE(review): a negative value presumably disables the mtime-based patience check — confirm
# against the law file system documentation
cache_mtime_patience: -1
# File system pointing to the xrootd endpoint at eoscms.cern.ch.
# NOTE(review): this section is listed neither in wlcg_file_systems nor in lfn_sources of
# [outputs], so it appears to be unused by this file — confirm whether it should be added there.
[wlcg_fs_eoscms_redirector]
base: root://eoscms.cern.ch
# cache switches and location are read from environment variables; the size limit is fixed here
use_cache: $CF_WLCG_USE_CACHE
cache_root: $CF_WLCG_CACHE_ROOT
cache_cleanup: $CF_WLCG_CACHE_CLEANUP
cache_max_size: 15GB
cache_global_lock: True
# NOTE(review): a negative value presumably disables the mtime-based patience check — confirm
# against the law file system documentation
cache_mtime_patience: -1
# File system pointing to the xrootd redirector at cms-xrd-global.cern.ch; it is listed in
# wlcg_file_systems and, as the last entry, in lfn_sources of [outputs].
[wlcg_fs_global_redirector]
base: root://cms-xrd-global.cern.ch
# cache switches and location are read from environment variables; the size limit is fixed here
use_cache: $CF_WLCG_USE_CACHE
cache_root: $CF_WLCG_CACHE_ROOT
cache_cleanup: $CF_WLCG_CACHE_CLEANUP
cache_max_size: 15GB
cache_global_lock: True
# NOTE(review): a negative value presumably disables the mtime-based patience check — confirm
# against the law file system documentation
cache_mtime_patience: -1