run.py 6.05 KB
Newer Older
BO ZHANG's avatar
tweaks  
BO ZHANG committed
1
2
3
4
5
6
7
"""
Aim
---
Schedule L1 pipeline DAG runs for a CSST dataset (e.g. MSC), given a set of parameters.

Example
-------
python -m csst_dag.cli.run -h

python -m csst_dag.cli.run \
    --dags csst-msc-l1-mbi \
    --dataset=csst-msc-c9-25sqdeg-v3 \
    --instrument=MSC \
    --obs-type=WIDE \
    --obs-group=W2 \
    --obs-id=10100232366 \
    --detector=09 \
    --batch-id=test-b1 \
    --priority=1 \
    --pmapname=csst_000070.pmap \
    --ref-cat=trilegal_093

# 25 square-degree wide field
python -m csst_dag.cli.run \
    --dags csst-msc-l1-mbi \
    --dataset=csst-msc-c9-25sqdeg-v3 \
    --instrument=MSC \
    --obs-type=WIDE \
    --prc-status=-2 \
    --batch-id=25sqdeg-test-b2 \
    --priority=1 \
    --pmapname=csst_000070.pmap \
    --ref-cat=trilegal_093 \
    --submit

"""

BO ZHANG's avatar
BO ZHANG committed
38
import argparse
BO ZHANG's avatar
BO ZHANG committed
39
import os
40
import json
BO ZHANG's avatar
BO ZHANG committed
41
42

import joblib
BO ZHANG's avatar
tweaks  
BO ZHANG committed
43

BO ZHANG's avatar
BO ZHANG committed
44
45
from csst_dag import CSST_DAGS, Dispatcher, BaseDAG, dfs

BO ZHANG's avatar
tweaks  
BO ZHANG committed
46
# Command-line interface of the scheduler.
# ArgumentDefaultsHelpFormatter appends "(default: ...)" to every help text,
# so the help strings below must not repeat the default values.
parser = argparse.ArgumentParser(
    description="Scheduler for CSST L1 pipeline.",
    formatter_class=argparse.ArgumentDefaultsHelpFormatter,
)

# data parameters: select which plan / level-0 records are considered
parser.add_argument("--dataset", type=str, help="Dataset name")
parser.add_argument("--instrument", type=str, help="Instrument name", default=None)
parser.add_argument("--obs-type", type=str, help="Observation type", default=None)
parser.add_argument("--obs-group", type=str, help="Observation group", default=None)
parser.add_argument("--obs-id", type=str, help="Observation ID", default=None)
parser.add_argument("--detector", type=str, help="Detector name", default=None)
parser.add_argument(
    "--prc-status", type=int, help="Initial processing status", default=None
)
parser.add_argument("--qc-status", type=int, help="Initial QC status", default=None)
# task parameters
parser.add_argument("--batch-id", type=str, help="Batch ID", default="test-batch")
parser.add_argument("--priority", type=str, help="Task priority", default="1")
# DAG parameters
parser.add_argument("--pmapname", type=str, help="CCDS pmapname", default="")
parser.add_argument(
    "--ref-cat", type=str, help="Reference catalog", default="trilegal_093"
)
# submit
parser.add_argument("--submit", action="store_true", help="Push results", default=False)
# post-processing parameters
# NOTE(review): `final_prc_status` is not referenced by the rest of this
# script as far as visible here -- confirm whether it is still needed.
parser.add_argument(
    "--final-prc-status", type=int, help="Final processing status", default=-2
)
# additional options
parser.add_argument("--force", action="store_true", help="Force success", default=False)
# The help text used to be a copy of the `--force` one; the flag actually
# controls whether `dag_group_run` and `dag_run_list` are printed.
parser.add_argument(
    "--verbose",
    action="store_true",
    help="Print dag_group_run and dag_run_list",
    default=False,
)
# submit top N
# NOTE(review): `top_n` is parsed but not used by the rest of this script as
# far as visible here -- confirm.
parser.add_argument("--top-n", type=int, help="Submit top N tasks", default=-1)
# select DAGs
parser.add_argument("--dags", nargs="+", type=str, help="DAGs to select", default=None)
BO ZHANG's avatar
BO ZHANG committed
85

BO ZHANG's avatar
tweaks  
BO ZHANG committed
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116

# Parse the command line using the parser configured above.
args = parser.parse_args()


# Commented-out alternative that builds `args` by hand instead of parsing the
# command line (presumably kept for interactive debugging -- TODO confirm).
# from csst_dag import DotDict
#
# args = DotDict(
#     dataset="csst-msc-c9-25sqdeg-v3",
#     instrument="MSC",
#     obs_type="WIDE",
#     obs_group="W2",
#     obs_id="10100232366",
#     detector=None,
#     prc_status=None,
#     batch_id="test-batch",
#     priority=1,
#     pmapname="csst_000070.pmap",
#     ref_cat="trilegal_093",
#     submit=False,
# )

# Echo the effective parameters before doing any work.
print("CLI parameters: ", args)

# Collect the data-selection options from the CLI and hand them to the
# dispatcher in one go; it returns the plan basis and the data basis.
basis_filters = {
    option: getattr(args, option)
    for option in (
        "dataset",
        "instrument",
        "obs_type",
        "obs_group",
        "obs_id",
        "detector",
        "prc_status",
        "qc_status",
    )
}
plan_basis, data_basis = Dispatcher.find_plan_level0_basis(**basis_filters)
print(f"{len(plan_basis)} plan basis, {len(data_basis)} data basis found")

# generate DAG group run
group_run_options = dict(
    dag_group="csst-l1-pipeline",
    batch_id=args.batch_id,
    priority=args.priority,
)
dag_group_run = BaseDAG.generate_dag_group_run(**group_run_options)
127

BO ZHANG's avatar
tweaks  
BO ZHANG committed
128
# generate DAG run list
BO ZHANG's avatar
tweaks    
BO ZHANG committed
129
print("\n")
print(">>> Matching DAGs ...")
# Accumulators filled by the scheduling loop further down.
dag_run_list = []
data_id_list = []
n_dag_run_all = 0
n_dag_run_success = 0

# Names of all DAGs this script can schedule.
DEFAULT_DAGS = {
    "csst-msc-l1-mbi",
    "csst-msc-l1-ast",
    "csst-msc-l1-sls",
    "csst-msc-l1-qc0",
    "csst-msc-l1-ooc",
    "csst-mci-l1-qc0",
    "csst-mci-l1",
    "csst-ifs-l1",
    "csst-cpic-l1-qc0",
    "csst-cpic-l1",
    "csst-hstdm-l1",
}

# Validate --dags explicitly instead of with `assert`: assertions are removed
# under `python -O`, in which case unknown names would be silently dropped by
# the intersection below.
if args.dags is not None:
    unknown_dags = sorted(set(args.dags) - DEFAULT_DAGS)
    if unknown_dags:
        # parser.error() prints the usage message and exits with status 2.
        parser.error(
            f"Unknown DAGs: {unknown_dags}; available DAGs: {sorted(DEFAULT_DAGS)}"
        )

# Without --dags every known DAG is selected.
SELECTED_DAGS = (
    DEFAULT_DAGS.intersection(args.dags) if args.dags is not None else DEFAULT_DAGS
)
print("Selected DAGs: ", SELECTED_DAGS)
156

BO ZHANG's avatar
BO ZHANG committed
157
# Schedule every selected DAG and gather the DAG runs it produced.
for dag in SELECTED_DAGS:
    schedule_options = dict(
        dag_group_run=dag_group_run,
        plan_basis=plan_basis,
        data_basis=data_basis,
        pmapname=args.pmapname,
        ref_cat=args.ref_cat,
        force_success=args.force,
    )
    this_task_list = CSST_DAGS[dag].schedule(**schedule_options)

    # A task whose "dag_run" is None yielded no DAG run; only the others are
    # collected and counted as successful.
    matched_tasks = [task for task in this_task_list if task["dag_run"] is not None]
    this_dag_run_list = [task["dag_run"] for task in matched_tasks]
    this_data_id_list = [task["relevant_data_id_list"] for task in matched_tasks]

    dag_run_list += this_dag_run_list
    data_id_list += this_data_id_list

    # Per-DAG counts, also added to the overall totals.
    this_n_dag_run_all = len(this_task_list)
    this_n_dag_run_success = len(this_dag_run_list)
    n_dag_run_all = n_dag_run_all + this_n_dag_run_all
    n_dag_run_success = n_dag_run_success + this_n_dag_run_success
    print(f"- `{dag}` : [ {this_n_dag_run_success} / {this_n_dag_run_all} ] dag_runs")
BO ZHANG's avatar
BO ZHANG committed
184

BO ZHANG's avatar
tweaks    
BO ZHANG committed
185
# print dag_group_run and dag_run_list
BO ZHANG's avatar
BO ZHANG committed
186
187
188
if args.verbose:
    print("\n")
    print(">>> `dag_group_run` :")
    print(f"\t- {json.dumps(dag_group_run, separators=(',', ':'))}")
    print(f">>> `dag_run_list` : [ {n_dag_run_success} / {n_dag_run_all} ]")
    for dag_run in dag_run_list:
        # Prefer compact JSON; fall back to the plain representation when the
        # DAG run is not JSON-serializable. Only the serialization errors are
        # caught, so Ctrl-C and unrelated failures still propagate.
        try:
            dag_run_text = json.dumps(dag_run, separators=(",", ":"))
        except (TypeError, ValueError):
            dag_run_text = f"{dag_run}"
        print(f"\t- {dag_run_text}")
BO ZHANG's avatar
BO ZHANG committed
197

BO ZHANG's avatar
tweaks    
BO ZHANG committed
198
# dump dag_group_run
BO ZHANG's avatar
BO ZHANG committed
199
200
# Resolve the home directory with expanduser() rather than os.getenv("HOME"):
# the latter returns None when HOME is unset, which makes os.path.join raise.
dump_dir = os.path.join(os.path.expanduser("~"), "csst_dag")
# joblib.dump does not create missing parent directories.
os.makedirs(dump_dir, exist_ok=True)
# Keep a local record of this run: the inputs (plan/data basis) together with
# the generated DAG group run and DAG runs, in a file named after the group run.
joblib.dump(
    dict(
        plan_basis=plan_basis,
        data_basis=data_basis,
        dag_group_run=dag_group_run,
        dag_run_list=dag_run_list,
    ),
    os.path.join(
        dump_dir,
        f"{dag_group_run['dag_group_run']}.joblib",
    ),
)
BO ZHANG's avatar
BO ZHANG committed
212
213
# submit DAG group run
if args.submit:
    # Only reached with --submit: pass the group run and its DAG runs to
    # `dfs.dag.new_dag_group_run` and print whatever it returns.
    submission = {
        "dag_group_run": dag_group_run,
        "dag_run_list": dag_run_list,
    }
    res = dfs.dag.new_dag_group_run(**submission)
    print(res)