cta-observatory · morcuended · Mar 30, 2022 · Mar 12, 2022 · Mar 14, 2022 · Mar 29, 2022
diff --git a/osa/scripts/gain_selection.py b/osa/scripts/gain_selection.py
@@ -0,0 +1,120 @@
+"""Script to run the gain selection over a list of dates."""
+import fileinput
+import logging
+import re
+import subprocess as sp
+from pathlib import Path
+from textwrap import dedent
+
+import click
+from astropy.table import Table
+from lstchain.paths import run_info_from_filename
+
+from osa.scripts.reprocessing import get_list_of_dates
+from osa.utils.logging import myLogger
+
+log = myLogger(logging.getLogger(__name__))
+
+PATH = "PATH=/fefs/aswg/software/gain_selection/bin:$PATH"
+
+
+def get_sbatch_script(
+        run_id,
+        subrun,
+        input_file,
+        output_dir,
+        log_dir,
+        ref_time,
+        ref_counter,
+        module,
+        ref_source
+):
+    return dedent(f"""\
+    #!/bin/bash
+
+    #SBATCH -D {log_dir}
+    #SBATCH -o "gain_selection_{run_id:05d}_{subrun:04d}_%j.log"
+    #SBATCH --job-name "gain_selection_{run_id:05d}"
+    #SBATCH --export {PATH} 
+
+    lst_select_gain {input_file} {output_dir} {ref_time} {ref_counter} {module} {ref_source}
+    """)
+
+
+def apply_gain_selection(date: str, output_basedir: Path = None):
+    run_summary_dir = Path("/fefs/aswg/data/real/monitoring/RunSummary")
+    run_summary_file = run_summary_dir / f"RunSummary_{date}.ecsv"
+    summary_table = Table.read(run_summary_file)
+    # Apply gain selection only to DATA runs
+    summary_table = summary_table[summary_table['run_type'] == 'DATA']
+
+    output_dir = output_basedir / date
+    log_dir = output_basedir / "log"
+    output_dir.mkdir(parents=True, exist_ok=True)
+    log_dir.mkdir(parents=True, exist_ok=True)
+
+    for run in summary_table:
+        run_id = run["run_id"]
+        ref_time = run["dragon_reference_time"]
+        ref_counter = run["dragon_reference_counter"]
+        module = run["dragon_reference_module_index"]
+        ref_source = run["dragon_reference_source"].upper()
+
+        r0_dir = Path(f"/fefs/aswg/data/real/R0/{date}")
+        input_files = r0_dir.glob(f"LST-1.1.Run{run_id:05d}.????.fits.fz")
+
+        for file in input_files:
+            run_info = run_info_from_filename(file)
+            job_file = log_dir / f"gain_selection_{run_info.run:05d}.{run_info.subrun:04d}.sh"
+            with open(job_file, "w") as f:
+                f.write(get_sbatch_script(
+                    run_id,
+                    run_info.subrun,
+                    file,
+                    output_dir,
+                    log_dir,
+                    ref_time,
+                    ref_counter,
+                    module,
+                    ref_source
+                ))
+            sp.run(["sbatch", job_file], check=True)
+
+
+def check_failed_jobs(output_basedir: Path = None):
+    failed_jobs = []
+    log_dir = output_basedir / "log"
+    filenames = log_dir.glob('gain_selection*.log')
+
+    for line in fileinput.input(filenames):
+        if re.search('FAILED', line):
+            job_id = fileinput.filename()[-12:-4]
+            failed_jobs.append(job_id)
+
+    if len(failed_jobs) != 0:    
+        log.info(f'The following jobs failed: {failed_jobs}')
+
+
+@click.command()
+@click.argument('dates-file', type=click.Path(exists=True, path_type=Path))
+@click.argument('output-basedir', type=click.Path(path_type=Path))
+def main(dates_file: Path, output_basedir: Path):
+    """
+    Loop over the dates listed in the input file and launch the gain selection
+    script for each of them. The input file should list the dates in the format
+    YYYYMMDD one date per line.
+    """
+    log.setLevel(logging.DEBUG)
+
+    list_of_dates = get_list_of_dates(dates_file)
+
+    for date in list_of_dates:
+        apply_gain_selection(date, output_basedir)
+
+    log.info("Done! No more dates to process.")
+
+    check_failed_jobs(output_basedir)
+
+
+if __name__ == "__main__":
+    main()