Skip to content

Commit

Permalink
Introducing syntax for vetoing injections in PyGRB and final version …
Browse files Browse the repository at this point in the history
…of `pycbc_pygrb_plot_null_stats` (gwastro#4947)

* Introducing a (mute) apply_vetoes_to_found_injs function in PyGRB

* Version of pycbc_pygrb_plot_null_stats with vetoes (albeit with a mute apply_vetoes_to_found_injs for the time being)

* Small cleanup

* Addresing typos

* Update bin/pygrb/pycbc_pygrb_plot_null_stats

---------

Co-authored-by: Marco Cusinato <[email protected]>
  • Loading branch information
2 people authored and prayush committed Nov 21, 2024
1 parent 263cd2c commit b5483fc
Show file tree
Hide file tree
Showing 2 changed files with 114 additions and 74 deletions.
141 changes: 67 additions & 74 deletions bin/pygrb/pycbc_pygrb_plot_null_stats
Original file line number Diff line number Diff line change
Expand Up @@ -46,55 +46,6 @@ __program__ = "pycbc_pygrb_plot_null_stats"
# =============================================================================
# Functions
# =============================================================================
# Function to load trigger data
def load_data(input_file, ifos, vetoes, opts, injections=False, slide_id=None):
"""Load data from a trigger/injection file"""

null_stat_type = opts.y_variable

# Initialize the dictionary
data = {}
data['coherent'] = None
data[null_stat_type] = None

if input_file:
if injections:
logging.info("Loading injections...")
# This will eventually become ppu.load_injections()
trigs_or_injs = \
ppu.load_triggers(input_file, ifos, vetoes,
rw_snr_threshold=opts.newsnr_threshold,
slide_id=slide_id)
else:
logging.info("Loading triggers...")
trigs_or_injs = \
ppu.load_triggers(input_file, ifos, vetoes,
rw_snr_threshold=opts.newsnr_threshold,
slide_id=slide_id)

# Coherent SNR is always used
data['coherent'] = trigs_or_injs['network/coherent_snr']

# The other SNR may vary
if null_stat_type == 'null':
data[null_stat_type] = \
trigs_or_injs['network/%s_snr' % null_stat_type][:]
elif null_stat_type == 'single':
key = opts.ifo + '/snr'
data[null_stat_type] = trigs_or_injs[key][:]
elif null_stat_type == 'coincident':
data[null_stat_type] = ppu.get_coinc_snr(trigs_or_injs)

# Count surviving points
num_trigs_or_injs = len(trigs_or_injs['network/reweighted_snr'])
if injections:
logging.info("%d injections found.", num_trigs_or_injs)
else:
logging.info("%d triggers found.", num_trigs_or_injs)

return data


# Function that produces the contrours to be plotted
def calculate_contours(opts, new_snrs=None):
"""Generate the contours to plot"""
Expand Down Expand Up @@ -153,20 +104,19 @@ trig_file = os.path.abspath(opts.trig_file)
found_missed_file = os.path.abspath(opts.found_missed_file)\
if opts.found_missed_file else None
zoom_in = opts.zoom_in
null_stat_type = opts.y_variable

# Prepare plot title and caption
y_labels = {'null': "Null SNR",
'coincident': "Coincident SNR"} # TODO: overwhitened
if opts.plot_title is None:
opts.plot_title = y_labels[null_stat_type] + " vs Coherent SNR"
opts.plot_title = y_labels[opts.y_variable] + " vs Coherent SNR"
if opts.plot_caption is None:
opts.plot_caption = ("Blue crosses: background triggers. ")
if found_missed_file:
opts.plot_caption = opts.plot_caption +\
("Red crosses: injections triggers. ")

if null_stat_type == 'coincident':
if opts.y_variable == 'coincident':
opts.plot_caption += ("Green line: coincident SNR = coherent SNR.")
else:
opts.plot_caption = opts.plot_caption +\
Expand All @@ -181,30 +131,76 @@ outdir = os.path.split(os.path.abspath(opts.output_file))[0]
if not os.path.isdir(outdir):
os.makedirs(outdir)

# Extract IFOs and vetoes
ifos, vetoes = ppu.extract_ifos_and_vetoes(trig_file, opts.veto_files,
opts.veto_category)

# Extract trigger data
trig_data = load_data(trig_file, ifos, vetoes, opts,
slide_id=opts.slide_id)

# Extract (or initialize) injection data
inj_data = load_data(found_missed_file, ifos, vetoes, opts,
injections=True, slide_id=0)
# Extract IFOs
ifos = ppu.extract_ifos(trig_file)

# Generate time-slides dictionary
slide_dict = ppu.load_time_slides(trig_file)

# We will be looping over slide_dict below so here we reduce it if possible
if opts.slide_id is not None:
for key in list(slide_dict.keys()):
if key != opts.slide_id:
slide_dict.pop(key, None)

# Generate segments dictionary
segment_dict = ppu.load_segment_dict(trig_file)

# Construct trials removing vetoed times
trial_dict, total_trials = ppu.construct_trials(
opts.seg_files,
segment_dict,
ifos,
slide_dict,
opts.veto_file
)

# Load triggers/injections (apply reweighted SNR cut, not vetoes)
trig_data = ppu.load_data(trig_file, ifos, data_tag='trigs',
rw_snr_threshold=opts.newsnr_threshold,
slide_id=opts.slide_id)
inj_data = ppu.load_data(found_missed_file, ifos, data_tag='injs',
rw_snr_threshold=opts.newsnr_threshold,
slide_id=0)

# Extract needed trigger properties and store them as dictionaries
# Based on trial_dict: if vetoes were applied, trig_* are the veto survivors
# Coherent SNR is always used
x_key = 'network/coherent_snr'
# The other SNR may vary
y_key = 'network/' + opts.y_variable + '_snr'
found_trigs_slides = ppu.extract_trig_properties(
trial_dict,
trig_data,
slide_dict,
segment_dict,
[x_key, y_key]
)
found_trigs = {}
for key in [x_key, y_key]:
found_trigs[key] = numpy.concatenate(
[found_trigs_slides[key][slide_id][:] for slide_id in slide_dict]
)

# Gather injections found surviving vetoes
found_injs, *_ = ppu.apply_vetoes_to_found_injs(
found_missed_file,
inj_data,
ifos,
veto_file=opts.veto_file,
keys=[x_key, y_key]
)

# Generate plots
logging.info("Plotting...")

# Contours
cont_colors = ['g-']
snr_vals = None
cont_colors = None
shade_cont_value = None
x_max = None
# Coincident SNR plot case: we want a coinc=coh diagonal line on the plot
if null_stat_type == 'coincident':
cont_colors = ['g-']
x_max = plu.axis_max_value(trig_data['coherent'], inj_data['coherent'],
if y_key == 'network/coincident_snr':
x_max = plu.axis_max_value(found_trigs[x_key], found_injs[x_key],
found_missed_file)
snr_vals = [4, x_max]
null_stat_conts = [[4, x_max]]
Expand All @@ -226,12 +222,9 @@ if not opts.y_lims and zoom_in:
opts.y_lims = '0,30'
# Get rcParams
rc('font', size=14)
# Set color for out-of-range values
# Determine y-axis values of triggers and injections
y_label = y_labels[null_stat_type]
trigs = [trig_data['coherent'], trig_data[null_stat_type]]
injs = [inj_data['coherent'], inj_data[null_stat_type]]
plu.pygrb_plotter(trigs, injs, "Coherent SNR", y_label, opts,
plu.pygrb_plotter([found_trigs[x_key], found_trigs[y_key]],
[found_injs[x_key], found_injs[y_key]],
"Coherent SNR", y_labels[opts.y_variable], opts,
snr_vals=snr_vals, conts=null_stat_conts,
shade_cont_value=shade_cont_value,
colors=cont_colors, vert_spike=True,
Expand Down
47 changes: 47 additions & 0 deletions pycbc/results/pygrb_postprocessing_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -368,6 +368,53 @@ def load_data(input_file, ifos, rw_snr_threshold=None, data_tag=None,
return trigs_dict


# =============================================================================
# Function to apply vetoes to found injections
# =============================================================================
def apply_vetoes_to_found_injs(found_missed_file, found_injs, ifos,
veto_file=None, keys=None):
"""Separate injections surviving vetoes from vetoed injections.
THIS IS ESSENTIALLY AN EMPTY PLACE HOLDER AT THE MOMENT: IT RETURNS
THE INJECTIONS GIVEN IN INPUT, WITHOUT APPLYING VETOES.
Parameters
----------
found_missed_file: injections results File
found_injs: dictionary of found injections
ifos: list of interferometers to use in vetoing
veto_file: vetoed segments File (optional)
keys: list of desired dataset names (optional)
Return
------
found_after_vetoes: dictionary of injections surviving vetoes
missed_after_vetoes: dictionary of vetoed injections
found_idx: numpy.array of indices of surviving injections
veto_idx: numpy.array of indices of vetoed injections
"""

keep_keys = keys if keys else found_injs.keys()

if not found_missed_file:
return (dict.fromkeys(keep_keys, numpy.array([])),
dict.fromkeys(keep_keys, numpy.array([])),
None, None)

found_after_vetoes = found_injs
missed_after_vetoes = dict.fromkeys(keep_keys, numpy.array([]))
found_idx = numpy.arange(len(found_injs[ifos[0]+'/end_time'][:]))
veto_idx = numpy.array([], dtype=numpy.int64)

return found_after_vetoes, missed_after_vetoes, found_idx, veto_idx


# =============================================================================
# Detector utils:
# * Function to calculate the antenna response F+^2 + Fx^2
Expand Down

0 comments on commit b5483fc

Please sign in to comment.