Gravitational Waves workshop and data challenge by Caltech
Workshop details
Advanced LIGO and Advanced Virgo are now observing the gravitational-wave sky with unprecedented sensitivity.
To date, there have been over 60 potential gravitational-wave transients observed, and planned detector upgrades
are likely to accelerate the pace of discovery in the coming years. This new window on the universe is providing
insights into a range of topics, including compact-object populations, cosmology, and fundamental physics.
LIGO and Virgo strain data from past observing runs, along with data snippets around each discovery and the associated
software libraries, are publicly available at gw-openscience.org. The GW workshop in May 2022 was intended for scientists
and students who wish to learn how to use gravitational-wave data and software to conduct their own research, and it is
the third in a series of workshops that began in 2018. The workshop provided a mixture of lecture-style presentations
and hands-on programming exercises using publicly available gravitational-wave data and specialized software tools.
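As a quick illustration of how that public data can be accessed in Python, here is a minimal sketch using GWpy's fetch_open_data; the detector and GPS interval (the standard 32-second window around GW150914) are illustrative choices, not part of the challenge itself.
from gwpy.timeseries import TimeSeries

# Fetch ~32 s of public LIGO-Hanford strain around GW150914 from GWOSC
# (detector name and GPS times are example values only)
hdata = TimeSeries.fetch_open_data('H1', 1126259446, 1126259478)
plot = hdata.plot(ylabel='Strain')
plot.show()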
As part of the GW workshop organized by Caltech in May 2022, I worked through video lectures on the fundamentals of
gravitational waves and detection techniques, along with tutorials on libraries such as GWPy, PyCBC, and GstLAL. I also
participated in the GW data challenge and solved three challenging problems.
Data Challenge Code
# GW Data challenge 1: Download the challenge set files
from pycbc.frame import read_frame
import urllib.request
import pylab
from pycbc.catalog import Merger
from pycbc.filter import resample_to_delta_t, highpass
from pycbc.filter import matched_filter
from pycbc.psd import interpolate, inverse_spectrum_truncation
import numpy
%matplotlib inline
def get_file(fname):
    url = "https://github.com/aman8533/GravitationalWaves/raw/main/GWChallenge/{}"
    url = url.format(fname)
    urllib.request.urlretrieve(url, fname)
    print('Getting : {}'.format(url))

files = ['challenge1.gwf']
for fname in files:
    get_file(fname)
# An example of how to read the data from these files:
file_name = "challenge1.gwf"
channel_name = "H1:CHALLENGE1"
ts = read_frame(file_name, channel_name)
samplerate = ts.get_sample_rate()
duration = ts.get_duration()
print(ts)
print("Sample Rate of the dataset",samplerate)
print("Duration of the dataset",duration)
strain = highpass(ts, 15.0)
strain = resample_to_delta_t(strain, 1.0/2048)
# Crop the edges corrupted by the highpass filter, then estimate and condition the PSD
conditioned = strain.crop(2, 2)
psd = conditioned.psd(4)
psd = interpolate(psd, conditioned.delta_f)
psd = inverse_spectrum_truncation(psd, int(4 * conditioned.sample_rate), low_frequency_cutoff=15)
# Plot the data in the time domain
tshiftgaussian = 60  # offset added to times when plotting/reporting results
pylab.plot(conditioned.sample_times + tshiftgaussian, conditioned)
pylab.xlabel('Time (s)')
pylab.show()
print("Strain Sampletimes",conditioned.sample_times)
# Whiten the data and plot a q-transform (spectrogram) to try to identify the signal
for data, title in [(conditioned, 'Challenge 1 Data')]:
    t, f, p = data.whiten(4, 4).qtransform(.001, logfsteps=100, qrange=(8, 8), frange=(20, 512))
    pylab.figure(figsize=[15, 3])
    pylab.title(title)
    pylab.pcolormesh(t + tshiftgaussian, f, p**0.5, vmin=1, vmax=6, shading='auto')
    pylab.yscale('log')
    pylab.xlabel('Time (s)')
    pylab.ylabel('Frequency (Hz)')
    pylab.show()
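# Illustrative addition (not in the original notebook): a rough way to read off the
# loudest time-frequency pixel from the last q-transform, assuming p is indexed as
# (frequency, time), consistent with the pcolormesh call above.
jf, it = numpy.unravel_index(p.argmax(), p.shape)
print("Loudest q-transform pixel near t = {:.2f} s, f = {:.1f} Hz".format(t[it] + tshiftgaussian, f[jf]))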
print ("Merger time is observed at:",tshiftgaussian,"seconds")
# GW170814 data
merger = Merger("GW170814")
# Get the data from the Hanford detector
strain = merger.strain('H1')
print("Merger Time of GW170814 is:",merger.time)
# Remove the low frequency content and downsample the data to 2048Hz
strain = highpass(strain, 15.0)
strain = resample_to_delta_t(strain, 1.0/2048)
conditioned = strain.crop(2, 2)
pylab.plot(conditioned.sample_times, conditioned)
pylab.xlabel('Time (s)')
pylab.show()
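# Illustrative addition (not in the original notebook): the same whiten + q-transform
# view applied to the conditioned GW170814 data, zoomed around the catalog merger time.
t, f, p = conditioned.whiten(4, 4).qtransform(.001, logfsteps=100, qrange=(8, 8), frange=(20, 512))
pylab.figure(figsize=[15, 3])
pylab.title('GW170814 (H1)')
pylab.pcolormesh(t, f, p**0.5, vmin=1, vmax=6, shading='auto')
pylab.yscale('log')
pylab.xlim(merger.time - 2, merger.time + 1)
pylab.xlabel('Time (s)')
pylab.ylabel('Frequency (Hz)')
pylab.show()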
# GW Data challenge 2: Download the challenge set files
from pycbc.frame import read_frame
import urllib.request
import pylab
import pycbc
from pycbc.catalog import Merger
from pycbc.filter import resample_to_delta_t, highpass
from pycbc.filter import matched_filter
from pycbc.waveform import get_td_waveform
from pycbc.filter import sigma
from pycbc.psd import interpolate, inverse_spectrum_truncation
from pycbc.types import TimeSeries
import numpy
%matplotlib inline
def get_file(fname):
    url = "https://github.com/aman8533/GravitationalWaves/raw/main/GWChallenge/{}"
    url = url.format(fname)
    urllib.request.urlretrieve(url, fname)
    print('Getting : {}'.format(url))

files = ['challenge2.gwf']
for fname in files:
    get_file(fname)
# An example of how to read the data from these files:
file_name = "challenge2.gwf"
channel_name = "H1:CHALLENGE2"
ts = read_frame(file_name, channel_name)
samplerate = ts.get_sample_rate()
duration = ts.get_duration()
strain = highpass(ts, 20)
strain = resample_to_delta_t(strain, 1.0/2048)
# Crop the edges corrupted by the highpass filter, then estimate the PSD
conditioned = strain.crop(2, 2)
psd = conditioned.psd(4)
# Now that we have the PSD, we need to interpolate it to match our data
# and then limit the filter length of 1 / PSD. After this, we can
# directly use this PSD to filter the data in a controlled manner.
psd = interpolate(psd, conditioned.delta_f)
# 1/PSD will now act as a filter with an effective length of 4 seconds.
# Since the data has been highpassed above 20 Hz and will have low values
# below this frequency, we need to inform the function not to include
# frequencies below this cutoff.
psd = inverse_spectrum_truncation(psd, int(4 * conditioned.sample_rate),
                                  low_frequency_cutoff=20)
print(psd.sample_frequencies)
pylab.plot(psd.sample_frequencies, psd, label="Spectral Data")
pylab.yscale('log')
pylab.xscale('log')
pylab.ylim(1e-47, 1e-41)
pylab.xlim(20, 1024)
pylab.ylabel('$Strain^2 / Hz$')
pylab.xlabel('Frequency (Hz)')
pylab.grid()
pylab.legend()
pylab.show()
#PSD Plotting ends
# Plot the strain data in the time domain
tshiftgaussian = 60  # same display-time offset as used for challenge 1
pylab.plot(conditioned.sample_times + tshiftgaussian, conditioned)
pylab.xlabel('Time (s)')
pylab.show()
# Strain data plotting ends
#Generate waveform with mass m = 30 and spin = 0
m = 30 # Solar masses
hp, hc = get_td_waveform(approximant="SEOBNRv4_opt",
                         mass1=m,
                         mass2=m,
                         delta_t=conditioned.delta_t,
                         f_lower=20)
# Resize the vector to match our data
hp.resize(len(conditioned))
pylab.figure()
pylab.title('Before shifting')
pylab.plot(hp.sample_times, hp)
pylab.xlabel('Time (s)')
pylab.ylabel('Strain')
template = hp.cyclic_time_shift(hp.start_time)
pylab.figure()
pylab.title('After shifting')
pylab.plot(template.sample_times, template)
pylab.xlabel('Time (s)')
pylab.ylabel('Strain')
#Wave form generation ends
# Compute the matched-filter SNR time series
snr = matched_filter(template, conditioned,
                     psd=psd, low_frequency_cutoff=20)
# Remove time corrupted by the template filter and the psd filter
# We remove 4 seconds at the beginning and end for the PSD filtering
# And we remove 4 additional seconds at the beginning to account for
# the template length (this is somewhat generous for
# so short a template). A longer signal, such as one from a BNS, would
# require much more padding at the beginning of the vector.
snr = snr.crop(4 + 4, 4)
# Why are we taking an abs() here?
# The `matched_filter` function actually returns a 'complex' SNR.
# What that means is that the real portion corresponds to the SNR
# associated with directly filtering the template with the data.
# The imaginary portion corresponds to filtering with a template that
# is 90 degrees out of phase. Since the phase of a signal may be
# anything, we choose to maximize over the phase of the signal.
pylab.figure(figsize=[10, 4])
pylab.plot(snr.sample_times, abs(snr))
pylab.ylabel('Signal-to-noise')
pylab.xlabel('Time (s)')
pylab.show()
# Find the SNR peak
peak = abs(snr).numpy().argmax()
snrp = snr[peak]
time = snr.sample_times[peak]
print("We found a signal at {}s with SNR {}".format(time + tshiftgaussian,
                                                    abs(snrp)))
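# Illustrative addition (not in the original notebook): the amplitude and phase of
# the complex SNR peak, which the alignment step below applies when it multiplies
# the template by snrp.
peak_amplitude = abs(snrp)
peak_phase = numpy.angle(snrp)
print("Peak amplitude: {:.2f}, peak phase: {:.2f} rad".format(peak_amplitude, peak_phase))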
# The time, amplitude, and phase of the SNR peak tell us how to align
# our proposed signal with the data.
# Shift the template to the peak time
dt = time - conditioned.start_time
aligned = template.cyclic_time_shift(dt)
# scale the template so that it would have SNR 1 in this data
aligned /= sigma(aligned, psd=psd, low_frequency_cutoff=20.0)
# Scale the template amplitude and phase to the peak value
aligned = (aligned.to_frequencyseries() * snrp).to_timeseries()
aligned.start_time = conditioned.start_time
#Whiten the data
# We do it this way so that we can whiten both the template and the data
white_data = (conditioned.to_frequencyseries() / psd**0.5).to_timeseries()
white_template = (aligned.to_frequencyseries() / psd**0.5).to_timeseries()
white_data = white_data.highpass_fir(30., 512).lowpass_fir(300, 512)
white_template = white_template.highpass_fir(30, 512).lowpass_fir(300, 512)
# Select the time around the merger (slicing uses the data's own time coordinates)
mergertime = time + tshiftgaussian
white_data = white_data.time_slice(time - .2, time + .1)
white_template = white_template.time_slice(time - .2, time + .1)
pylab.figure(figsize=[15, 3])
pylab.plot(white_data.sample_times, white_data, label="Data")
pylab.plot(white_template.sample_times, white_template, label="Template")
pylab.legend()
pylab.show()
subtracted = conditioned - aligned
# Plot the original data and the subtracted signal data
# Whiten the data and plot a q-transform (spectrogram) of the original and signal-subtracted data
for data, title in [(conditioned, 'Original H1 Data'),
                    (subtracted, 'Signal Subtracted from H1 Data')]:
    t, f, p = data.whiten(4, 4).qtransform(.001, logfsteps=100, qrange=(8, 8), frange=(20, 512))
    pylab.figure(figsize=[15, 3])
    pylab.title(title)
    pylab.pcolormesh(t + tshiftgaussian, f, p**0.5, vmin=1, vmax=6, shading='auto')
    pylab.yscale('log')
    pylab.xlabel('Time (s)')
    pylab.ylabel('Frequency (Hz)')
    #pylab.xlim(mergertime - 2, mergertime + 1)
    pylab.show()
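Since the challenge asks which source produced the signal, a natural extension of the code above is to repeat the matched filter over a small grid of template masses and keep the one with the highest peak SNR. The following is a minimal sketch, assuming equal component masses and reusing conditioned and psd from above; the mass range is an arbitrary illustration, not the challenge answer.
best = None
for m in numpy.arange(15, 45, 5):
    # Generate an equal-mass template and condition it exactly as above
    hp, _ = get_td_waveform(approximant="SEOBNRv4_opt",
                            mass1=m, mass2=m,
                            delta_t=conditioned.delta_t, f_lower=20)
    hp.resize(len(conditioned))
    template = hp.cyclic_time_shift(hp.start_time)
    # Matched filter against the conditioned data and record the peak SNR
    snr = matched_filter(template, conditioned, psd=psd, low_frequency_cutoff=20)
    snr = snr.crop(4 + 4, 4)
    peak_snr = abs(snr).max()
    if best is None or peak_snr > best[1]:
        best = (m, peak_snr)
print("Best-fitting equal-mass template: {} solar masses (peak SNR {:.1f})".format(best[0], best[1]))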
Certificate