Source code for template_gen

#!/usr/bin/python
r"""Function to generate template waveforms and information to go with them\
for the application of cross-correlation of seismic data for the detection of\
 repeating events.

Part of the EQcorrscan module to read nordic format s-files\
EQcorrscan is a python module designed to run match filter routines for\
seismology, within it are routines for integration to seisan and obspy.\
With obspy integration (which is necessary) all main waveform formats can be\
read in and output.

This main section contains a script, LFE_search.py which demonstrates the\
usage of the built in functions from template generation from picked waveforms\
through detection by match filter of continuous data to the generation of lag\
times to be used for relative locations.

The match-filter routine described here was used a previous Matlab code for\
the Chamberlain et al. 2014 G-cubed publication.  The basis for the lag-time\
generation section is outlined in Hardebeck & Shelly 2011, GRL.

Code generated by Calum John Chamberlain of Victoria University of Wellington,\
2015.


.. rubric:: Note
Pre-requisites:
    - gcc             - for the installation of the openCV correlation routine
    - python-cv2      - Python bindings for the openCV routines
    - python-joblib   - used for parallel processing
    - python-obspy    - used for lots of common seismological processing
                        - requires:
                            - numpy
                            - scipy
                            - matplotlib
    - NonLinLoc       - used outside of all codes for travel-time generation

Copyright 2015 Calum Chamberlain

This file is part of EQcorrscan.

    EQcorrscan is free software: you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    EQcorrscan is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with EQcorrscan.  If not, see <http://www.gnu.org/licenses/>.

"""


[docs]def from_sfile(sfile, lowcut, highcut, samp_rate, filt_order, length, swin, debug=0): r"""Function to read in picks from sfile then generate the template from the picks within this and the wavefile found in the pick file. :type sfile: string :param sfile: sfilename must be the\ path to a seisan nordic type s-file containing waveform and pick\ information. :type lowcut: float :param lowcut: Low cut (Hz), if set to None will look in template\ defaults file :type highcut: float :param lowcut: High cut (Hz), if set to None will look in template\ defaults file :type samp_rate: float :param samp_rate: New sampling rate in Hz, if set to None will look in\ template defaults file :type filt_order: int :param filt_order: Filter level, if set to None will look in\ template defaults file :type swin: str :param swin: Either 'all', 'P' or 'S', to select which phases to output. :type length: float :param length: Extract length in seconds, if None will look in template\ defaults file. :type debug: int :param debug: Debug level, higher number=more output. """ # Perform some checks first import os if not os.path.isfile(sfile): raise IOError('sfile does not exist') from eqcorrscan.utils import pre_processing from eqcorrscan.utils import Sfile_util from obspy import read as obsread # Read in the header of the sfile wavefiles = Sfile_util.readwavename(sfile) pathparts = sfile.split('/')[0:-1] for part in pathparts: if part == 'REA': part = 'WAV' wavpath = os.path.join(pathparts) # Read in waveform file for wavefile in wavefiles: print ''.join(["I am going to read waveform data from: ", wavpath, wavefile]) if 'st' not in locals(): st = obsread(wavpath + wavefile) else: st += obsread(wavpath + wavefile) for tr in st: if tr.stats.sampling_rate < samp_rate: print 'Sampling rate of data is lower than sampling rate asked for' print 'Not good practice for correlations: I will not do this' raise ValueError("Trace: " + tr.stats.station + " sampling rate: " + str(tr.stats.sampling_rate)) # Read in pick info picks = Sfile_util.readpicks(sfile) print "I have found the following picks" for pick in picks: print ' '.join([pick.station, pick.channel, pick.phase, str(pick.time)]) # Process waveform data st = pre_processing.shortproc(st, lowcut, highcut, filt_order, samp_rate, debug) st1 = _template_gen(picks, st, length, swin) return st1
[docs]def from_contbase(sfile, contbase_list, lowcut, highcut, samp_rate, filt_order, length, prepick, swin, debug=0): r"""Function to read in picks from sfile then generate the template from\ the picks within this and the wavefiles from the continous database of\ day-long files. Included is a section to sanity check that the files are\ daylong and that they start at the start of the day. You should ensure\ this is the case otherwise this may alter your data if your data are\ daylong but the headers are incorrectly set. :type sfile: string :param sfile: sfilename must be the path to a seisan nordic type s-file \ containing waveform and pick information, all other arguments can \ be numbers save for swin which must be either P, S or all \ (case-sensitive). :type contbase_list: List of tuple of string :param contbase_list: List of tuples of the form\ ['path', 'type', 'network']. Where path is the path to the continuous\ database, type is the directory structure, which can be either\ Yyyyy/Rjjj.01, which is the standard IRIS Year, julian day structure, or,\ yyyymmdd which is a single directory for every day. :type lowcut: float :param lowcut: Low cut (Hz), if set to None will look in template\ defaults file :type highcut: float :param lowcut: High cut (Hz), if set to None will look in template\ defaults file :type samp_rate: float :param samp_rate: New sampling rate in Hz, if set to None will look in\ template defaults file :type filt_order: int :param filt_order: Filter level, if set to None will look in\ template defaults file :type length: float :param length: Extract length in seconds, if None will look in template\ defaults file. :type prepick: float :param prepick: Pre-pick time in seconds :type swin: str :param swin: Either 'all', 'P' or 'S', to select which phases to output. :type debug: int :param debug: Level of debugging output, higher=more """ # Perform some checks first import os if not os.path.isfile(sfile): raise IOError('sfile does not exist') # import some things from eqcorrscan.utils import pre_processing from eqcorrscan.utils import Sfile_util import glob from obspy import UTCDateTime from obspy import read as obsread # Read in the header of the sfile header = Sfile_util.readheader(sfile) day = UTCDateTime('-'.join([str(header.time.year), str(header.time.month).zfill(2), str(header.time.day).zfill(2)])) # Read in pick info picks = Sfile_util.readpicks(sfile) print "I have found the following picks" pick_chans = [] used_picks = [] for pick in picks: if pick.station + pick.channel not in pick_chans\ and pick.phase in ['P', 'S']: pick_chans.append(pick.station + pick.channel) used_picks.append(pick) print pick for contbase in contbase_list: if contbase[1] == 'yyyy/mm/dd': daydir = os.path.join([str(day.year), str(day.month).zfill(2), str(day.day).zfill(2)]) elif contbase[1] == 'Yyyyy/Rjjj.01': daydir = os.path.join(['Y' + str(day.year), 'R' + str(day.julday).zfill(3) + '.01']) elif contbase[1] == 'yyyymmdd': daydir = day.datetime.strftime('%Y%m%d') if 'wavefiles' not in locals(): wavefiles = (glob.glob(os.path.join([contbase[0], daydir, '*' + pick.station + '.*']))) else: wavefiles += glob.glob(os.path.join([contbase[0], daydir, '*' + pick.station + '.*'])) elif pick.phase in ['P', 'S']: print ' '.join(['Duplicate pick', pick.station, pick.channel, pick.phase, str(pick.time)]) elif pick.phase == 'IAML': print ' '.join(['Amplitude pick', pick.station, pick.channel, pick.phase, str(pick.time)]) picks = used_picks wavefiles = list(set(wavefiles)) # Read in waveform file wavefiles.sort() for wavefile in wavefiles: print "I am going to read waveform data from: " + wavefile if 'st' not in locals(): st = obsread(wavefile) else: st += obsread(wavefile) # Porcess waveform data st.merge(fill_value='interpolate') for tr in st: tr = pre_processing.dayproc(tr, lowcut, highcut, filt_order, samp_rate, debug, day) # Cut and extract the templates st1 = _template_gen(picks, st, length, swin, prepick=prepick) return st1
[docs]def _template_gen(picks, st, length, swin, prepick=0.05, plot=False): r"""Function to generate a cut template in the obspy\ Stream class from a given set of picks and data, also in an obspy stream\ class. Should be given pre-processed data (downsampled and filtered) :type picks: :class: 'makesfile.pick' :param picks: Picks to extract data around :type st: :class: 'obspy.Stream' :param st: Stream to etract templates from :type length: float :param length: Length of template in seconds :type swin: string :param swin: P, S or all :type prepick: float :param prepick: Length in seconds to extract before the pick time\ default is 0.05 seconds :type plot: bool :param plot: To plot the template or not, default is True """ import copy from eqcorrscan.utils.EQcorrscan_plotting import pretty_template_plot as tplot from obspy import Stream import warnings stations = [] channels = [] st_stachans = [] for pick in picks: stations.append(pick.station) channels.append(pick.channel) for tr in st: st_stachans.append('.'.join([tr.stats.station, tr.stats.channel])) for i in xrange(len(stations)): if not '.'.join([stations[i], channels[i]]) in st_stachans: warnings.warn('No data provided for ' + stations[i] + '.' + channels[i]) # Select which channels we actually have picks for for tr in st: if tr.stats.station in stations: if swin == 'all': if len(tr.stats.channel) == 3: temp_channel = tr.stats.channel[0] + tr.stats.channel[2] elif len(tr.stats.channel) == 2: temp_channel = tr.stats.channel # if temp_channel in channels: tr.stats.channel = temp_channel if 'st1' not in locals(): st1 = Stream(tr) else: st1 += tr else: if 'st1' not in locals(): st1 = Stream(tr) else: st1 += tr st = copy.deepcopy(st1) del st1 if plot: stplot = st.copy() # Cut the data for tr in st: if 'starttime' in locals(): del starttime if swin == 'all': for pick in picks: if pick.station == tr.stats.station and \ pick.channel == tr.stats.channel and\ pick.phase == 'P': starttime = pick.time - prepick elif pick.station == tr.stats.station and\ tr.stats.channel[-1] in ['1', '2', 'N', 'E'] and\ pick.phase == 'S': starttime = pick.time - prepick else: for pick in picks: if pick.station == tr.stats.station and pick.phase == swin: starttime = pick.time - prepick if 'starttime' in locals(): print "Cutting " + tr.stats.station + '.' + tr.stats.channel tr.trim(starttime=starttime, endtime=starttime + length, nearest_sample=False) print tr.stats.starttime print tr.stats.endtime if 'st1' not in locals(): st1 = Stream(tr) else: st1 += tr else: print 'No pick for ' + tr.stats.station + '.' + tr.stats.channel # Ensure that the template is the correct length if len(tr.data) == (tr.stats.sampling_rate * length) + 1: tr.data = tr.data[0:-1] if plot: background = stplot.trim(st1.sort(['starttime'])[0].stats.starttime - 10, st1.sort(['starttime'])[-1].stats.endtime + 10) tplot(st1, background=background) del stplot del st # st1.plot(size=(800,600)) return st1
[docs]def extract_from_stack(stack, template, length, pre_pick, pre_pad, Z_include=False, pre_processed=True, samp_rate=False, lowcut=False, highcut=False, filt_order=False): r"""Function to extract a new template from a stack of previous detections. Requires the stack, the template used to make the detections for the stack, and we need to know if the stack has been pre-processed. :type stack: :class:obspy.Stream :param stack: Waveform stack from detections. Can be of any length and\ can have delays already included, or not. :type template: :class:obspy.Stream :param template: Template used to make the detections in the stack. Will\ use the delays of this for the new template. :type length: float :param length: Length of new template in seconds :type pre_pick: float :param pre_pick: Extract additional data before the detection, seconds :type pre_pad: float :param pre_pad: Pad used in seconds when extracting the data, e.g. the\ time before the detection extracted. If using\ clustering.extract_detections this half the length of the extracted\ waveform. :type Z_include: bool :param Z_include: If True will include any Z-channels even if there is\ no template for this channel, as long as there is a template for this\ station at a different channel. If this is False and Z channels are\ included in the template Z channels will be included in the new_template\ anyway. :type pre_processed: bool :param pre_processed: Have the data been pre-processed, if True (default)\ then we will only cut the data here. :type samp_rate: float :param samp_rate: If pre_processed=False then this is required, desired\ sampling rate in Hz, defaults to False. :type lowcut: float :param lowcut: If pre_processed=False then this is required, lowcut in Hz,\ defaults to False :type highcut: float :param highcut: If pre_processed=False then this is required, highcut in\ Hz, defaults to False :type filt_order: int :param filt_order: If pre_processed=False then this is required, filter\ order, defaults to False :returns: :class:obspy.Stream Newly cut template """ from eqcorrscan.utils import pre_processing import warnings new_template = stack.copy() # Copy the data before we trim it to keep the stack safe # Get the earliest time in the template as this is when the detection is # taken. mintime = min([tr.stats.starttime for tr in template]) # Generate a list of tuples of (station, channel, delay) with delay in # seconds delays = [(tr.stats.station, tr.stats.channel[-1], mintime - tr.stats.starttime) for tr in template] # Loop through the stack and trim! for tr in new_template: # Process the data if necessary if not pre_processed: new_template = pre_processing.shortproc(new_template, lowcut, highcut, filt_order, samp_rate, 0) # Find the matching delay delay = [d[2] for d in delays if d[0] == tr.stats.station and d[1] == tr.stats.channel[-1]] if Z_include and len(delay) == 0: delay = [d[2] for d in delays if d[0] == tr.stats.station] if len(delay) == 0: msg = ' '.join(['No matching template channel found for stack', 'channel', tr.stats.station, tr.stats.channel]) warnings.warn(msg) new_template.remove(tr) elif len(delay) > 1: msg = ' '.join(['Multiple delays found for stack channel', tr.stats.station, tr.stats.channel]) warnings.warn(msg) else: tr.trim(starttime=tr.stats.starttime + delay[0] + pre_pad - pre_pick, endtime=tr.stats.starttime + delay[0] + pre_pad + length - pre_pick) return new_template
if __name__ == '__main__': import sys if len(sys.argv) != 2: raise IOError('Requires 1 arguments: sfilename') sfile = str(sys.argv[1]) template = from_sfile(sfile) template.write(sfile + '_template.ms', format="MSEED")