From 28f9dbe73134f71f6923e16d848afb617d799bba Mon Sep 17 00:00:00 2001 From: "E. Joshua Rigler" <erigler@usgs.gov> Date: Thu, 26 Sep 2024 18:02:19 -0600 Subject: [PATCH] Fix _post_process() in FDSNFactory The FDSNFactory was not working with input streams that contained multiple segments. This was because FDSNFactory wasn't doing the full "_post_process" like, for example, EdgeFactory. More specifically, FDSNFactory's `_post_process()` method did not convert masked arrays (which is how obspy prefers to deal with gappy data) into regular numpy arrays with NaNs for missing data, as expected in all geomag-algorithms code. This became quickly obvious once some of the less stable ASL variometers were processed, like US-EYMN. This fix should allow us to now pull and plot EYMN, DGMT, and other stations that were not working with the previous release of FDSNFactory. --- geomagio/edge/FDSNFactory.py | 25 ++++++++++++++++--------- 1 file changed, 16 insertions(+), 9 deletions(-) diff --git a/geomagio/edge/FDSNFactory.py b/geomagio/edge/FDSNFactory.py index b4109d4d..c1112c92 100644 --- a/geomagio/edge/FDSNFactory.py +++ b/geomagio/edge/FDSNFactory.py @@ -285,11 +285,6 @@ class FDSNFactory(TimeseriesFactory): if data.count() == 0: return data - if data.count() != 0: - TimeseriesUtility.pad_and_trim_trace( - trace=data[0], starttime=starttime, endtime=endtime - ) - self._set_metadata(data, observatory, channel, type, interval) return data @@ -302,10 +297,12 @@ class FDSNFactory(TimeseriesFactory): channels: List[str], ): """Post process a timeseries stream after the raw data is - is fetched from querymom. Specifically changes - any MaskedArray to a ndarray with nans representing gaps. - Then calls pad_timeseries to deal with gaps at the - beggining or end of the streams. + is fetched from FDSN client. Specifically: + - adds USGS provisional data disclaimer + - changes any MaskedArray to ndarray with nans as gaps + - converts arcminutes to radians for any "D" channels + - calls pad_timeseries to deal with gaps at the + beggining or end of the streams. Parameters ---------- @@ -335,6 +332,16 @@ class FDSNFactory(TimeseriesFactory): if not any("DISCLAIMER" in comment for comment in trace.stats.comments): trace.stats.comments.extend(disclaimer_texts) + if isinstance(trace.data, numpy.ma.MaskedArray): + trace.data.set_fill_value(numpy.nan) + trace.data = trace.data.filled() + + if "D" in channels: + for trace in timeseries.select(channel="D"): + trace.data = ChannelConverter.get_radians_from_minutes(trace.data) + + TimeseriesUtility.pad_timeseries(timeseries, starttime, endtime) + def _set_metadata( self, stream: Stream, -- GitLab