Remove Climatological Mean Annual Cycle and Detrend Data

This tutorial shows how to use CDAT to remove the climatological mean annual cycle and detrend data - a common procedure applied prior to detailed climate data analysis of monthly anomalies.

The data considered in this notebook are monthly-mean surface air temperatures gridded over the United States and spanning the years 1850 - 1990. The original dataset is complete, but it is artificially modified in this notebook by "masking" some values, yielding an incomplete dataset with some values "missing" (as is often encountered in analysis of climate data). The analysis procedure involves three major steps:

  1. Remove the climatological annual cycle yielding monthly-mean departures.
  2. Spatially average over the domain.
  3. Remove the time-mean and the linear trend.

When there are missing values in the dataset (as in the sample calculations below), the final detrended time-series will depend on the order in which these steps are executed. Here we examine options for detrending the data, and we show that slightly different results are generated depending on the order in which operations are performed. More sophisticated treatments (not discussed here) involving appropriately weighting samples and collections of samples should be considered for datasets that only sparsely cover the time and space domains.

To download this Jupyter Notebook, right click on the link and choose "Download Linked File As..." or "Save Link as...". Remember where you saved the downloaded file, which should have an .ipynb extension. (You'll need to launch the Jupyter notebook or JupyterLab instance from the location where you store the notebook file.)

Table of Contents

  - Prepare Notebook and Data
  - Data Exploration
  - Order of Operations Matters
  - Removing the Climatological Annual Cycle
  - Detrend Data

Prepare Notebook and Data

Back to Top

Download Data

The following CMIP5 NetCDF file contains Near-Surface Air Temperature data in degrees Kelvin (K) over North America. It is downloaded to the directory where this notebook is stored.
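A minimal sketch of the download step. The URL below is a placeholder, not the actual link (which is provided in the original notebook), and the requests library is assumed to be available:

    import requests

    url = 'https://example.com/tas_Amon_sample_NorthAmerica.nc'  # placeholder URL, not the real link
    filename = url.split('/')[-1]

    r = requests.get(url, stream=True)
    with open(filename, 'wb') as f:
        for chunk in r.iter_content(chunk_size=1024 * 1024):
            f.write(chunk)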

Open Data File, Extract Variable

The following two lines of code open the file just downloaded to your local computer (filename), extract data for the Near-Surface Air Temperature (tas), and assign it to the variable data.
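A sketch of those two lines using the cdms2 module:

    import cdms2

    f = cdms2.open(filename)  # open the NetCDF file downloaded above
    data = f('tas')           # extract Near-Surface Air Temperature as a cdms2 variable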

The following line of code uses the .info() method to allow us to take a quick look at the structure of the temperature data stored in the data variable.
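In a notebook cell this is simply:

    data.info()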

There are 1680 different time values, measured as "days since 1850-01-01 00:00:00". The range of the time values is the difference between the last value (51084.5) and the first value (15.5), which equals 51069 days. If we divide this range (51069) by the number of intervals in the dataset (1680-1), we get (51069/(1680-1)) = 30.416 days, which is the average time spacing between data points. This tells us that we are working with monthly data.
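A quick check of that arithmetic from the variable's time axis (a sketch):

    tvals = data.getTime()[:]                         # time values, in days since 1850-01-01
    print((tvals[-1] - tvals[0]) / (len(tvals) - 1))  # (51084.5 - 15.5) / 1679 = ~30.42 days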

The data cover 13 latitude bands and 16 longitude values over the United States (latitudes ~25.6 to ~48.3 and longitudes -123.75 to -67.5).

Data Exploration

Back to Top

First, to get a feel for the data, let's spatially average the data over the entire domain to create a time series of the mean temperature for the region. In creating this time series, the averager function will take the temperature data for the entire region and spatially average it to yield a single temperature value as a function of time (i.e., the latitude and longitude dimensions are removed by this action, as shown with the .shape method.)
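A sketch of that cell (the output name data_ts is an illustrative choice, not fixed by the text):

    import cdutil

    # Area-weighted spatial average over longitude (x) and latitude (y).
    data_ts = cdutil.averager(data, axis='xy', weights=['weighted', 'weighted'], combinewts=1)
    print(data_ts.shape)  # (1680,) -- the latitude and longitude dimensions are gone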

In the cell above, we have specified that averaging over the longitude and latitude dimensions (x and y) should be performed by weighting by grid-cell area. Note that the "combinewts" option should also be included for correct area-weighting.

In the next line of code, let's plot this time series.
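A minimal plotting sketch using matplotlib (the original notebook may use CDAT's vcs canvas instead; asma() converts the cdms2 variable to a numpy masked array):

    import matplotlib.pyplot as plt

    plt.plot(data_ts.getTime()[:], data_ts.asma())
    plt.xlabel('days since 1850-01-01')
    plt.ylabel('tas (K)')
    plt.show()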

The figure above shows that the surface temperature averaged over the U.S. is characterized by a pronounced annual cycle and a long-term trend, with some year-to-year variability. The goal of the remainder of this analysis is to remove both the climatological mean annual cycle and the long-term trend. This procedure leads to a filtered time series of monthly temperature anomalies representing variability that cannot be explained by annual cycle forcing or any long-term changes in climate forcing.

But first, let's look at a numerical example, which illustrates that the order in which you perform operations can make a difference when a dataset is incomplete (i.e., when a dataset includes "masked" or "missing" data).

Order of Operations Matters

Numerical Example

Back to Top

If data are missing from a dataset, the order of operations can matter. The following is a numerical example of averaging values two different ways.

Let's say we have the following dataset, which is a function of X and Y:

        Y1   Y2   Y3   Y4
  X1     3    4    -    7
  X2     -    5    -    -
  X3     1    2    5    5
  X4     -    -    6    4

Creating this dataset as a numpy array, with 999 standing in for the missing values, yields:
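    import numpy as np

    # 999 marks missing values (the array name 'a' is illustrative).
    a = np.array([[  3.,   4., 999.,   7.],
                  [999.,   5., 999., 999.],
                  [  1.,   2.,   5.,   5.],
                  [999., 999.,   6.,   4.]])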

Masking the 999 values leads to the following:
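    masked = np.ma.masked_equal(a, 999)  # mask the 999 placeholders
    print(masked)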

If we average over Y first, then average over X, we get (4.667 + 5.000 + 3.250 + 5.000) / 4 = 4.479

          Y1   Y2   Y3   Y4   Average
  X1       3    4    -    7     4.667
  X2       -    5    -    -     5.000
  X3       1    2    5    5     3.250
  X4       -    -    6    4     5.000
  Average                       4.479

Verifying this with code gives:
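    # Rows are X1..X4 and columns are Y1..Y4, so averaging over Y means axis=1.
    print(masked.mean(axis=1).mean())  # 4.479...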

If we average over X first, then over Y, we get (2.000 + 3.667 + 5.500 + 5.333) / 4 = 4.125

             Y1     Y2     Y3     Y4   Average
  X1          3      4      -      7
  X2          -      5      -      -
  X3          1      2      5      5
  X4          -      -      6      4
  Average  2.000  3.667  5.500  5.333    4.125

Verifying this with code yields:
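    print(masked.mean(axis=0).mean())  # averaging over X first (axis=0): 4.125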

Finally, if we average using all 16 cells at once (but, of course, exclude those with missing data), we get (3 + 4 + 7 + 5 + 1 + 2 + 5 + 5 + 6 + 4) / 10 = 4.200
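In code:

    print(masked.mean())  # one mean over all unmasked cells: 4.2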

We get three different overall means (4.479, 4.125, or 4.200) depending on our processing choices (specifically the order of operations). (Note that with appropriate weighting, which is not done here, a consistent mean can be obtained, independent of the order of operations. From the first example of averaging over Y, then X, since the total number of values in the dataset is 10, the proper weighting would be: 4.667 * 3/10 + 5.000 * 1/10 + 3.250 * 4/10 + 5.000 * 2/10 = 4.200.)

When additional processing steps are involved, ordering can affect results in more complex ways, as in the next example.

Removing the Climatological Annual Cycle

Back to Top

Before detrending a time series, it is often best to filter it by removing the climatological mean annual cycle; in fact, this may be a requirement for particular types of analyses. When a time series does not span a whole (integral) number of years, accurately determining the trend of interest may require first removing the climatological mean annual cycle. To see why, consider a temperature time series starting in January and ending in July a year and a half later (i.e., not an integral number of years). Over Northern Hemisphere continents with a large annual cycle, the ending temperature would be much higher than the beginning temperature simply because of the usual seasonal changes in temperature. A linear fit to the time series would then yield a trend reflecting not a real change in climate but merely the particulars of the time period treated. To avoid such artificial trends, one should first remove the climatological annual cycle.

The surface temperature data considered earlier has no missing data, but more often than not observational datasets are incomplete. For purposes of illustration, we therefore will first modify the original surface temperature dataset by designating certain values as "missing". Specifically, we'll treat as "missing" (i.e., delete or mask) all data values that are within 7 degrees of the maximum temperature (data.max()-7) and store the result in datamskd.
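A sketch of the masking step using cdms2's MV2 masked-array module:

    import MV2

    # Mask every value greater than data.max() - 7 (i.e., within 7 K of the maximum).
    datamskd = MV2.masked_greater(data, data.max() - 7)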

We now consider what order to carry out the two-step operation needed to remove the climatological mean annual cycle:

  1. Remove the climatological annual cycle yielding monthly-mean departures.
  2. Spatially average over the domain.

We examine the two ordering options, with steps performed in the order shown above and then in the reverse order.

Processing Option 1: Remove the annual cycle, then spatially average to create a single time series

Back to Top

First at each location (grid cell) we will remove the climatological mean annual cycle to produce monthly mean departures or anomalies relative to the climatological annual cycle. Then we will spatially average the anomalies to produce a time-series of regional-mean anomalies.

In the next code cell, the cdutil ANNUALCYCLE.departures method calculates the average temperature for each of the 12 calendar months over the complete time period at each location in the input data file, and then determines the departure of each temperature (at each time and location) from this average (i.e., "climatological") monthly value.

For example, once an average January value for the entire dataset has been calculated, that average January value is subtracted from each individual January value to yield a series of January departures, one for each year in the dataset. Since there are 1680 months in the dataset, there are 1680/12 = 140 years of data, and therefore 140 January departures. Since there are likewise 140 Februaries, 140 Marches, and so on, there are 140 departures x 12 months = 1680 departures for each location in the dataset, as the .shape method shows (1680 departure values by 13 latitude bands by 16 longitude values).
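A sketch of that step:

    datamskd_departures = cdutil.ANNUALCYCLE.departures(datamskd)
    print(datamskd_departures.shape)  # (1680, 13, 16)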

Now that we have a time series of monthly departures at each grid cell, we can spatially average them over the entire domain to obtain a single area-weighted time-series for the regional-mean monthly anomalies:
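    datamskd_departures_ts = cdutil.averager(datamskd_departures, axis='xy',
                                             weights=['weighted', 'weighted'], combinewts=1)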

Using the .shape method below verifies that the resulting spatially averaged data no longer have latitude and longitude information.
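    print(datamskd_departures_ts.shape)  # (1680,)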

Let's plot the resulting time series of the departures (i.e. the result of removing the annual cycle before averaging spatially).
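Reusing the matplotlib sketch from above:

    plt.plot(datamskd_departures_ts.getTime()[:], datamskd_departures_ts.asma())
    plt.xlabel('days since 1850-01-01')
    plt.ylabel('tas anomaly (K)')
    plt.show()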

Notice how, with the annual cycle removed, it is easier to see the trend and which months are anomalously warm or cold (compared to the climatological mean temperature).

It should be noted that with the order of operations executed under this option, we cannot expect the mean of the anomalies for a given month of the year, taken over all years, to be exactly zero. In the case considered here, for example, the climatological monthly mean anomalies are:
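    # One way to compute them (a sketch): the climatological mean of the
    # anomalies for each of the 12 calendar months.
    print(cdutil.ANNUALCYCLE.climatology(datamskd_departures_ts))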

Although for any individual cell the anomalies do sum to zero for each month of the year, when the anomalies are spatially averaged and there are missing values this cannot be guaranteed. This is because when there are missing values, the result of averaging sequentially over two dimensions can depend on the order in which the averaging is done, as demonstrated earlier. This means that under Processing Option 1, additional care must be taken in calculating the anomalies. Although applying appropriate weighting during the averaging procedures (over time and over space) can remedy the problem, an easier solution is to remove the mean value (over all years for a given month of the year) from that month's temperature anomaly (datamskd_departures_ts) to obtain anomalies (datamskd_departures_ts_corrected) with means of zero:
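    # A sketch: applying the departures operation a second time removes the
    # residual climatological monthly means from the spatially averaged series.
    datamskd_departures_ts_corrected = cdutil.ANNUALCYCLE.departures(datamskd_departures_ts)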

The time series mean should now be zero (within the limits of machine precision):
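    print(datamskd_departures_ts_corrected.mean())  # ~0, to machine precision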

Numpy calculates an unweighted mean by default, whereas the cdutil averager function calculates a weighted mean by default.

In this case, both the weighted and unweighted means are essentially zero (within the limits of machine precision, as mentioned above), but the following lines of code show that numpy calculates an unweighted mean (which is the same as cdutil.averager with the weights set to "unweighted").
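    print(np.ma.average(datamskd_departures_ts_corrected.asma()))
    print(cdutil.averager(datamskd_departures_ts_corrected, axis='t', weights='unweighted'))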

and cdutil calculates a weighted mean by default:
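    print(cdutil.averager(datamskd_departures_ts_corrected, axis='t'))  # weighted by month length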

In the plot below, the mean shown in the upper left corner is cdutil's weighted mean.

Processing Option 2: Spatially average data to obtain a single time-series, then remove the annual cycle

Back to Top

Now let's reverse the order of performing the operations. We first calculate the spatially-averaged time series and then remove the annual cycle.

We calculate the time series characterizing area-mean temperature for the masked dataset by spatially averaging the temperature values over all latitude and longitude locations to give a single regional temperature time series. (Again, the .shape method shows we are looking at 1680 values with no latitude or longitude, as expected.)
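A sketch (the name datamskd_ts is an illustrative choice):

    datamskd_ts = cdutil.averager(datamskd, axis='xy',
                                  weights=['weighted', 'weighted'], combinewts=1)
    print(datamskd_ts.shape)  # (1680,)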

Let's take a look at this time series. Note that the trend and the annual cycle are similar but not identical to what we saw with the unmasked data. In particular, the maximum value of the spatial mean (considering all times) is lower than before (300.556 now compared to 301.658 for the unmasked data). This is because temperatures at individual grid cells that are within 7 K of the maximum temperature have been eliminated from consideration ("masked").
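For example:

    plt.plot(datamskd_ts.getTime()[:], datamskd_ts.asma())
    plt.show()
    print(datamskd_ts.max(), data_ts.max())  # ~300.556 vs ~301.658 for the unmasked mean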

Next we'll remove the annual cycle using the ANNUALCYCLE.departures method as we did in executing Option 1 above. Again, the method calculates an average temperature value for each month of the year and determines the departure of the temperature at each time value from the average monthly temperature, effectively removing the annual cycle from the data.
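A sketch:

    datamskd_ts_departures = cdutil.ANNUALCYCLE.departures(datamskd_ts)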

The time series mean should be zero (within the limits of machine precision):
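    print(datamskd_ts_departures.mean())  # ~0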

It is difficult to visually detect any difference between the time series produced by Options 1 and 2, so let's plot their difference: datamskd_departures_ts_corrected (remove annual cycle at each grid cell, then spatially average to create a single time series) minus datamskd_ts_departures (spatially average to create a single time series, then remove annual cycle). This is the difference between Processing Option 1 and Option 2.
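A sketch of that difference plot:

    diff = datamskd_departures_ts_corrected - datamskd_ts_departures  # Option 1 minus Option 2
    plt.plot(diff.getTime()[:], diff.asma())
    plt.show()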

The plot above illustrates that the order of operations matters because there are missing data. The two time series are slightly different in some of the warmer (i.e., later) years, where data values may be "missing" because they exceed the temperature threshold (7 degrees cooler than the maximum temperature). If the order of operations did not matter (as in datasets without missing data), the two time series would be identical.

For the case considered above, computing the area mean time-series before removing the climatological annual cycle ("Processing Option 2") can be misleading. Recall that the missing data occur in the warmest part of the domain during the warmest part of the year. When these values are eliminated (i.e. designated as "missing"), we reduce the regional mean (for months with missing data), leading to an artificially cool regional mean for that time of year (i.e., the regional-mean anomaly can become negative solely because the warm temperatures are missing over some of the region during that month). This explains why there are some positive differences in the latter part of the time series. The very small negative differences at other times are simply required to maintain a time mean of zero. Note that if the values were "missing" for a given grid cell every year at the same time of year, then they would not affect the regional mean and would not lead to unrealistic anomalies, but the values are only missing in the later part of the dataset (due to the long-term warming trend).

In contrast, "Processing Option 1" first removes the climatological annual cycle at each grid cell. Now the departures reflect true anomalies from the normal monthly temperature everywhere, and when they are spatially averaged, the result usually better represents the true regional mean anomalies.

Although Option 1 is clearly better in this case, in general, the user must consider the data being analyzed and the purpose for which the analysis is being performed to guide the choice of analysis options.

Detrend Data

Back to Top

We now will apply standard linear regression formulas to compute the slope (a) and intercept (b) of the trend line: T = a*t + b where T = temperature departures (from the climatological annual cycle) and t = time, and then remove the trend from the data.

Consider Two Options

Starting with the modified temperature dataset that includes "missing" values, we will again consider how the order of operations affects the result of removing the trend. Under both options below, the first step is to remove the climatological mean annual cycle from the time series of each grid cell (obtaining datamskd_departures), as was done in the first step performed under Option 1 above. Then we must decide which of the following processing procedures is most appropriate for a particular application:

  Option A: Spatially average the anomaly fields over the domain, then remove the trend from the resulting time-series.
  Option B: Remove the trend at each grid cell, then spatially average the results.

Under Option B, the resulting time-series may include a residual trend (and a residual non-zero mean), so an additional refinement should be applied to obtain a true anomaly field that has been fully detrended and has zero mean.

Processing Option A: Spatially average the anomaly fields over the domain, then remove the trend from the resulting time-series.

We begin by executing all the steps under Option 1 above to obtain datamskd_departures_ts_corrected. Now to detrend this anomaly time series, we must obtain the regression coefficients (slope and intercept) and then subtract the fitted linear trend from the original anomaly time series. We first apply a function to calculate the slope and intercept (with each month given equal weighting in the regression fit):
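    import genutil

    # A sketch: genutil's linearregression returns the least-squares slope and
    # intercept of the series regressed against its time axis.
    slope, intercept = genutil.statistics.linearregression(
        datamskd_departures_ts_corrected, axis='t')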

Now we can remove the trend from datamskd_departures_ts_corrected by subtracting the trend line, after extracting the vector of times constituting the time axis of the data.

First extract the times:
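    times = datamskd_departures_ts_corrected.getTime()[:]  # days since 1850-01-01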

Now remove the trend:
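    # The detrended-series name below is an illustrative choice.
    datamskd_departures_ts_detrended = (datamskd_departures_ts_corrected
                                        - (slope * times + intercept))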

The time series mean should be zero (within the limits of machine precision):
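    print(datamskd_departures_ts_detrended.mean())  # ~0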

Plotting the resulting time series yields:
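    plt.plot(times, datamskd_departures_ts_detrended.asma())
    plt.show()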

Processing Option B: Remove the trend at each grid cell, then spatially average the results.

Back to Top

We now reverse the order of operations performed under Option A. First, for each grid cell we compute the regression coefficients (slopes and intercepts). We then remove the trends at each cell before computing an estimate of the regional mean anomaly time series. Because there is missing data, this time series will generally have a residual trend and non-zero mean, which must be adjusted in a final step to obtain a fully detrended time-series with zero mean.

We calculate the regression coefficients for each grid cell, starting with the data from which the climatological annual cycle has been removed (datamskd_departures) calculated in the first step of Option 1:
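    # Regression at every grid cell; slope and intercept are now 2-D (lat, lon).
    slope2d, intercept2d = genutil.statistics.linearregression(datamskd_departures, axis='t')
    print(slope2d.shape)  # (13, 16)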

Next, for each grid cell we subtract the regression line from the departure time series on which it is based (datamskd_departures) to obtain a detrended time series of anomalies. In general, we cannot simply subtract slope*times + intercept because slope is a function of latitude and longitude, whereas times is a function of time. We can only do element-wise array multiplication if the two arrays are the same shape. Fortunately, genutil has a "grower" function that can replicate elements of an array to fill the dimensions that are missing. We will need to first "grow" the one-dimensional times array, replicating the times across the longitude and latitude dimensions:
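    # A sketch: attach the time axis to the 1-D time values, then grow to 3-D.
    t_axis = datamskd_departures.getTime()
    times_var = MV2.array(t_axis[:])
    times_var.setAxis(0, t_axis)
    times_grown, _ = genutil.grower(times_var, datamskd_departures)
    print(times_grown.shape)  # (1680, 13, 16)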

We apply the same grower function to the two-dimensional slope and intercept arrays to replicate across the time dimension.
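For example:

    slope_grown, _ = genutil.grower(slope2d, datamskd_departures)
    intercept_grown, _ = genutil.grower(intercept2d, datamskd_departures)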

Now we can remove the linear trend (since all arrays share the same three dimensions) to obtain an anomaly time series at each grid cell that has no trend:
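    # The name is an illustrative choice, consistent with
    # datamskd_departures_detrend_ts used below.
    datamskd_departures_detrend = (datamskd_departures
                                   - (slope_grown * times_grown + intercept_grown))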

Next, the averager method can be applied to obtain a spatial mean anomaly time series, completing the steps called for in Processing Option B:
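    datamskd_departures_detrend_ts = cdutil.averager(
        datamskd_departures_detrend, axis='xy',
        weights=['weighted', 'weighted'], combinewts=1)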

Now calculate the time-series mean:
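    print(datamskd_departures_detrend_ts.mean())  # small, but not exactly zero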

The non-zero time mean obtained under Option B is not unexpected, and a correction is needed just as was required in Option 1 discussed earlier. The mean is not zero because the time series at individual cells should not simply be area-weighted to produce an area mean, but should also account for the fraction of time the data are missing in each cell. Similarly, there is a non-zero residual trend in the spatially averaged time-series.

As in the removal of the climatological mean annual cycle, the best way to remedy this would be to appropriately weight values contributing to the area mean, but a simple alternative is to modify the final time series by removing the residual trend and mean. We'll accomplish this by executing the following two steps:

  1. Compute regression coefficients (slope and intercept) of datamskd_departures_detrend_ts
  2. Subtract the regression line from datamskd_departures_detrend_ts.

Step 1. Compute the regression coefficients (slope and intercept) of datamskd_departures_detrend_ts:
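    slope_resid, intercept_resid = genutil.statistics.linearregression(
        datamskd_departures_detrend_ts, axis='t')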

Step 2. Subtract the regression line from datamskd_departures_detrend_ts and store the result in datamskd_departures_detrend_ts_corrected:
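    datamskd_departures_detrend_ts_corrected = (datamskd_departures_detrend_ts
                                                - (slope_resid * times + intercept_resid))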

Now we have the Option B result: a fully detrended time-series with zero mean. The difference between this result and the alternative (Option A) can now be plotted, i.e. Option B - Option A:
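    diff_BA = (datamskd_departures_detrend_ts_corrected
               - datamskd_departures_ts_detrended)  # Option B minus Option A
    plt.plot(times, diff_BA.asma())
    plt.show()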

Although the differences in the time-series produced by Options A & B are mostly much smaller than 0.1 K and an order of magnitude smaller than the anomalies themselves, these differences might nevertheless be important (and could be much larger if larger amounts of data were missing or masked). Which option, then, is to be preferred? The answer is not obvious. Some idealized (and possibly extreme) cases should be analyzed in the context of a particular analysis to determine which might be more appropriate.

One final note: there may be better options for detrending data when the trend differs with time of year. Consider, for example, data with large positive trends in the cooler half of the year and large negative trends during the warmer half of the year, such that the trend considering all months of the year together is zero. Detrending these data following the two approaches above would not modify them at all; the trends in the warm part of the year would remain, as would those in the cold half of the year. If one is interested in the shorter-term interannual variability, one might want to remove these seasonally dependent trends. One might, for example, extract all the Januarys and detrend them, then do the same for each subsequent month. The anomalies could then be reassembled to cover the full time series, with the trends removed in both the warmer and cooler times of year.


Back to Top

The CDAT software was developed by LLNL. This tutorial was written by Charles Doutriaux, Holly Davis, and Karl Taylor. This work was performed under the auspices of the U.S. Department of Energy by Lawrence Livermore National Laboratory under Contract DE-AC52-07NA27344.

If you have questions about this notebook, please email our CDAT Support address, cdat-support@llnl.gov.