Versions Compared

Key

  • This line was added.
  • This line was removed.
  • Formatting was changed.

This knowledge base article shows you how to calculate daily total precipitation using ERA-Interim data. If you just want monthly means, then you can simply download it from http://apps.ecmwf.int/datasets/data/interim-mdfa/levtype=sfc/.ERA5 data.

Before you continue, make sure you read through knowledge base articles listed below:

You are also supposed to know how to work with Python under Linux, in particular, how to install packages using pip. You are recommended to use the latest release of packages listed here:

  • ECMWF WebAPI CDS API (tested with 0.1.5.01) - required for step 1
  • netCDF4 (tested with 1.4.0) - required for step 2
  • numpy (tested with 1.14.5) - required for step 2

...

  1. Use script below to download daily total precipitation ERA-Interim ERA5 data for 1st and 2nd January 20182017. This script will download total precipitation from two forecasts at 00 UTC and 12 UTC, both at step 12. This will give you 24 hours coverage.
    CDS (Climate Data Store). Notice to cover 1st January 2017, we need two days of data.
    1. 1st January 2017 time = 01 - 23  will give you total precipitation data to cover 00 - 23 UTC for 1st January 2017
    2. 2nd January 2017 time = 00 will give you total precipitation data to cover 23 - 24 UTC for 1st January 2017
    3. Time 00 UTC and step 12 will give you 00 - 12 UTC total precipitation data
    4. Time 12 UTC and step 12 will give you 12 - 24 UTC total precipitation data
    Code Block
    languagepy
    #!/usr/bin/env python
    """
    Save as get-tp.py, then run "python get-tp.py".
     
    Input file : None
    Output file: tp_2018010120170101-20170102.nc
    """
    from ecmwfapi import ECMWFDataServercdsapi
    
    serverc = ECMWFDataServercdsapi.Client()
    serverr = c.retrieve(
        'reanalysis-era5-single-levels', {
               "class" 'variable'    : "ei"'total_precipitation',
        "dataset": "interim",
        "date"        'product_type': 'reanalysis',
                'year'        : "2018-01-01"'2017',
        "expver"        'month'       : "1"'01',
         "grid"       'day'         : "0.75/0.75",
     ['01', '02'],
                'time'     "levtype": "sfc",
       : [
                    '00:00','01:00','02:00',
                  "param"  '03:00','04: "228.128"00','05:00',
                    '06:00','07:00','08:00',
        "step"            '09:00','10:00','11: "12",
        "stream" : "oper",
        "time"   : "00:00:00/12:00:00",
        "type"   : "fc",
        "format" : "netcdf",
        "target" : "tp_20180101.nc",
    }00',
                    '12:00','13:00','14:00',
                    '15:00','16:00','17:00',
                    '18:00','19:00','20:00',
                    '21:00','22:00','23:00'
                ],
                'format'      : 'netcdf'
        })
    r.download('tp_20170101-20170102.nc')


  2. Run a second script to calculate daily total precipitation. All it does is to add up the two 24 values for 00 - 12 UTC and 12 - 24 UTC for a given day as describe in step 1.

    Code Block
    languagepy
    #!/usr/bin/env python
    """
    Save as file calculate-daily-tp.py and run "python calculate-daily-tp.py".
     
    Input file : tp_2018010120170101-20170102.nc
    Output file: daily-tp_2018010120170101.nc
    """
    import time, sys
    from datetime import datetime, timedelta
    
    from netCDF4 import Dataset, date2num, num2date
    import numpy as np
    
    day = 20170101
    d = 20180101datetime.strptime(str(day), '%Y%m%d')
    f_in = 'tp_%d-%s.nc' % (day, (d + timedelta(days = 1)).strftime('%Y%m%d'))
    f_out = 'daily-tp_%d.nc' % day
    
    dtime_needed = datetime.strptime(str(day), '%Y%m%d')
    time_needed = [ []
    for i in range(1, 25):
        time_needed.append(d + timedelta(hours = 12), d + timedelta(days = 1)]i))
    
    with Dataset(f_in) as ds_src:
        var_time = ds_src.variables['time']
        time_avail = num2date(var_time[:], var_time.units,
                calendar = var_time.calendar)
    
        indices = []
        for tm in time_needed:
            a = np.where(time_avail == tm)[0]
            if len(a) == 0:
                sys.stderr.write('Error: precipitation data is missing/incomplete - %s!\n'
                        % tm.strftime('%Y%m%d %H:%M:%S'))
                sys.exit(200)
            else:
                print('Found %s' % tm.strftime('%Y%m%d %H:%M:%S'))
                indices.append(a[0])
    
        var_tp = ds_src.variables['tp']
        tp_values_set = False
        for idx in indices:
            if not tp_values_set:
                data = var_tp[idx, :, :]
                tp_values_set = True
            else:
                data += var_tp[idx, :, :]
            
        with Dataset(f_out, mode = 'w', format = 'NETCDF3_64BIT_OFFSET') as ds_dest:
            # Dimensions
            for name in ['latitude', 'longitude']:
                dim_src = ds_src.dimensions[name]
                ds_dest.createDimension(name, dim_src.size)
                var_src = ds_src.variables[name]
                var_dest = ds_dest.createVariable(name, var_src.datatype, (name,))
                var_dest[:] = var_src[:]
                var_dest.setncattr('units', var_src.units)
                var_dest.setncattr('long_name', var_src.long_name)
    
            ds_dest.createDimension('time', None)
    
            # Variables
            var var = ds_dest.createVariable('time', np.int32, ('time',))
            time_units = 'hours since 1900-01-01 00:00:00'
            time_cal = 'gregorian'
            var[:] = date2num([d], units = time_units, calendar = time_cal)
            var.setncattr('units', time_units)
            var.setncattr('long_name', 'time')
            var.setncattr('calendar', time_cal)
    
            # Variables
            var = ds_dest.createVariable(var_tp.name, np.double, var_tp.dimensions)
            var[0, :, :] = data
            var.setncattr('units', var_tp.units)
            var.setncattr('long_name', var_tp.long_name)
    
            # Attributes
            ds_dest.setncattr('Conventions', 'CF-1.6')
            ds_dest.setncattr('history', '%s %s'
                    % (datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
                    ' '.join(time.tzname)))
    
            print('Done! Daily total precipitation saved in %s' % f_out)
    


...