forked from tsutterley/read-ICESat-2
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMPI_reduce_ICESat2_ATL03_RGI.py
585 lines (545 loc) · 28 KB
/
MPI_reduce_ICESat2_ATL03_RGI.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
#!/usr/bin/env python
u"""
MPI_reduce_ICESat2_ATL03_RGI.py
Written by Tyler Sutterley (10/2019)
Create masks for reducing ICESat-2 data to the Randolph Glacier Inventory
https://www.glims.org/RGI/rgi60_dl.html
COMMAND LINE OPTIONS:
-D X, --directory=X: Working Data Directory
-R X, --region=X: region of Randolph Glacier Inventory to run
1: Alaska
2: Western Canada and USA
3: Arctic Canada North
4: Arctic Canada South
5: Greenland Periphery
6: Iceland
7: Svalbard
8: Scandinavia
9: Russian Arctic
10: North Asia
11: Central Europe
12: Caucasus, Middle East
13: Central Asia
14: South Asia West
15: South Asia East
16: Low Latitudes
17: Southern Andes
18: New Zealand
19: Antarctic, Subantarctic
-M X, --mode=X: Permission mode of directories and files created
-V, --verbose: Output information about each created file
REQUIRES MPI PROGRAM
MPI: standardized and portable message-passing system
https://www.open-mpi.org/
http://mpitutorial.com/
PYTHON DEPENDENCIES:
numpy: Scientific Computing Tools For Python
https://numpy.org
https://numpy.org/doc/stable/user/numpy-for-matlab-users.html
mpi4py: MPI for Python
http://pythonhosted.org/mpi4py/
http://mpi4py.readthedocs.org/en/stable/
h5py: Python interface for Hierarchal Data Format 5 (HDF5)
https://h5py.org
http://docs.h5py.org/en/stable/mpi.html
shapely: PostGIS-ish operations outside a database context for Python
http://toblerity.org/shapely/index.html
pyshp: Python read/write support for ESRI Shapefile format
https://github.com/GeospatialPython/pyshp
PROGRAM DEPENDENCIES:
base_directory.py: sets the user-specific working data directory as
specified by the $PYTHONDATA environmental variable set in .pythonrc
convert_julian.py: returns the calendar date and time given a Julian date
count_leap_seconds.py: determines number of leap seconds for a GPS time
UPDATE HISTORY:
Updated 10/2019: using delta_time as output HDF5 variable dimensions
changing Y/N flags to True/False
Updated 09/2019: using date functions paralleling public repository
Updated 05/2019: read shapefiles from RGI provided zip files
check if beam exists in a try except else clause
Updated 04/2019: check if subsetted beam contains land ice data
save RGIId for valid points to determine containing RGI polygons
Written 04/2019
"""
from __future__ import print_function
import sys
import os
import re
import io
import h5py
import getopt
import zipfile
import datetime
import shapefile
import numpy as np
from mpi4py import MPI
from shapely.geometry import MultiPoint, Polygon
from icesat2_toolkit.convert_julian import convert_julian
from icesat2_toolkit.count_leap_seconds import count_leap_seconds
#-- PURPOSE: help module to describe the optional input parameters
def usage():
print('\nHelp: {}'.format(os.path.basename(sys.argv[0])))
print(' -D X, --directory=X\tWorking Data Directory')
print(' -R X, --region=X\tRegion of Randolph Glacier Inventory to run')
print(' -M X, --mode=X\t\tPermission mode of directories and files created')
print(' -V, --verbose\t\tOutput information about each created file\n')
#-- PURPOSE: keep track of MPI threads
def info(rank, size):
print('Rank {0:d} of {1:d}'.format(rank+1,size))
print('module name: {0}'.format(__name__))
if hasattr(os, 'getppid'):
print('parent process: {0:d}'.format(os.getppid()))
print('process id: {0:d}'.format(os.getpid()))
#-- PURPOSE: load zip file containing Randolph Glacier Inventory shapefiles
def load_glacier_inventory(RGI_DIRECTORY,RGI_REGION):
#-- list of Randolph Glacier Inventory files
RGI_files = []
RGI_files.append('01_rgi60_Alaska')
RGI_files.append('02_rgi60_WesternCanadaUS')
RGI_files.append('03_rgi60_ArcticCanadaNorth')
RGI_files.append('04_rgi60_ArcticCanadaSouth')
RGI_files.append('05_rgi60_GreenlandPeriphery')
RGI_files.append('06_rgi60_Iceland')
RGI_files.append('07_rgi60_Svalbard')
RGI_files.append('08_rgi60_Scandinavia')
RGI_files.append('09_rgi60_RussianArctic')
RGI_files.append('10_rgi60_NorthAsia')
RGI_files.append('11_rgi60_CentralEurope')
RGI_files.append('12_rgi60_CaucasusMiddleEast')
RGI_files.append('13_rgi60_CentralAsia')
RGI_files.append('14_rgi60_SouthAsiaWest')
RGI_files.append('15_rgi60_SouthAsiaEast')
RGI_files.append('16_rgi60_LowLatitudes')
RGI_files.append('17_rgi60_SouthernAndes')
RGI_files.append('18_rgi60_NewZealand')
RGI_files.append('19_rgi60_AntarcticSubantarctic')
#-- read input zipfile containing RGI shapefiles
zs = zipfile.ZipFile(os.path.join(RGI_DIRECTORY,
'{0}.zip'.format(RGI_files[RGI_REGION-1])))
dbf,prj,shp,shx = [io.BytesIO(zs.read(s)) for s in sorted(zs.namelist())
if re.match('(.*?)\.(dbf|prj|shp|shx)$',s)]
#-- read the shapefile and extract entities
shape_input = shapefile.Reader(dbf=dbf, prj=prj, shp=shp, shx=shx,
encodingErrors='ignore')
shape_entities = shape_input.shapes()
shape_attributes = shape_input.records()
#-- extract the RGI entities
poly_dict = {}
for i,att in enumerate(shape_attributes):
#-- extract latitude and longitude coordinates for entity
points = np.array(shape_entities[i].points)
#-- entities can have multiple parts
parts = shape_entities[i].parts
parts.append(len(points))
#-- list object for coordinates (exterior and holes)
poly_list = []
#-- add each part to list
for p1,p2 in zip(parts[:-1],parts[1:]):
poly_list.append(list(zip(points[p1:p2,0],points[p1:p2,1])))
#-- convert poly_list into Polygon object with holes
poly_obj = Polygon(poly_list[0],poly_list[1:])
#-- Valid Polygon may not possess overlapping exterior or interior rings
if (not poly_obj.is_valid):
poly_obj = poly_obj.buffer(0)
#-- add to dictionary based on RGI identifier
poly_dict[att[0]] = poly_obj
#-- close the zipfile
zs.close()
#-- return the dictionary of polygon objects and the input file
return (poly_dict, RGI_files[RGI_REGION-1])
#-- PURPOSE: read ICESat-2 data from NSIDC or MPI_ICESat2_ATL03.py
#-- reduce to the Randolph Glacier Inventory
def main():
#-- start MPI communicator
comm = MPI.COMM_WORLD
#-- Read the system arguments listed after the program
long_options = ['help','directory=','region=','verbose','mode=']
optlist,arglist = getopt.getopt(sys.argv[1:],'hD:R:VM:',long_options)
#-- working data directory for location of RGI files
base_dir = os.getcwd()
#-- region of Randolph Glacier Inventory to run
RGI_REGION = 17
#-- verbosity settings
VERBOSE = False
#-- permissions mode of the local files (number in octal)
MODE = 0o775
for opt, arg in optlist:
if opt in ('-h','--help'):
usage() if (comm.rank==0) else None
sys.exit()
elif opt in ("-D","--directory"):
base_dir = os.path.expanduser(arg)
elif opt in ("-R","--region"):
RGI_REGION = np.int(arg)
elif opt in ("-V","--verbose"):
#-- output module information for process
info(comm.rank,comm.size)
VERBOSE = True
elif opt in ("-M","--mode"):
MODE = int(arg, 8)
#-- enter HDF5 file as system argument
if not arglist:
raise IOError('No input file entered as system arguments')
#-- tilde-expansion of listed input file
FILE = os.path.expanduser(arglist[0])
#-- read data from input file
print('{0} -->'.format(FILE)) if (VERBOSE and (comm.rank==0)) else None
#-- Open the HDF5 file for reading
fileID = h5py.File(FILE, 'r', driver='mpio', comm=comm)
DIRECTORY = os.path.dirname(FILE)
#-- extract parameters from ICESat-2 ATLAS HDF5 file name
rx = re.compile('(ATL\d{2})_(\d{4})(\d{2})(\d{2})(\d{2})(\d{2})(\d{2})_'
'(\d{4})(\d{2})(\d{2})_(\d{3})_(\d{2})(.*?).h5$',re.VERBOSE)
PRD,YY,MM,DD,HH,MN,SS,TRK,CYCL,GRAN,RL,VERS,AUX = rx.findall(FILE).pop()
#-- read data on rank 0
if (comm.rank == 0):
#-- read RGI for region and create shapely polygon objects
poly_dict,RGI_file = load_glacier_inventory(base_dir,RGI_REGION)
else:
#-- create empty object for list of shapely objects
poly_dict = None
RGI_file = None
#-- Broadcast Shapely polygon objects
poly_dict = comm.bcast(poly_dict, root=0)
RGI_file = comm.bcast(RGI_file, root=0)
#-- RGI version and name
RGI_VERSION,RGI_NAME = re.findall('\d_rgi(\d+)_(.*?)$',RGI_file).pop()
#-- read each input beam within the file
IS2_atl03_beams = []
for gtx in [k for k in fileID.keys() if bool(re.match(r'gt\d[lr]',k))]:
#-- check if subsetted beam contains data
try:
fileID[gtx]['geolocation']['segment_id']
except KeyError:
pass
else:
IS2_atl03_beams.append(gtx)
#-- number of GPS seconds between the GPS epoch
#-- and ATLAS Standard Data Product (SDP) epoch
atlas_sdp_gps_epoch = fileID['ancillary_data']['atlas_sdp_gps_epoch'][:]
#-- copy variables for outputting to HDF5 file
IS2_atl03_mask = {}
IS2_atl03_fill = {}
IS2_atl03_mask_attrs = {}
#-- number of GPS seconds between the GPS epoch (1980-01-06T00:00:00Z UTC)
#-- and ATLAS Standard Data Product (SDP) epoch (2018-01-01T00:00:00Z UTC)
#-- Add this value to delta time parameters to compute full gps_seconds
IS2_atl03_mask['ancillary_data'] = {}
IS2_atl03_mask_attrs['ancillary_data'] = {}
for key in ['atlas_sdp_gps_epoch']:
#-- get each HDF5 variable
IS2_atl03_mask['ancillary_data'][key] = fileID['ancillary_data'][key][:]
#-- Getting attributes of group and included variables
IS2_atl03_mask_attrs['ancillary_data'][key] = {}
for att_name,att_val in fileID['ancillary_data'][key].attrs.items():
IS2_atl03_mask_attrs['ancillary_data'][key][att_name] = att_val
#-- for each input beam within the file
for gtx in sorted(IS2_atl03_beams):
#-- output data dictionaries for beam
IS2_atl03_mask[gtx] = dict(heights={},subsetting={})
IS2_atl03_fill[gtx] = dict(heights={},subsetting={})
IS2_atl03_mask_attrs[gtx] = dict(heights={},subsetting={})
#-- number of photon events
n_pe, = fileID[gtx]['heights']['h_ph'].shape
#-- define indices to run for specific process
ind = np.arange(comm.Get_rank(), n_pe, comm.Get_size(), dtype=np.int)
#-- extract delta time
delta_time = fileID[gtx]['heights']['delta_time'][:]
#-- extract lat/lon
longitude = fileID[gtx]['heights']['lon_ph'][:]
latitude = fileID[gtx]['heights']['lat_ph'][:]
#-- convert reduced lat/lon to shapely multipoint object
xy_point = MultiPoint(list(zip(longitude[ind],latitude[ind])))
#-- create distributed intersection map for calculation
distributed_map = np.zeros((n_pe),dtype=np.bool)
distributed_RGIId = np.zeros((n_pe),dtype='|S14')
#-- create empty intersection map array for receiving
associated_map = np.zeros((n_pe),dtype=np.bool)
associated_RGIId = np.zeros((n_pe),dtype='|S14')
for key,poly_obj in poly_dict.items():
#-- finds if points are encapsulated (within RGI polygon)
int_test = poly_obj.intersects(xy_point)
if int_test:
#-- extract intersected points
int_map = list(map(poly_obj.intersects,xy_point))
int_indices, = np.nonzero(int_map)
#-- set distributed_map indices to True for intersected points
distributed_map[ind[int_indices]] = True
distributed_RGIId[ind[int_indices]] = key
#-- communicate output MPI matrices between ranks
#-- operation is a logical "or" across the elements.
comm.Allreduce(sendbuf=[distributed_map, MPI.BOOL], \
recvbuf=[associated_map, MPI.BOOL], op=MPI.LOR)
#-- operation is a element summation.
comm.Allreduce(sendbuf=[distributed_RGIId, MPI.CHAR], \
recvbuf=[associated_RGIId, MPI.CHAR], op=MPI.SUM)
distributed_map = None
distributed_RGIId = None
#-- wait for all processes to finish calculation
comm.Barrier()
#-- group attributes for beam
IS2_atl03_mask_attrs[gtx]['Description'] = fileID[gtx].attrs['Description']
IS2_atl03_mask_attrs[gtx]['atlas_pce'] = fileID[gtx].attrs['atlas_pce']
IS2_atl03_mask_attrs[gtx]['atlas_beam_type'] = fileID[gtx].attrs['atlas_beam_type']
IS2_atl03_mask_attrs[gtx]['groundtrack_id'] = fileID[gtx].attrs['groundtrack_id']
IS2_atl03_mask_attrs[gtx]['atmosphere_profile'] = fileID[gtx].attrs['atmosphere_profile']
IS2_atl03_mask_attrs[gtx]['atlas_spot_number'] = fileID[gtx].attrs['atlas_spot_number']
IS2_atl03_mask_attrs[gtx]['sc_orientation'] = fileID[gtx].attrs['sc_orientation']
#-- group attributes for heights
IS2_atl03_mask_attrs[gtx]['heights']['Description'] = ("Contains arrays of the "
"parameters for each received photon.")
IS2_atl03_mask_attrs[gtx]['heights']['data_rate'] = ("Data are stored at the "
"photon detection rate.")
#-- geolocation, time and segment ID
#-- delta time
IS2_atl03_mask[gtx]['heights']['delta_time'] = delta_time
IS2_atl03_fill[gtx]['heights']['delta_time'] = None
IS2_atl03_mask_attrs[gtx]['heights']['delta_time'] = {}
IS2_atl03_mask_attrs[gtx]['heights']['delta_time']['units'] = "seconds since 2018-01-01"
IS2_atl03_mask_attrs[gtx]['heights']['delta_time']['long_name'] = "Elapsed GPS seconds"
IS2_atl03_mask_attrs[gtx]['heights']['delta_time']['standard_name'] = "time"
IS2_atl03_mask_attrs[gtx]['heights']['delta_time']['calendar'] = "standard"
IS2_atl03_mask_attrs[gtx]['heights']['delta_time']['description'] = ("Number of GPS "
"seconds since the ATLAS SDP epoch. The ATLAS Standard Data Products (SDP) epoch offset "
"is defined within /ancillary_data/atlas_sdp_gps_epoch as the number of GPS seconds "
"between the GPS epoch (1980-01-06T00:00:00.000000Z UTC) and the ATLAS SDP epoch. By "
"adding the offset contained within atlas_sdp_gps_epoch to delta time parameters, the "
"time in gps_seconds relative to the GPS epoch can be computed.")
IS2_atl03_mask_attrs[gtx]['heights']['delta_time']['coordinates'] = \
"lat_ph lon_ph"
#-- latitude
IS2_atl03_mask[gtx]['heights']['latitude'] = latitude
IS2_atl03_fill[gtx]['heights']['latitude'] = None
IS2_atl03_mask_attrs[gtx]['heights']['latitude'] = {}
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['units'] = "degrees_north"
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['contentType'] = "physicalMeasurement"
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['long_name'] = "Latitude"
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['standard_name'] = "latitude"
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['description'] = ("Latitude of each "
"received photon. Computed from the ECF Cartesian coordinates of the bounce point.")
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['valid_min'] = -90.0
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['valid_max'] = 90.0
IS2_atl03_mask_attrs[gtx]['heights']['latitude']['coordinates'] = \
"delta_time lon_ph"
#-- longitude
IS2_atl03_mask[gtx]['heights']['longitude'] = longitude
IS2_atl03_fill[gtx]['heights']['longitude'] = None
IS2_atl03_mask_attrs[gtx]['heights']['longitude'] = {}
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['units'] = "degrees_east"
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['contentType'] = "physicalMeasurement"
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['long_name'] = "Longitude"
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['standard_name'] = "longitude"
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['description'] = ("Longitude of each "
"received photon. Computed from the ECF Cartesian coordinates of the bounce point.")
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['valid_min'] = -180.0
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['valid_max'] = 180.0
IS2_atl03_mask_attrs[gtx]['heights']['longitude']['coordinates'] = \
"delta_time lat_ph"
#-- subsetting variables
IS2_atl03_mask_attrs[gtx]['subsetting']['Description'] = ("The subsetting group "
"contains parameters used to reduce photon events to specific regions of interest.")
IS2_atl03_mask_attrs[gtx]['subsetting']['data_rate'] = ("Data are stored at the photon "
"detection rate.")
#-- output mask to HDF5
key = RGI_NAME.replace('_',' ')
IS2_atl03_mask[gtx]['subsetting'][RGI_NAME] = associated_map
IS2_atl03_mask_attrs[gtx]['subsetting'][RGI_NAME] = {}
IS2_atl03_mask_attrs[gtx]['subsetting'][RGI_NAME]['contentType'] = "referenceInformation"
IS2_atl03_mask_attrs[gtx]['subsetting'][RGI_NAME]['long_name'] = '{0} Mask'.format(key)
IS2_atl03_mask_attrs[gtx]['subsetting'][RGI_NAME]['description'] = ('Mask calculated '
'using the {0} region from the Randolph Glacier Inventory.').format(key)
IS2_atl03_mask_attrs[gtx]['subsetting'][RGI_NAME]['source'] = \
'RGIv{0}'.format(RGI_VERSION)
IS2_atl03_mask_attrs[gtx]['subsetting'][RGI_NAME]['reference'] = \
'https://www.glims.org/RGI/'
IS2_atl03_mask_attrs[gtx]['subsetting'][RGI_NAME]['coordinates'] = \
"../heights/delta_time ../heights/lat_ph ../heights/lon_ph"
#-- output RGI identifier
IS2_atl03_mask[gtx]['subsetting']['RGIId'] = associated_RGIId
IS2_atl03_mask_attrs[gtx]['subsetting']['RGIId'] = {}
IS2_atl03_mask_attrs[gtx]['subsetting']['RGIId']['contentType'] = "referenceInformation"
IS2_atl03_mask_attrs[gtx]['subsetting']['RGIId']['long_name'] = "RGI Identifier"
IS2_atl03_mask_attrs[gtx]['subsetting']['RGIId']['description'] = ('Identification '
'code within version {0} of the Randolph Glacier Inventory (RGI).').format(RGI_VERSION)
IS2_atl03_mask_attrs[gtx]['subsetting']['RGIId']['source'] = \
'RGIv{0}'.format(RGI_VERSION)
IS2_atl03_mask_attrs[gtx]['subsetting']['RGIId']['reference'] = \
'https://www.glims.org/RGI/'
IS2_atl03_mask_attrs[gtx]['subsetting']['RGIId']['coordinates'] = \
"../heights/delta_time ../heights/lat_ph ../heights/lon_ph"
#-- wait for all processes to finish calculation
comm.Barrier()
#-- parallel h5py I/O does not support compression filters at this time
if (comm.rank == 0) and associated_map.any():
#-- output HDF5 file with RGI masks
args = (PRD,RGI_VERSION,RGI_NAME,YY,MM,DD,HH,MN,SS,TRK,CYCL,GRAN,RL,VERS,AUX)
file_format='{0}_RGI{1}_{2}_{3}{4}{5}{6}{7}{8}_{9}{10}{11}_{12}_{13}{14}.h5'
#-- print file information
print('\t{0}'.format(file_format.format(*args))) if VERBOSE else None
HDF5_atl03_mask_write(IS2_atl03_mask, IS2_atl03_mask_attrs, CLOBBER=True,
INPUT=os.path.basename(FILE), FILL_VALUE=IS2_atl03_fill,
FILENAME=os.path.join(DIRECTORY,file_format.format(*args)))
#-- change the permissions mode
os.chmod(os.path.join(DIRECTORY,file_format.format(*args)), MODE)
#-- close the input file
fileID.close()
#-- PURPOSE: outputting the interpolated DEM data for ICESat-2 data to HDF5
def HDF5_ATL03_mask_write(IS2_atl03_mask, IS2_atl03_attrs, INPUT=None,
FILENAME='', FILL_VALUE=None, CLOBBER=True):
#-- setting HDF5 clobber attribute
if CLOBBER:
clobber = 'w'
else:
clobber = 'w-'
#-- open output HDF5 file
fileID = h5py.File(os.path.expanduser(FILENAME), clobber)
#-- create HDF5 records
h5 = {}
#-- number of GPS seconds between the GPS epoch (1980-01-06T00:00:00Z UTC)
#-- and ATLAS Standard Data Product (SDP) epoch (2018-01-01T00:00:00Z UTC)
h5['ancillary_data'] = {}
for k,v in IS2_atl03_mask['ancillary_data'].items():
#-- Defining the HDF5 dataset variables
val = 'ancillary_data/{0}'.format(k)
h5['ancillary_data'][k] = fileID.create_dataset(val, np.shape(v), data=v,
dtype=v.dtype, compression='gzip')
#-- add HDF5 variable attributes
for att_name,att_val in IS2_atl03_attrs['ancillary_data'][k].items():
h5['ancillary_data'][k].attrs[att_name] = att_val
#-- write each output beam
beams = [k for k in IS2_atl03_mask.keys() if bool(re.match(r'gt\d[lr]',k))]
for gtx in beams:
fileID.create_group(gtx)
#-- add HDF5 group attributes for beam
for att_name in ['Description','atlas_pce','atlas_beam_type',
'groundtrack_id','atmosphere_profile','atlas_spot_number',
'sc_orientation']:
fileID[gtx].attrs[att_name] = IS2_atl03_attrs[gtx][att_name]
#-- create heights group
fileID[gtx].create_group('heights')
h5[gtx] = dict(heights={})
for att_name in ['Description','data_rate']:
att_val = IS2_atl03_attrs[gtx]['heights'][att_name]
fileID[gtx]['heights'].attrs[att_name] = att_val
#-- delta_time
v = IS2_atl03_mask[gtx]['heights']['delta_time']
attrs = IS2_atl03_attrs[gtx]['heights']['delta_time']
#-- Defining the HDF5 dataset variables
val = '{0}/{1}/{2}'.format(gtx,'heights','delta_time')
h5[gtx]['heights']['delta_time'] = fileID.create_dataset(val,
np.shape(v), data=v, dtype=v.dtype, compression='gzip')
#-- add HDF5 variable attributes
for att_name,att_val in attrs.items():
h5[gtx]['heights']['delta_time'].attrs[att_name] = att_val
#-- geolocation variables
for k in ['latitude','longitude']:
#-- values and attributes
v = IS2_atl03_mask[gtx]['heights'][k]
attrs = IS2_atl03_attrs[gtx]['heights'][k]
fillvalue = FILL_VALUE[gtx]['heights'][k]
#-- Defining the HDF5 dataset variables
val = '{0}/{1}/{2}'.format(gtx,'heights',k)
if fillvalue:
h5[gtx]['heights'][k] = fileID.create_dataset(val, np.shape(v),
data=v,dtype=v.dtype,fillvalue=fillvalue,compression='gzip')
else:
h5[gtx]['heights'][k] = fileID.create_dataset(val, np.shape(v),
data=v, dtype=v.dtype, compression='gzip')
#-- attach dimensions
for dim in ['delta_time']:
h5[gtx]['heights'][k].dims.create_scale(
h5[gtx]['heights'][dim], dim)
h5[gtx]['heights'][k].dims[0].attach_scale(
h5[gtx]['heights'][dim])
#-- add HDF5 variable attributes
for att_name,att_val in attrs.items():
h5[gtx]['heights'][k].attrs[att_name] = att_val
#-- create subsetting group
fileID[gtx].create_group('subsetting')
h5[gtx]['subsetting'] = {}
for att_name in ['Description','data_rate']:
att_val = IS2_atl03_attrs[gtx]['subsetting'][att_name]
fileID[gtx]['subsetting'].attrs[att_name] = att_val
#-- add to subsetting variables
for k,v in IS2_atl03_mask[gtx]['subsetting'].items():
#-- attributes
attrs = IS2_atl03_attrs[gtx]['subsetting'][k]
#-- Defining the HDF5 dataset variables
val = '{0}/{1}/{2}'.format(gtx,'subsetting',k)
h5[gtx]['subsetting'][k] = fileID.create_dataset(val, np.shape(v),
data=v, dtype=v.dtype, compression='gzip')
#-- attach dimensions
for dim in ['delta_time']:
h5[gtx]['subsetting'][k].dims.create_scale(
h5[gtx]['heights'][dim], dim)
h5[gtx]['subsetting'][k].dims[0].attach_scale(
h5[gtx]['heights'][dim])
#-- add HDF5 variable attributes
for att_name,att_val in attrs.items():
h5[gtx]['subsetting'][k].attrs[att_name] = att_val
#-- HDF5 file title
fileID.attrs['featureType'] = 'trajectory'
fileID.attrs['title'] = 'ATLAS/ICESat-2 L2A Global Geolocated Photon Data'
fileID.attrs['summary'] = ("The purpose of ATL03 is to provide along-track "
"photon data for all 6 ATLAS beams and associated statistics.")
fileID.attrs['description'] = ("Photon heights determined by ATBD "
"Algorithm using POD and PPD. All photon events per transmit pulse per "
"beam. Includes POD and PPD vectors. Classification of each photon by "
"several ATBD Algorithms.")
date_created = datetime.datetime.today()
fileID.attrs['date_created'] = date_created.isoformat()
project = 'ICESat-2 > Ice, Cloud, and land Elevation Satellite-2'
fileID.attrs['project'] = project
platform = 'ICESat-2 > Ice, Cloud, and land Elevation Satellite-2'
fileID.attrs['project'] = platform
#-- add attribute for elevation instrument and designated processing level
instrument = 'ATLAS > Advanced Topographic Laser Altimeter System'
fileID.attrs['instrument'] = instrument
fileID.attrs['source'] = 'Spacecraft'
fileID.attrs['references'] = 'http://nsidc.org/data/icesat2/data.html'
fileID.attrs['processing_level'] = '4'
#-- add attributes for input ATL03 and ATL09 files
fileID.attrs['input_files'] = ','.join([os.path.basename(i) for i in INPUT])
#-- find geospatial and temporal ranges
lnmn,lnmx,ltmn,ltmx,tmn,tmx = (np.inf,-np.inf,np.inf,-np.inf,np.inf,-np.inf)
for gtx in beams:
lon = IS2_atl03_mask[gtx]['heights']['longitude']
lat = IS2_atl03_mask[gtx]['heights']['latitude']
delta_time = IS2_atl03_mask[gtx]['heights']['delta_time']
#-- setting the geospatial and temporal ranges
lnmn = lon.min() if (lon.min() < lnmn) else lnmn
lnmx = lon.max() if (lon.max() > lnmx) else lnmx
ltmn = lat.min() if (lat.min() < ltmn) else ltmn
ltmx = lat.max() if (lat.max() > ltmx) else ltmx
tmn = delta_time.min() if (delta_time.min() < tmn) else tmn
tmx = delta_time.max() if (delta_time.max() > tmx) else tmx
#-- add geospatial and temporal attributes
fileID.attrs['geospatial_lat_min'] = ltmn
fileID.attrs['geospatial_lat_max'] = ltmx
fileID.attrs['geospatial_lon_min'] = lnmn
fileID.attrs['geospatial_lon_max'] = lnmx
fileID.attrs['geospatial_lat_units'] = "degrees_north"
fileID.attrs['geospatial_lon_units'] = "degrees_east"
fileID.attrs['geospatial_ellipsoid'] = "WGS84"
fileID.attrs['date_type'] = 'UTC'
fileID.attrs['time_type'] = 'CCSDS UTC-A'
#-- convert start and end time from ATLAS SDP seconds into Julian days
atlas_sdp_gps_epoch=IS2_atl03_mask['ancillary_data']['atlas_sdp_gps_epoch']
gps_seconds = atlas_sdp_gps_epoch + np.array([tmn,tmx])
time_leaps = count_leap_seconds(gps_seconds)
time_julian = 2444244.5 + (gps_seconds - time_leaps)/86400.0
#-- convert to calendar date with convert_julian.py
YY,MM,DD,HH,MN,SS = convert_julian(time_julian,FORMAT='tuple')
#-- add attributes with measurement date start, end and duration
tcs = datetime.datetime(np.int(YY[0]), np.int(MM[0]), np.int(DD[0]),
np.int(HH[0]), np.int(MN[0]), np.int(SS[0]), np.int(1e6*(SS[0] % 1)))
fileID.attrs['time_coverage_start'] = tcs.isoformat()
tce = datetime.datetime(np.int(YY[1]), np.int(MM[1]), np.int(DD[1]),
np.int(HH[1]), np.int(MN[1]), np.int(SS[1]), np.int(1e6*(SS[1] % 1)))
fileID.attrs['time_coverage_end'] = tce.isoformat()
fileID.attrs['time_coverage_duration'] = '{0:0.0f}'.format(tmx-tmn)
#-- Closing the HDF5 file
fileID.close()
#-- run main program
if __name__ == '__main__':
main()