Source code for S1_NRB.metadata.stac

import os
import re
import shutil
from statistics import mean, median
from copy import deepcopy
from datetime import datetime
import pystac
from pystac.extensions.sar import SarExtension, FrequencyBand, Polarization, ObservationDirection
from pystac.extensions.sat import SatExtension, OrbitState
from pystac.extensions.projection import ProjectionExtension
from pystac.extensions.view import ViewExtension
from spatialist import Raster
from spatialist.ancillary import finder
from S1_NRB.metadata.mapping import SAMPLE_MAP
from S1_NRB.metadata.extract import get_header_size


def product_json(meta, target, tifs, exist_ok=False):
    """
    Function to generate product-level metadata for an NRB product in STAC compliant JSON format.

    The STAC Item is written to ``<target>/<basename(target)>.json``.

    Parameters
    ----------
    meta: dict
        Metadata dictionary generated with :func:`~S1_NRB.metadata.extract.meta_dict`.
    target: str
        A path pointing to the root directory of a product scene.
    tifs: list[str]
        List of paths to all GeoTIFF files of the currently processed NRB product.
    exist_ok: bool, optional
        Do not create files if they already exist?

    Raises
    ------
    RuntimeError
        If the data mask annotation file (``-dm.tif``) contains an unexpected number of bands.
    """
    prod = meta['prod']
    common = meta['common']

    scene_id = os.path.basename(target)
    outname = os.path.join(target, '{}.json'.format(scene_id))
    if os.path.isfile(outname) and exist_ok:
        return
    print(outname)

    start = prod['timeStart']
    stop = prod['timeStop']
    date = start + (stop - start) / 2

    item = pystac.Item(id=scene_id,
                       geometry=prod['geom_stac_geometry_4326'],
                       bbox=prod['geom_stac_bbox_4326'],
                       datetime=date,
                       properties={})

    item.common_metadata.license = prod['licence']
    item.common_metadata.start_datetime = start
    item.common_metadata.end_datetime = stop
    item.common_metadata.created = prod['timeCreated']
    item.common_metadata.instruments = [common['instrumentShortName'].lower()]
    item.common_metadata.constellation = common['constellation']
    item.common_metadata.platform = common['platformFullname']
    item.common_metadata.gsd = float(prod['pxSpacingColumn'])

    SarExtension.add_to(item)
    SatExtension.add_to(item)
    ProjectionExtension.add_to(item)
    sar_ext = SarExtension.ext(item)
    sat_ext = SatExtension.ext(item)
    proj_ext = ProjectionExtension.ext(item)
    # Extensions that are only referenced by their schema URL.
    item.stac_extensions.append('https://stac-extensions.github.io/processing/v1.1.0/schema.json')
    item.stac_extensions.append('https://stac-extensions.github.io/card4l/v0.1.0/sar/product.json')
    item.stac_extensions.append('https://stac-extensions.github.io/raster/v1.1.0/schema.json')
    item.stac_extensions.append('https://stac-extensions.github.io/file/v2.1.0/schema.json')
    item.stac_extensions.append('https://stac-extensions.github.io/mgrs/v1.0.0/schema.json')

    sar_ext.apply(instrument_mode=common['operationalMode'],
                  frequency_band=FrequencyBand[common['radarBand'].upper()],
                  polarizations=[Polarization[pol] for pol in common['polarisationChannels']],
                  product_type=prod['productName-short'],
                  looks_range=int(prod['rangeNumberOfLooks']),
                  looks_azimuth=int(prod['azimuthNumberOfLooks']))

    sat_ext.apply(orbit_state=OrbitState[common['orbitDirection'].upper()],
                  relative_orbit=common['orbitNumbers_rel']['stop'],
                  absolute_orbit=common['orbitNumbers_abs']['stop'])

    item.properties['processing:facility'] = prod['processingCenter']
    item.properties['processing:software'] = {prod['processorName']: prod['processorVersion']}
    item.properties['processing:level'] = common['processingLevel']

    item.properties['card4l:specification'] = prod['productName-short']
    item.properties['card4l:specification_version'] = prod['card4l-version']
    item.properties['card4l:beam_id'] = common['swathIdentifier']
    item.properties['card4l:measurement_type'] = prod['backscatterMeasurement']
    item.properties['card4l:measurement_convention'] = prod['backscatterConvention']
    item.properties['card4l:pixel_coordinate_convention'] = prod['pixelCoordinateConvention']
    item.properties['card4l:speckle_filtering'] = prod['speckleFilterApplied']
    item.properties['card4l:noise_removal_applied'] = prod['NRApplied']
    item.properties['card4l:conversion_eq'] = prod['backscatterConversionEq']
    item.properties['card4l:relative_radiometric_accuracy'] = prod['radiometricAccuracyRelative']
    item.properties['card4l:absolute_radiometric_accuracy'] = prod['radiometricAccuracyAbsolute']
    item.properties['card4l:resampling_method'] = prod['geoCorrResamplingMethod']
    item.properties['card4l:dem_resampling_method'] = prod['demResamplingMethod']
    item.properties['card4l:egm_resampling_method'] = prod['demEGMResamplingMethod']
    item.properties['card4l:geometric_accuracy_type'] = prod['geoCorrAccuracyType']
    for direction in ['Northern', 'Eastern']:
        raw_stddev = prod['geoCorrAccuracy{}STDev'.format(direction)]
        raw_bias = prod['geoCorrAccuracy{}Bias'.format(direction)]
        stddev = float(raw_stddev) if raw_stddev is not None else None
        bias = float(raw_bias) if raw_bias is not None else None
        item.properties['card4l:{}_geometric_accuracy'.format(direction.lower())] = {'bias': bias,
                                                                                     'stddev': stddev}
    item.properties['card4l:geometric_accuracy_radial_rmse'] = prod['geoCorrAccuracy_rRMSE']

    # NOTE(review): the STAC projection extension defines proj:shape as [height, width];
    # confirm that [numPixelsPerLine, numLines] is the intended order here.
    proj_ext.apply(epsg=int(prod['crsEPSG']),
                   wkt2=prod['crsWKT'],
                   bbox=prod['geom_stac_bbox_native'],
                   shape=[int(prod['numPixelsPerLine']), int(prod['numLines'])],
                   transform=prod['transform'])

    mgrs = prod['mgrsID']
    item.properties['mgrs:utm_zone'] = int(mgrs[:2])
    item.properties['mgrs:latitude_band'] = mgrs[2:3]
    item.properties['mgrs:grid_square'] = mgrs[3:]

    card4l_title = 'CARD4L Product Family Specification: Normalised Radar Backscatter (v{})' \
        .format(prod['card4l-version'])
    item.add_link(link=pystac.Link(rel='card4l-document',
                                   target=prod['card4l-link'].replace('.pdf', '.docx'),
                                   media_type='application/vnd.openxmlformats-officedocument'
                                              '.wordprocessingml.document',
                                   title=card4l_title))
    item.add_link(link=pystac.Link(rel='card4l-document',
                                   target=prod['card4l-link'],
                                   media_type='application/pdf',
                                   title=card4l_title))
    for src in meta['source']:
        src_name = os.path.basename(meta['source'][src]['filename']).split('.')[0]
        src_target = os.path.join('./source', '{}.json'.format(src_name)).replace('\\', '/')
        item.add_link(link=pystac.Link(rel='derived_from',
                                       target=src_target,
                                       media_type='application/json',
                                       title='Source metadata formatted in STAC compliant JSON format.'))
    item.add_link(link=pystac.Link(rel='about',
                                   target=prod['doi'],
                                   title='Product definition reference.'))
    item.add_link(link=pystac.Link(rel='access',
                                   target=prod['access'],
                                   title='Product data access.'))
    item.add_link(link=pystac.Link(rel='related',
                                   target=prod['ancillaryData_KML'],
                                   title='Sentinel-2 Military Grid Reference System (MGRS) tiling grid file '
                                         'used as auxiliary data during processing.'))
    if prod['NRApplied']:
        item.add_link(link=pystac.Link(rel='noise-removal',
                                       target=prod['NRAlgorithm'],
                                       title='Reference to the noise removal algorithm details.'))
    item.add_link(link=pystac.Link(rel='radiometric-terrain-correction',
                                   target=prod['RTCAlgorithm'],
                                   title='Reference to the Radiometric Terrain Correction algorithm details.'))
    item.add_link(link=pystac.Link(rel='radiometric-accuracy',
                                   target=prod['radiometricAccuracyReference'],
                                   title='Reference describing the radiometric uncertainty of the product.'))
    item.add_link(link=pystac.Link(rel='geometric-correction',
                                   target=prod['geoCorrAlgorithm'],
                                   title='Reference to the Geometric Correction algorithm details.'))
    item.add_link(link=pystac.Link(rel='{}-model'.format(prod['demType']),
                                   target=prod['demReference'],
                                   title='Digital Elevation Model used as auxiliary data during processing: '
                                         '{}'.format(prod['demName'])))
    item.add_link(link=pystac.Link(rel='earth-gravitational-model',
                                   target=prod['demEGMReference'],
                                   title='Reference to the Earth Gravitational Model (EGM) used for Geometric '
                                         'Correction.'))
    item.add_link(link=pystac.Link(rel='geometric-accuracy',
                                   target=prod['geoCorrAccuracyReference'],
                                   title='Reference documenting the estimate of absolute localization error.'))
    item.add_link(link=pystac.Link(rel='gridding-convention',
                                   target=prod['griddingConventionURL'],
                                   title='Reference describing the gridding convention used.'))

    xml_relpath = './' + os.path.relpath(outname.replace('.json', '.xml'), target).replace('\\', '/')
    item.add_asset(key='card4l',
                   asset=pystac.Asset(href=xml_relpath,
                                      title='Metadata in XML format.',
                                      media_type=pystac.MediaType.XML,
                                      roles=['metadata', 'card4l']))

    float_data_type = '{}{}'.format(prod['fileDataType'], prod['fileBitsPerSample'])
    for tif in tifs:
        relpath = './' + os.path.relpath(tif, target).replace('\\', '/')
        # Patterns are matched against the file name only and the asset type is derived from the
        # path relative to the product directory, so that names of parent directories
        # (e.g. one containing 'vh' or 'measurement') cannot cause false matches.
        fname = os.path.basename(tif)
        size = os.path.getsize(tif)
        header_size = get_header_size(tif=tif)

        if 'measurement' in relpath:
            pol = re.search('[vh]{2}', fname).group().lower()
            created = datetime.fromtimestamp(os.path.getctime(tif)).isoformat()
            extra_fields = {'created': created,
                            'raster:bands': [{'unit': 'natural',
                                              'nodata': 'NaN',
                                              'data_type': float_data_type,
                                              'bits_per_sample': int(prod['fileBitsPerSample'])}],
                            'file:byte_order': prod['fileByteOrder'],
                            'file:size': size,
                            'file:header_size': header_size,
                            'card4l:border_pixels': prod['numBorderPixels']}
            item.add_asset(key=pol,
                           asset=pystac.Asset(href=relpath,
                                              title='{} backscatter data'.format(pol.upper()),
                                              media_type=pystac.MediaType[prod['fileFormat']],
                                              roles=['backscatter', 'data'],
                                              extra_fields=extra_fields))
        elif 'annotation' in relpath:
            key = re.search('-[a-z]{2}(?:-[a-z]{2}|).tif', fname).group()
            np_pat = '-np-[vh]{2}.tif'
            if re.search(np_pat, key) is not None:
                # Noise power layers exist per polarisation but share one SAMPLE_MAP entry,
                # which is stored under the pattern string itself.
                pol = re.search('[vh]{2}', key).group()
                key = np_pat
                asset_key = 'noise-power-{}'.format(pol)
            else:
                asset_key = SAMPLE_MAP[key]['role']
            sample = SAMPLE_MAP[key]

            # Resolve the unit locally instead of writing the fallback back into the shared
            # module-level SAMPLE_MAP.
            unit = sample['unit'] if sample['unit'] is not None else 'unitless'

            if key in ['-dm.tif', '-id.tif']:
                ras_bands_base = {'unit': unit,
                                  'nodata': 255,
                                  'data_type': 'uint8',
                                  'bits_per_sample': 8}
                raster_bands = []
                if key == '-dm.tif':
                    with Raster(tif) as dm_ras:
                        band_descr = [dm_ras.raster.GetRasterBand(band).GetDescription()
                                      for band in range(1, dm_ras.bands + 1)]
                    if 1 < len(band_descr) < len(sample['values']):
                        # One raster band entry per mask category that is present in the file.
                        summaries = [val for val in sample['values'].values() if val in band_descr]
                        for summary in summaries:
                            band_dict = deepcopy(ras_bands_base)
                            band_dict.update({'values': [{'value': 1, 'summary': summary}]})
                            raster_bands.append(band_dict)
                    else:
                        raise RuntimeError('{} contains an unexpected number of bands!'.format(tif))
                else:  # key == '-id.tif'
                    src_names = [os.path.basename(meta['source'][src]['filename'])
                                 .replace('.SAFE', '').replace('.zip', '')
                                 for src in meta['source']]
                    band_dict = deepcopy(ras_bands_base)
                    band_dict.update({'values': [{'value': [i + 1], 'summary': s}
                                                 for i, s in enumerate(src_names)]})
                    raster_bands = [band_dict]

                extra_fields = {'raster:bands': raster_bands,
                                'file:byte_order': prod['fileByteOrder'],
                                'file:size': size,
                                'file:header_size': header_size}
            else:
                raster_band = {'unit': unit,
                               'nodata': 'NaN',
                               'data_type': float_data_type,
                               'bits_per_sample': int(prod['fileBitsPerSample'])}
                extra_fields = {'raster:bands': [raster_band],
                                'file:byte_order': prod['fileByteOrder'],
                                'file:size': size,
                                'file:header_size': header_size}
                if key == '-ei.tif':
                    extra_fields['card4l:ellipsoidal_height'] = prod['ellipsoidalHeight']

            item.add_asset(key=asset_key,
                           asset=pystac.Asset(href=relpath,
                                              title=sample['title'],
                                              media_type=pystac.MediaType[prod['fileFormat']],
                                              roles=[sample['role'], 'metadata'],
                                              extra_fields=extra_fields))

    item.save_object(dest_href=outname)
def source_json(meta, target, exist_ok=False):
    """
    Function to generate source-level metadata for an NRB product in STAC compliant JSON format.

    One STAC Item is written per source scene to ``<target>/source/<scene>.json``.

    Parameters
    ----------
    meta: dict
        Metadata dictionary generated with :func:`~S1_NRB.metadata.extract.meta_dict`.
    target: str
        A path pointing to the root directory of a product scene.
    exist_ok: bool, optional
        Do not create files if they already exist?
    """
    timestamp_format = '%Y-%m-%dT%H:%M:%S.%f'
    common = meta['common']
    prod = meta['prod']

    metadir = os.path.join(target, 'source')
    os.makedirs(metadir, exist_ok=True)

    for uid, src in meta['source'].items():
        scene = os.path.basename(src['filename']).split('.')[0]
        outname = os.path.join(metadir, '{}.json'.format(scene))
        if exist_ok and os.path.isfile(outname):
            continue
        print(outname)

        start, stop = src['timeStart'], src['timeStop']
        item = pystac.Item(id=scene,
                           geometry=src['geom_stac_geometry_4326'],
                           bbox=src['geom_stac_bbox_4326'],
                           datetime=start + (stop - start) / 2,
                           properties={})

        cm = item.common_metadata
        cm.start_datetime = start
        cm.end_datetime = stop
        cm.created = datetime.strptime(src['processingDate'], timestamp_format)
        cm.instruments = [common['instrumentShortName'].lower()]
        cm.constellation = common['constellation']
        cm.platform = common['platformFullname']

        SarExtension.add_to(item)
        SatExtension.add_to(item)
        ViewExtension.add_to(item)
        sar_ext = SarExtension.ext(item)
        sat_ext = SatExtension.ext(item)
        view_ext = ViewExtension.ext(item)
        # Extensions that are only referenced by their schema URL.
        item.stac_extensions.extend(['https://stac-extensions.github.io/processing/v1.1.0/schema.json',
                                     'https://stac-extensions.github.io/card4l/v0.1.0/sar/source.json'])

        enl = src['perfEquivalentNumberOfLooks']
        sar_ext.apply(
            instrument_mode=common['operationalMode'],
            frequency_band=FrequencyBand[common['radarBand'].upper()],
            polarizations=[Polarization[pol] for pol in common['polarisationChannels']],
            product_type=src['productType'],
            center_frequency=float(common['radarCenterFreq'] / 1e9),
            resolution_range=mean(src['rangeResolution'].values()),
            resolution_azimuth=mean(src['azimuthResolution'].values()),
            pixel_spacing_range=mean(src['rangePixelSpacing'].values()),
            pixel_spacing_azimuth=mean(src['azimuthPixelSpacing'].values()),
            looks_range=median(src['rangeNumberOfLooks'].values()),
            looks_azimuth=median(src['azimuthNumberOfLooks'].values()),
            looks_equivalent_number=float(enl),
            observation_direction=ObservationDirection[common['antennaLookDirection']],
        )

        sat_ext.apply(
            orbit_state=OrbitState[common['orbitDirection'].upper()],
            relative_orbit=common['orbitNumbers_rel']['stop'],
            absolute_orbit=common['orbitNumbers_abs']['stop'],
            anx_datetime=datetime.strptime(src['ascendingNodeDate'], timestamp_format),
        )

        view_ext.apply(incidence_angle=float(src['incidenceAngleMidSwath']),
                       azimuth=float(src['instrumentAzimuthAngle']))

        props = item.properties
        props.update({
            'processing:facility': src['processingCenter'],
            'processing:software': {src['processorName']: src['processorVersion']},
            'processing:level': common['processingLevel'],
            'card4l:specification': prod['productName-short'],
            'card4l:specification_version': prod['card4l-version'],
            'card4l:beam_id': common['swathIdentifier'],
            'card4l:orbit_data_source': src['orbitDataSource'],
            'card4l:orbit_mean_altitude': float(common['orbitMeanAltitude']),
        })

        # Look bandwidths are divided by 1e9 (GHz).
        bandwidths_ghz = {}
        for name, source_key in (('range_look_bandwidth', 'rangeLookBandwidth'),
                                 ('azimuth_look_bandwidth', 'azimuthLookBandwidth')):
            bandwidths_ghz[name] = {k: v / 1e9 for k, v in src[source_key].items()}
        props['card4l:source_processing_parameters'] = {
            'lut_applied': src['lutApplied'],
            'range_look_bandwidth': bandwidths_ghz['range_look_bandwidth'],
            'azimuth_look_bandwidth': bandwidths_ghz['azimuth_look_bandwidth'],
        }

        props['card4l:resolution_range'] = {k: float(v) for k, v in src['rangeResolution'].items()}
        props['card4l:resolution_azimuth'] = {k: float(v) for k, v in src['azimuthResolution'].items()}

        props.update({
            'card4l:source_geometry': src['dataGeometry'],
            'card4l:incidence_angle_near_range': src['incidenceAngleMin'],
            'card4l:incidence_angle_far_range': src['incidenceAngleMax'],
            'card4l:noise_equivalent_intensity': src['perfEstimates'],
            'card4l:noise_equivalent_intensity_type': src['perfNoiseEquivalentIntensityType'],
            'card4l:peak_sidelobe_ratio': src['perfPeakSideLobeRatio'],
            'card4l:integrated_sidelobe_ratio': src['perfIntegratedSideLobeRatio'],
            'card4l:mean_faraday_rotation_angle': src['faradayMeanRotationAngle'],
            'card4l:ionosphere_indicator': src['ionosphereIndicator'],
        })

        # The CARD4L specification is linked twice: as DOCX and as PDF.
        spec_title = 'CARD4L Product Family Specification: Normalised Radar Backscatter (v{})'.format(
            prod['card4l-version'])
        item.add_link(link=pystac.Link(
            rel='card4l-document',
            target=prod['card4l-link'].replace('.pdf', '.docx'),
            media_type='application/vnd.openxmlformats-officedocument.wordprocessingml.document',
            title=spec_title))
        item.add_link(link=pystac.Link(
            rel='card4l-document',
            target=prod['card4l-link'],
            media_type='application/pdf',
            title=spec_title))

        # Remaining reference links as (rel, target, title); none of them carry a media type.
        reference_links = [
            ('about', src['doi'],
             'Product definition reference.'),
            ('access', src['access'],
             'Product data access.'),
            ('satellite', common['platformReference'],
             'CEOS Missions, Instruments and Measurements Database record'),
            ('state-vectors', src['orbitStateVector'],
             'Orbit data file containing state vectors.'),
            ('sensor-calibration', src['sensorCalibration'],
             'Reference describing sensor calibration parameters.'),
            ('pol-cal-matrices', src['polCalMatrices'],
             'Reference to the complex-valued polarimetric distortion matrices.'),
            ('referenced-faraday-rotation', src['faradayRotationReference'],
             'Reference describing the method used to derive the estimate for the mean Faraday rotation angle.'),
        ]
        for rel, link_target, title in reference_links:
            item.add_link(link=pystac.Link(rel=rel, target=link_target, title=title))

        xml_path = outname.replace('.json', '.xml')
        xml_relpath = './' + os.path.relpath(xml_path, target).replace('\\', '/')
        xml_asset = pystac.Asset(href=xml_relpath,
                                 title='Metadata in XML format.',
                                 media_type=pystac.MediaType.XML,
                                 roles=['metadata', 'card4l'])
        item.add_asset(key='card4l', asset=xml_asset)

        item.save_object(dest_href=outname)
def parse(meta, target, tifs, exist_ok=False):
    """
    Wrapper for :func:`~S1_NRB.metadata.stac.source_json` and :func:`~S1_NRB.metadata.stac.product_json`.

    The source-level metadata is generated first, followed by the product-level metadata.

    Parameters
    ----------
    meta: dict
        Metadata dictionary generated with :func:`~S1_NRB.metadata.extract.meta_dict`
    target: str
        A path pointing to the root directory of a product scene.
    tifs: list[str]
        List of paths to all GeoTIFF files of the currently processed NRB product.
    exist_ok: bool, optional
        Do not create files if they already exist?
    """
    # Arguments shared by both generators.
    shared = {'meta': meta, 'target': target, 'exist_ok': exist_ok}
    source_json(**shared)
    product_json(tifs=tifs, **shared)
def make_catalog(directory, recursive=True, silent=False):
    """
    For a given directory of Sentinel-1 NRB products, this function will create a high-level STAC
    :class:`~pystac.catalog.Catalog` object serving as the STAC endpoint and lower-level STAC
    :class:`~pystac.collection.Collection` objects for each subdirectory corresponding to a unique MGRS tile ID.

    WARNING: The directory content will be reorganized into subdirectories based on unique MGRS tile IDs if this is
    not yet the case.

    Parameters
    ----------
    directory: str
        Path to a directory that contains Sentinel-1 NRB products.
    recursive: bool, optional
        Search for NRB products in `directory` recursively? Default is True.
    silent: bool, optional
        Should the output during directory reorganization be suppressed? Default is False.

    Returns
    -------
    nrb_catalog: pystac.catalog.Catalog
        STAC Catalog object

    Notes
    -----
    The returned STAC Catalog object contains Item asset hrefs that are absolute, whereas the actual on-disk files
    contain relative asset hrefs corresponding to the self-contained Catalog-Type. The returned in-memory STAC Catalog
    object deviates in this regard to ensure compatibility with the stackstac library:
    https://github.com/gjoseph92/stackstac/issues/20

    If an existing ``catalog.json`` already lists every product found in `directory`, that catalog is loaded and
    returned and nothing is changed on disk.
    """
    overwrite = False
    pattern = r'^S1[AB]_(IW|EW|S[1-6])_NRB__1S(SH|SV|DH|DV|VV|HH|HV|VH)_[0-9]{8}T[0-9]{6}_[0-9]{6}_' \
              r'[0-9A-F]{6}_[0-9A-Z]{5}_[0-9A-Z]{4}$'
    products = finder(target=directory, matchlist=[pattern], foldermode=2, regex=True, recursive=recursive)

    # Check if Catalog already exists
    catalog_path = os.path.join(directory, 'catalog.json')
    if os.path.isfile(catalog_path):
        overwrite = True
        catalog = pystac.Catalog.from_file(catalog_path)
        item_ids = {item.id for item in catalog.get_all_items()}
        missing = {os.path.basename(prod) for prod in products} - item_ids
        if not missing:
            # See note in docstring - https://github.com/gjoseph92/stackstac/issues/20
            catalog.make_all_asset_hrefs_absolute()
            print(f"\n#### Existing STAC endpoint found: {catalog_path}")
            return catalog

    # Placeholder extents; replaced per collection once its items are known.
    sp_extent = pystac.SpatialExtent([None, None, None, None])
    tmp_extent = pystac.TemporalExtent([None, None])

    products = _reorganize_by_tile(directory=directory, products=products, recursive=recursive, silent=silent)

    # Group the products by MGRS tile ID. The ID is taken from the product name only, because
    # searching the full path can pick up a look-alike token from a parent directory name and
    # a plain substring test can assign a product to several collections.
    tile_regex = re.compile(r'_[0-9A-Z]{5}_')
    products_by_tile = {}
    for prod in products:
        tile = tile_regex.search(os.path.basename(prod)).group().replace('_', '')
        products_by_tile.setdefault(tile, []).append(prod)

    nrb_catalog = pystac.Catalog(id='nrb_catalog',
                                 description='A STAC Catalog of Sentinel-1 NRB products.',
                                 title='Sentinel-1 NRB STAC Catalog',
                                 catalog_type=pystac.CatalogType.SELF_CONTAINED)

    # Sorted so that the order of the collections in the catalog is reproducible.
    for tile in sorted(products_by_tile):
        tile_collection = pystac.Collection(id=tile,
                                            description=f'A STAC Collection for Sentinel-1 NRB products corresponding '
                                                        f'to MGRS tile {tile}.',
                                            title='Sentinel-1 NRB STAC Collection',
                                            extent=pystac.Extent(sp_extent, tmp_extent),
                                            keywords=['sar', 'backscatter', 'esa', 'copernicus', 'sentinel'],
                                            providers=[pystac.Provider(name='ESA',
                                                                       roles=[pystac.ProviderRole.LICENSOR,
                                                                              pystac.ProviderRole.PRODUCER])])
        nrb_catalog.add_child(tile_collection)

        items = []
        for prod in products_by_tile[tile]:
            item_path = os.path.join(prod, os.path.basename(prod) + '.json')
            item = pystac.read_file(href=item_path)
            items.append(item)
            tile_collection.add_item(item=item)

        tile_collection.extent = pystac.Extent.from_items(items=items)

    # Save Catalog and Collections on disk
    nrb_catalog.normalize_and_save(root_href=directory)

    # See note in docstring - https://github.com/gjoseph92/stackstac/issues/20
    nrb_catalog.make_all_asset_hrefs_absolute()

    if overwrite:
        print(f"\n#### Existing STAC endpoint updated: {catalog_path}")
    else:
        print(f"\n#### New STAC endpoint created: {catalog_path}")
    return nrb_catalog
def _reorganize_by_tile(directory, products=None, recursive=True, silent=False):
    """
    Reorganizes a directory containing Sentinel-1 NRB products based on unique MGRS tile IDs.
    If a product is already located in a subdirectory named after the MGRS tile it was created for,
    it will not be moved.

    The user is asked for confirmation on standard input before anything is moved.

    Parameters
    ----------
    directory: str
        Path to a directory that contains Sentinel-1 NRB products.
    products: list[str], optional
        List of NRB product paths. Will be created from `directory` if not provided.
    recursive: bool, optional
        Search for NRB products in `directory` recursively? Default is True.
    silent: bool, optional
        If False (default), a message for each NRB product is printed if it has been moved to a new location or not.

    Returns
    -------
    products_new: list[str]
        An updated list of NRB product paths.

    Raises
    ------
    SystemExit
        If the user does not confirm the reorganization with 'yes'.
    """
    if products is None:
        pattern = r'^S1[AB]_(IW|EW|S[1-6])_NRB__1S(SH|SV|DH|DV|VV|HH|HV|VH)_[0-9]{8}T[0-9]{6}_[0-9]{6}_' \
                  r'[0-9A-F]{6}_[0-9A-Z]{5}_[0-9A-Z]{4}$'
        products = finder(target=directory, matchlist=[pattern], foldermode=2, regex=True, recursive=recursive)

    inp = input('WARNING:\n{}\nand the NRB products it contains will be reorganized into subdirectories '
                'based on unique MGRS tile IDs if this directory structure does not yet exist. '
                '\nDo you wish to continue? [yes|no] '.format(directory))
    if inp.strip().lower() != 'yes':
        print('abort!')
        # Raised directly instead of calling exit(), which is injected by the `site` module
        # and is not available in every interpreter setup.
        raise SystemExit

    # Group products by MGRS tile ID. The ID is read from the product name only, so that a
    # look-alike token in a parent directory name (e.g. 'run_ABCDE_out') cannot be mistaken for it.
    tile_regex = re.compile(r'_[0-9A-Z]{5}_')
    tile_dict = {}
    for prod in products:
        tile = tile_regex.search(os.path.basename(prod)).group().replace('_', '')
        tile_dict.setdefault(tile, []).append(prod)

    products_new = []
    for tile, tile_products in tile_dict.items():
        tile_dir = os.path.join(directory, tile)
        os.makedirs(tile_dir, exist_ok=True)
        for old_dir in tile_products:
            product_name = os.path.basename(old_dir)
            products_new.append(os.path.join(tile_dir, product_name))
            # Compare absolute paths so that differently spelled but identical locations
            # (relative vs. absolute, redundant separators) are recognised as "already in place".
            already_in_place = os.path.abspath(os.path.dirname(old_dir)) == os.path.abspath(tile_dir)
            if already_in_place:
                if not silent:
                    print(f"{product_name} already in {tile_dir} - skip")
                continue
            shutil.move(old_dir, os.path.join(tile_dir, product_name))
            if not silent:
                print(f"{product_name} moved to {tile_dir}")
    return products_new