# RestClient.py

'''
Created on 13 nov. 2018

@author: QFAURE
'''
import os
import logging
import requests #sudo pip install requests
import json
from pathlib import Path
from properties.p import Property
from typing import Iterable


# Send every record from DEBUG upwards to RestClient.log, prefixed with a timestamp.
logging.basicConfig(
    filename='RestClient.log',
    level=logging.DEBUG,
    format='%(asctime)s %(levelname)-8s %(message)s',
    datefmt='%Y-%m-%d %H:%M:%S',
)

# Base endpoint of the granule catalogue. BMAP_BACKEND_URL must be defined in the
# environment; a missing variable raises KeyError when this module is imported.
url = os.environ['BMAP_BACKEND_URL'] + 'catalogue/granule/'

def get_granule_by_name(granule_name: str, formatmetadata=False) -> Iterable:
    """Fetch the metadata of one granule from the catalogue by its name.

    Issues a GET request on ``url + 'granulename/' + granule_name``.

    Args:
        granule_name: Name (ID) of the granule to look up.
        formatmetadata: When truthy, the decoded JSON object is wrapped in a
            one-element list and passed through ``format_metadata``.

    Returns:
        The decoded JSON object, or the result of ``format_metadata`` when
        ``formatmetadata`` is set. ``{}`` when the response body is empty.
        ``None`` when the request fails or the body is not valid JSON; in
        both cases the error is printed and logged.
    """
    try:
        response = requests.get(url + 'granulename/' + granule_name)
        json_str = response.text
    except requests.exceptions.RequestException as e:
        print('ERROR: ' + str(e))
        logging.error(str(e))
        return None

    # An empty body means the catalogue has no granule with that name.
    if not json_str:
        print('INFO: There is no data with ID: ' + granule_name)
        logging.info('There is no data with ID: ' + granule_name)
        return {}

    try:
        json_obj = json.loads(json_str)
    except ValueError as e:
        # A non-JSON body (e.g. an HTML error page) is reported the same way
        # as a failed request instead of escaping as a raw decoding error.
        print('ERROR: ' + str(e))
        logging.error(str(e))
        return None

    if formatmetadata:
        return format_metadata([json_obj])
    return json_obj


# (key in the properties file, field name in the JSON request, value is a comma-separated list)
_CRITERIA_FIELDS = (
    ('start_date', 'startDate', False),
    ('end_date', 'endDate', False),
    ('product_types', 'productTypes', True),
    ('instrument_names', 'instrumentNames', True),
    ('polarizations', 'polarizations', True),
    ('geometry_types', 'geometryTypes', True),
    ('processing_levels', 'processingLevels', True),
    ('sub_region_names', 'subRegionNames', True),
    ('collection_names', 'collectionNames', True),
)


def _read_criterion(data_criteria, key: str) -> str:
    """Return the string stored under *key*, or '' when it is missing or not a string."""
    try:
        value = data_criteria[key]
    except (KeyError, TypeError):
        return ''
    return value if isinstance(value, str) else ''


def _split_names(raw: str) -> list:
    """Split a comma-separated value, tolerating a single space after each comma."""
    return raw.replace(', ', ',').split(',')


def get_granules_by_criteria(input_file: str='datacriteria.properties', formatmetadata=False) -> Iterable:
    """Search the catalogue for granules matching the criteria of a properties file.

    Every criterion is optional, but at least one besides ``scene_name`` must
    be present and non-empty. The criteria are POSTed to ``url`` as
    ``{"GranuleCriteria": {...}}``. When ``scene_name`` is given, the returned
    granules are additionally filtered with ``filter_by_scene``.

    Args:
        input_file: Path of the properties file holding the search criteria.
        formatmetadata: When truthy, the result is passed through
            ``format_metadata`` before being returned.

    Returns:
        The decoded JSON response (scene-filtered if requested), or the result
        of ``format_metadata`` when ``formatmetadata`` is set. ``{}`` when the
        response body is empty. ``None`` when the file does not exist, no
        usable criterion is found, the request fails or the body is not valid
        JSON; each of these cases is printed and logged.
    """
    if not Path(input_file).is_file():
        print('ERROR: The file "' + input_file + '" does not exist.')
        logging.error('The file "' + input_file + '" does not exist.')
        return None

    # load properties file
    data_criteria = Property().load_property_files(input_file)

    # Collect the non-empty criteria, keeping the field order of the request.
    criteria = {}
    for prop_key, json_key, is_list in _CRITERIA_FIELDS:
        raw = _read_criterion(data_criteria, prop_key)
        if raw:
            criteria[json_key] = _split_names(raw) if is_list else raw

    if not criteria:
        print('ERROR: You need to specify at least one search criteria besides scene name.')
        logging.error('You need to specify at least one search criteria besides scene name.')
        return None

    # json.dumps escapes quotes and backslashes in the values, which manual
    # string concatenation did not; for plain values the body is unchanged.
    request_body = json.dumps({'GranuleCriteria': criteria})
    try:
        response = requests.post(url, headers={'content-type': 'application/json'}, data=request_body)
        json_str = response.text
    except requests.exceptions.RequestException as e:
        print('ERROR: ' + str(e))
        logging.error(str(e))
        return None

    if not json_str:
        print('INFO: There is no data matching the given criteria.')
        logging.info('There is no data matching the given criteria.')
        return {}

    try:
        json_obj = json.loads(json_str)
    except ValueError as e:
        print('ERROR: ' + str(e))
        logging.error(str(e))
        return None

    # scene_name is optional like every other criterion: a missing key must
    # not raise, it simply disables the scene filter.
    scene_names = _read_criterion(data_criteria, 'scene_name')
    if scene_names:
        json_obj = filter_by_scene(json_obj, _split_names(scene_names))

    if formatmetadata:
        return format_metadata(json_obj)
    return json_obj


def to_table_string(string: str) -> str:
    """Turn a comma-separated string into the text of a JSON array of strings.

    Items are separated by ``,`` or ``, `` (comma plus one space), e.g.
    ``'a, b,c'`` becomes ``'["a", "b", "c"]'``. An empty input yields ``'[""]'``.

    Args:
        string: Comma-separated values.

    Returns:
        The JSON array as text. Quotes, backslashes and control characters
        inside the items are escaped so the result is always valid JSON;
        non-ASCII characters are kept as they are.
    """
    items = string.replace(', ', ',').split(',')
    return json.dumps(items, ensure_ascii=False)


def filter_by_scene(json_result, scene_list):
    """Remove, in place, the granules whose scene is not one of ``scene_list``.

    A granule is kept when its ``['Granule']['granuleScene']`` entry is empty
    (no scene attached) or when the scene's ``['Granule']['name']`` appears in
    ``scene_list``.

    Args:
        json_result: List of granule objects; it is modified in place.
        scene_list: Scene names to keep.

    Returns:
        The same ``json_result`` list object, after filtering.
    """
    def _keep(granule):
        scene_info = granule['Granule']['granuleScene']
        if not scene_info:
            return True
        return scene_info['Granule']['name'] in scene_list

    # Single pass with slice assignment: the caller's list is still mutated,
    # without the repeated scan-and-compare of list.remove() inside a loop.
    json_result[:] = [granule for granule in json_result if _keep(granule)]
    return json_result

def download_granule(granule_id: str, target_Dir: str) -> Iterable:
    """Download every data file of a granule into a directory.

    The granule metadata is fetched from ``url + 'granulename/' + granule_id``.
    For each entry of its ``['Granule']['dataList']``, the file named
    ``['Data']['fileName']`` is downloaded from ``['Data']['urlToData']``
    unless a file with that name already exists in ``target_Dir``.

    Args:
        granule_id: Name (ID) of the granule.
        target_Dir: Directory the file(s) will be saved in.

    Returns:
        The ``urlToData`` of the last entry if it was downloaded, or ``''``
        if that last file already existed or the data list is empty. ``{}``
        when the metadata response body is empty. ``None`` when a request
        fails (the error is printed and logged).
    """
    try:
        response = requests.get(url + 'granulename/' + granule_id)
        json_str = response.text
        # if the response body contains nothing, there is no such granule
        if not json_str:
            print('INFO: There is no data with ID: ' + granule_id)
            logging.info('There is no data with ID: ' + granule_id)
            return {}

        json_obj = json.loads(json_str)
        # Bound before the loop so an empty dataList returns '' instead of
        # failing on an unassigned local.
        url_to_data = ''
        for data in json_obj['Granule']['dataList']:
            file_name = data['Data']['fileName']
            # One path for both the existence check and the write.
            destination = os.path.join(target_Dir, file_name)
            url_to_data = ''
            if Path(destination).is_file():
                print(file_name+' already exists in targetDir: '+ target_Dir)
                logging.info(file_name+' already exists in targetDir: '+ target_Dir)
            else:
                url_to_data = data['Data']['urlToData']
                r = requests.get(url_to_data, allow_redirects=True)
                # Context manager guarantees the file is flushed and closed.
                with open(destination, 'wb') as out_file:
                    out_file.write(r.content)
                print(file_name+' has been successfully downloaded in targetDir: '+ target_Dir)
                logging.info(file_name+' has been successfully downloaded in targetDir: '+ target_Dir)

        return url_to_data
    except requests.exceptions.RequestException as e:
        print('ERROR: ' + str(e))
        logging.error(str(e))
        return None

#########################################################################

# -*- coding: utf-8 -*-
class dataset:
    """Holds a campaign's data stack together with its auxiliary information."""

    def __init__(self):
        """Start with no campaign, no scenes and empty lookup tables."""
        # Campaign name and the list of scene names, in order of discovery.
        self.campaign: str = ""
        self.scenes: list = []

        # SLC granule names and file locations.
        self.SLClist: dict = {}
        self.SLCFilenames: dict = {}

        # Acquisition metadata tables.
        self.heading: dict = {}
        self.z_flight: dict = {}
        self.z_terrain: dict = {}
        self.GRD_resol: dict = {}
        self.pixel_spacing: dict = {}
        self.surface_resol: dict = {}
        self.SLR_start: dict = {}
        self.master: dict = {}

        # DEM name and locations of the auxiliary raster files.
        self.demname: dict = {}
        self.demFilenames: dict = {}
        self.incFilenames: dict = {}
        self.kzFilenames: dict = {}
        self.azimuthFiles: dict = {}
        self.rangeFiles: dict = {}
        
def get_url(collection,granulename):
    """Return the ``filePath`` of the first data entry of a granule.

    The granule is looked up through ``get_granule_by_name`` under the
    identifier ``collection + ':@' + granulename``. Nothing is caught here:
    a failed lookup or an unexpected structure raises to the caller.
    """
    granule_id = collection + ':@' + granulename
    first_entry = get_granule_by_name(granule_id)['Granule']['dataList'][0]
    return first_entry['Data']['filePath']

def _find_scene_file(campaign, scene_meta, pattern, master_token=None):
    """Locate one auxiliary file of a scene and return its location, or ''.

    The first name in ``scene_meta['granuleList']`` matching the regular
    expression ``pattern`` is resolved with ``get_url`` (errors from that call
    are not caught). If nothing matches and ``master_token`` is given, the
    scene's master is queried instead and the first of its granule names
    containing ``master_token`` is resolved; any failure on that fallback
    path yields ''.
    """
    import re

    for file_name in scene_meta['granuleList']:
        if re.search(pattern, file_name):
            return get_url(campaign, file_name)

    if master_token is None:
        return ''

    master = scene_meta['master']
    # No master recorded (missing value, empty string or the 'n/a' marker).
    if not master or master == 'n/a':
        return ''
    try:
        master_files = get_granule_by_name(campaign + ':@' + master)['Granule']['granuleList']
        candidate = [name for name in master_files if master_token in name][0]
        return get_url(campaign, candidate)
    except Exception:
        # Best effort: an unreachable or incomplete master leaves the entry empty.
        return ''


def format_metadata(json_result):
    """Build a ``dataset`` from a list of granule JSON objects.

    The campaign name is read from the first granule's collection
    ``shortName``. Only granules whose ``productType`` is ``'SLC'`` are used:
    each one adds its name and file location under the key
    ``(scene, polarization)``. The first time a scene is met, its metadata
    (heading, zFlight, zTerrain, grdResol, pixelSpacing, surfaceResol,
    slrStart, master, dem) and the locations of its DEM, azimuth, range,
    incidence and kz files are recorded under the scene name.

    Args:
        json_result: List of granule objects as decoded from the catalogue.

    Returns:
        The filled ``dataset``; an empty one when ``json_result`` is empty.
    """
    # Init
    data_stack = dataset()
    if not json_result:
        # Nothing to parse (e.g. every granule was filtered out).
        return data_stack

    data_stack.campaign = json_result[0]['Granule']['collection']['Collection']['shortName']
    campaign = data_stack.campaign

    # All the granules of the collection are returned, so the scene list has
    # to be extracted from the granules themselves.
    for granule in json_result:
        meta = granule['Granule']
        if meta['productType'] != 'SLC':
            continue

        scene_meta = meta['granuleScene']['Granule']
        scene = scene_meta['name']

        # input file names, one per (scene, polarisation)
        key = (scene, meta['polarization'])
        granule_name = meta['name']
        granule_url = get_url(campaign, granule_name)
        data_stack.SLClist[key] = granule_name
        data_stack.SLCFilenames[key] = granule_url

        # Scene-level metadata is stored once, on the first granule of a scene.
        if scene in data_stack.scenes:
            continue
        data_stack.scenes.append(scene)

        data_stack.heading[scene] = scene_meta['heading']
        data_stack.z_flight[scene] = scene_meta['zFlight']
        data_stack.z_terrain[scene] = scene_meta['zTerrain']
        data_stack.GRD_resol[scene] = scene_meta['grdResol']
        data_stack.pixel_spacing[scene] = scene_meta['pixelSpacing']
        data_stack.surface_resol[scene] = scene_meta['surfaceResol']
        data_stack.SLR_start[scene] = scene_meta['slrStart']
        data_stack.master[scene] = scene_meta['master']

        dem_name = scene_meta['dem']
        data_stack.demname[scene] = dem_name

        # if a dem is referenced, try to get its filename
        dem_file = ''
        if dem_name:
            try:
                dem_file = get_url(campaign, campaign + '_' + dem_name + '_dem.tiff')
            except Exception:
                dem_file = ''
        data_stack.demFilenames[scene] = dem_file

        # Auxiliary rasters: taken from the scene itself, else from its master
        # (kz has no master fallback). The patterns are regular expressions,
        # so their '.' matches any character.
        data_stack.azimuthFiles[scene] = _find_scene_file(campaign, scene_meta, "az.tiff", "az")
        data_stack.rangeFiles[scene] = _find_scene_file(campaign, scene_meta, "rg.tiff", "rg")
        data_stack.incFilenames[scene] = _find_scene_file(campaign, scene_meta, "inc.tiff", "inc")
        data_stack.kzFilenames[scene] = _find_scene_file(campaign, scene_meta, "kz.tiff")
    return data_stack