Source code for pyLARDA

#!/usr/bin/python3


import pyLARDA.Connector as Connector
import pyLARDA.ParameterInfo as ParameterInfo
import pyLARDA.spec2mom_limrad94 as spec2mom_limrad94
import datetime, os, calendar, copy, time
from pathlib import Path
import numpy as np
import csv
import logging
import toml
import requests
import json
import pprint

from pyLARDA._meta import __version__, __author__, __init_text__, __default_info__

ROOT_DIR = Path(__file__).resolve().parent
logger = logging.getLogger(__name__)

os.environ["HDF5_USE_FILE_LOCKING"] = 'FALSE'

[docs] class LARDA : """init a new larda instance Args: data_source (str, optional): either ``'local'``, ``'remote'`` or ``'filepath'`` uri: link to backend Returns: larda object """ def __init__(self, data_source='local', uri=None): if data_source == 'local': self.data_source = 'local' self.camp = LARDA_campaign(ROOT_DIR.parents[1] / "larda-cfg", 'campaigns.toml') self.campaign_list = self.camp.get_campaign_list() elif data_source == 'remote': self.data_source = 'remote' self.uri = uri resp = requests.get(self.uri + '/api/') self.campaign_list = resp.json()['campaign_list'] elif data_source == 'filepath': self.data_source = 'filepath' self.uri = '' self.campaign_list = [] logger.warning(__init_text__) logger.warning(f"campaign list: {', '.join(self.campaign_list)}")
[docs] def connect(self, *args, **kwargs): "switch to decide whether connect to local or remote data source" if self.data_source == 'local': return self.connect_local(*args, **kwargs) elif self.data_source == 'remote': return self.connect_remote(*args, **kwargs) elif self.data_source == 'filepath': return self.connect_templates(*args, **kwargs)
[docs] def connect_local(self, camp_name, build_lists=True, filt=None): """built the connector list for the specified campaign (only valid systems are considered) the connectors are instances of the Connector.Connector Class NEW: one connector per system then the params are parts of this system Args: camp_name (str): name of campaign as defined in ``campaigns.toml`` build_lists (Bool, optional): Flag to build the filelists or not (with many files this may take some time) filt (list, optional): Filter for name ``['system', 'MIRA']`` or insturment identifiert ``['instr_name', 'hatpro_g2_lacros']`` """ self.connectors={} logger.info("campaign list " + ' '.join(self.camp.get_campaign_list())) logger.info("camp_name set {}".format(camp_name)) description_dir = ROOT_DIR.parents[1] / "larda-description" self.camp.assign_campaign(camp_name) config_file=self.camp.CONFIGURATION_FILE cinfo_hand_down = {'coordinates': self.camp.COORDINATES, 'altitude': self.camp.ALTITUDE, 'location': self.camp.LOCATION, 'mira_azi_zero': self.camp.info_dict['mira_azi_zero']} logger.debug("config file {}".format(config_file)) paraminformation = ParameterInfo.ParameterInfo( self.camp.config_dir, config_file, cinfo_hand_down=cinfo_hand_down, root=ROOT_DIR) starttime = time.time() if filt is not None and filt[0] == 'system': assert filt[1] in self.camp.VALID_SYSTEMS, f"{filt[1]} not in VALID_SYSTEMS" self.camp.VALID_SYSTEMS = [filt[1]] filt = None logger.info("camp.VALID_SYSTEMS {}".format(self.camp.VALID_SYSTEMS)) #if camp_name == 'LACROS_at_Leipzig': # build_lists = False # build the filelists or load them from json for system, systeminfo in paraminformation.iterate_systems( keys=self.camp.VALID_SYSTEMS, filter=filt): logger.debug('current parameter {} {}'.format(system, systeminfo)) if system in self.camp.system_only: valid_dates = self.camp.system_only[system] else: valid_dates = self.camp.VALID_DATES conn = Connector.Connector(system, systeminfo, valid_dates, description_dir=description_dir) if build_lists: conn.build_filehandler() conn.save_filehandler(self.camp.info_dict['connectordump'], camp_name) else: #load lists conn.load_filehandler(self.camp.info_dict['connectordump'], camp_name) if system in self.camp.VALID_SYSTEMS: self.connectors[system] = conn else: logger.warning("{} not in valid systems".format(system)) logger.info('Time for generating connectors (build_lists {}) {} s'.format( build_lists, time.time() - starttime)) #print "Availability array: ", self.array_avail(2014, 2) logger.warning(self.camp.INFO_TEXT) logger.info("systems {}".format(self.connectors.keys())) logger.info("Parameters in stock: {}".format([(k, self.connectors[k].params_list) for k in self.connectors.keys()])) return self
[docs] def connect_remote(self, camp_name, **kwargs): """connect to a remote data source Args: camp_name: name of the campaign in the remote source """ logger.info("connect_remote {}".format(camp_name)) resp = requests.get(self.uri + '/api/{}/'.format(camp_name)) #print(resp.json()) self.camp = LARDA_campaign_remote(resp.json()['config_file']) self.camp.INFO_TEXT = resp.json()['info_text'] self.connectors = {} for k, c in resp.json()['connectors'].items(): self.connectors[k] = Connector.Connector_remote(camp_name, k, c, self.uri) logger.warning(self.camp.INFO_TEXT) return self
[docs] def connect_templates(self, c_info={}): """set up the connector for the filepath option Args: c_info (optional): campaign meta info """ template_files = list((ROOT_DIR / 'template_params').glob('*')) self.connectors = {} self.camp = LARDA_campaign_remote(c_info) templist = ['coordinates', 'altitude', 'location', 'mira_azi_zero'] cinfo_hand_down = {k: v for k,v in c_info.items() if k in templist} for f in template_files: temp = toml.load(f) temp = ParameterInfo.do_parameter_generic_inheritance( temp, cinfo_hand_down=cinfo_hand_down) for system, systeminfo in temp.items(): conn = Connector.Connector(system, systeminfo, []) self.connectors[system] = conn logger.info("Systems with default templates {}".format(self.connectors.keys())) logger.info("Parameters in stock: {}".format([(k, self.connectors[k].params_list) for k in self.connectors.keys()])) return self
[docs] def read(self, system, parameter, time_interval, *further_slices, **kwargs): """ Args: system (str): identifier for the system parameter (str): choosen param time_interval: ``[dt, dt]`` time interval, or [dt] one time *further_slices: range, vel,.. ``[0, max]`` or [3000] Returns: the dictionary with data """ if self.data_source == 'filepath': data = self.connectors[system].collect_path(parameter, time_interval, *further_slices, **kwargs) else: data = self.connectors[system].collect(parameter, time_interval, *further_slices, **kwargs) return data
[docs] def description(self, system, parameter): """ Args: system (str): identifier for the system parameter (str): choosen param Returns: the description tag as string """ descr = self.connectors[system].description(parameter) return descr
def print_params(self): print("System, Param") [print(k, self.connectors[k].params_list) for k in self.connectors.keys()]
[docs] def get_avail_dict(self, *args): """get the no files for each date Args: *args: either empty or `system`, `parameter` Returns: the number of files per day for each system """ if len(args) == 0: return {system:conn.get_as_plain_dict() for system, conn in self.connectors.items()} elif len(args) == 2: system, param = args d = self.connectors[system].get_as_plain_dict() return d['avail'][d['params'][param]]
[docs] def resolve_today(lst): """ resolve 'today' in [['2012101', 'today']]""" return [[e[0], e[1]] if e[1] != 'today' else [e[0], datetime.datetime.utcnow().strftime("%Y%m%d")] for e in lst ]
[docs] class LARDA_campaign: """ provides information about campaigns collected in LARDA""" def __init__(self, config_dir, campaign_file): logger.info('campaign file at LARDA_campaign ' + campaign_file) self.campaigns = toml.load(config_dir / campaign_file) self.campaigns = toml.load(Path(config_dir) / Path(campaign_file)) self.campaign_list = list(self.campaigns.keys()) self.config_dir = config_dir
[docs] def get_campaign_list(self): """ list of all campaign names stored in csv-file """ return self.campaign_list
[docs] def assign_campaign(self, name): """dedicate object to a specific campaign""" self.info_dict = self.campaigns[name] logger.debug("info dict@assing campaign {}".format(self.info_dict)) self.ALTITUDE=float(self.info_dict['altitude']) self.VALID_SYSTEMS = self.info_dict['systems'] self.VALID_DATES = resolve_today(self.info_dict["duration"]) self.COORDINATES = self.info_dict["coordinates"] self.CLOUDNET_STATIONNAME = self.info_dict["cloudnet_stationname"] self.CONFIGURATION_FILE = self.info_dict["param_config_file"] self.LOCATION = self.info_dict["location"] if not 'info_text_loc' in self.info_dict \ or self.info_dict['info_text_loc'] == 'default': self.INFO_TEXT = __default_info__ else: self.INFO_TEXT = toml.load( self.config_dir / self.info_dict['info_text_loc'])['info_text'] if 'system_only' in self.info_dict: self.system_only = { k: resolve_today(v) for k, v in self.info_dict['system_only'].items()} else: self.system_only = {}
[docs] class LARDA_campaign_remote: """store the campaign information in a similar structure as for local""" def __init__(self, info_dict): self.info_dict = info_dict if 'altitude' in info_dict: self.ALTITUDE=float(self.info_dict['altitude']) if 'systems' in info_dict: self.VALID_SYSTEMS = self.info_dict['systems'] if 'duration' in info_dict: self.VALID_DATES = resolve_today(self.info_dict["duration"]) if 'coordinates' in info_dict: self.COORDINATES = self.info_dict["coordinates"] if 'cloudnet_stationname' in info_dict: self.CLOUDNET_STATIONNAME = self.info_dict["cloudnet_stationname"] if 'param_config_file' in info_dict: self.CONFIGURATION_FILE = self.info_dict["param_config_file"] if 'location' in info_dict: self.LOCATION = self.info_dict["location"] self.INFO_TEXT = ''