scc_access/scc_access.py

Wed, 25 May 2022 23:00:57 +0200

author
Claudio Dema <claudio.dema@imaa.cnr.it>
date
Wed, 25 May 2022 23:00:57 +0200
changeset 68
70c869fa3242
parent 67
0106aeed80d8
child 69
cd8bc07f8419
permissions
-rw-r--r--

Added more filters (date interval, stations) to the list method; new method E-SHAPE downloader for batch execution;

ioannis@67 1 """ This is a script that allows interaction with the SCC through the command line.
ioannis@67 2
ioannis@67 3 It is based on the requests module for accessing the server.
ioannis@67 4
ioannis@67 5 Most of the interactions are done through the web interface, i.e. by mimicking user interaction with the
ioannis@67 6 SCC website (i.e. user login, data submission, etc.). In a few cases, the SCC API is also used.
ioannis@67 7
ioannis@67 8 Most of the functionality is included in the SCC class. The class is used to login into the SCC website and automate
ioannis@67 9 interaction with the site (i.e. upload a file, get measurement status, etc.).
ioannis@67 10
ioannis@67 11 Two other classes (Measurement, AncillaryFile) are used in some cases to handle the output of the SCC API.
ioannis@67 12
ioannis@67 13 Several shortcut functions are defined to perform specific tasks using the SCC class (e.g. process_file, delete_measurements etc).
ioannis@67 14 """
ioannis@43 15 import sys
ioannis@43 16
victor@7 17 import requests
victor@7 18
ioannis@43 19 try:
ioannis@43 20 import urllib.parse as urlparse # Python 3
ioannis@43 21 except ImportError:
ioannis@17 22 import urlparse # Python 2
ioannis@43 23
victor@7 24 import argparse
madrouin@24 25 import datetime
madrouin@24 26 import logging
victor@7 27 import os
victor@7 28 import re
ioannis@32 29 from io import BytesIO
ioannis@45 30
victor@7 31 import time
i@40 32
victor@7 33 from zipfile import ZipFile
madrouin@24 34
i@14 35 import yaml
victor@7 36
ioannis@43 37 import netCDF4 as netcdf
ioannis@43 38
# Silence the urllib3 warnings globally.
# NOTE(review): presumably needed because the SCC session is used with certificate verification off - confirm.
requests.packages.urllib3.disable_warnings()
logger = logging.getLogger(__name__)

# The regex to find the measurement id in the HTML of the measurement page.
# The same id can also be read from the uploaded NetCDF file (global attribute Measurement_ID).
regex = "<h3>Measurement (?P<measurement_id>.{12,15}) <small>"  # {12, 15} to handle both old- and new-style measurement ids.
victor@7 45
victor@7 46
victor@7 47 class SCC:
ioannis@67 48 """A class that will attempt to interact with the SCC server.
i@14 49
ioannis@67 50 Most interactions are by simulating a normal browser session. In the current
ioannis@67 51 version few checks are performed before upload a file, and no feedback is given in case the upload
ioannis@67 52 fails.
victor@7 53 """
victor@7 54
def __init__(self, auth, output_dir, base_url):
    """ Prepare a requests session and pre-compute every SCC URL used by the other methods.

    Parameters
    ----------
    auth
       Authentication object. It is stored on the instance and also set as ``auth`` on the session.
    output_dir : str
       Base output directory. It is only stored here.
    base_url : str
       Root URL of the SCC site. All page and API URLs are joined onto it.
    """
    self.auth = auth
    self.output_dir = output_dir
    self.base_url = base_url

    http_session = requests.Session()
    http_session.auth = auth
    # NOTE(review): certificate verification is switched off for every request made through this session.
    http_session.verify = False
    self.session = http_session

    def site_url(path):
        # Resolve a path relative to the SCC root URL.
        return urlparse.urljoin(base_url, path)

    # Web-site pages. Patterns keep a '{0}' placeholder for the measurement id.
    self.login_url = site_url('accounts/login/')
    self.logout_url = site_url('accounts/logout/')
    self.list_measurements_url = site_url('data_processing/measurements/')
    self.upload_url = site_url('data_processing/measurements/quick/')
    self.measurement_page_pattern = site_url('data_processing/measurements/{0}/')
    self.delete_measurement_pattern = site_url('admin/database/measurements/{0}/delete/')

    # Download pages, one per product type.
    self.download_hirelpp_pattern = site_url('data_processing/measurements/{0}/download-hirelpp/')
    self.download_cloudmask_pattern = site_url('data_processing/measurements/{0}/download-cloudmask/')
    self.download_elpp_pattern = site_url('data_processing/measurements/{0}/download-preprocessed/')
    self.download_elda_pattern = site_url('data_processing/measurements/{0}/download-optical/')
    self.download_plots_pattern = site_url('data_processing/measurements/{0}/download-plots/')
    self.download_elic_pattern = site_url('data_processing/measurements/{0}/download-elic/')

    # API end points, all relative to the API root.
    self.api_base_url = site_url('api/v1/')

    def api_url(path):
        # Resolve a path relative to the API root URL.
        return urlparse.urljoin(self.api_base_url, path)

    self.api_measurement_pattern = api_url('measurements/{0}/')
    self.api_measurements_url = api_url('measurements')
    self.api_sounding_search_pattern = api_url('sounding_files/?filename={0}')
    self.api_lidarratio_search_pattern = api_url('lidarratio_files/?filename={0}')
    self.api_overlap_search_pattern = api_url('overlap_files/?filename={0}')
ioannis@43 93
def login(self, credentials):
    """ Login to the SCC through the web login form.

    Parameters
    ----------
    credentials : tuple or list
       A list or tuple in the form (username, password).

    Returns
    -------
    The response of the POST request that submits the credentials.

    Raises
    ------
    self.PageNotAccessibleError
       If the login page cannot be fetched.
    """
    logger.debug("Attempting to login to SCC, username %s.", credentials[0])
    form_fields = {'username': credentials[0],
                   'password': credentials[1]}

    logger.debug("Accessing login page at %s.", self.login_url)

    # The login page is fetched first because its csrftoken cookie is needed for the POST below.
    login_page = self.session.get(self.login_url)

    if not login_page.ok:
        raise self.PageNotAccessibleError('Could not access login pages. Status code %s' % login_page.status_code)

    logger.debug("Submitting credentials.")
    request_headers = {'X-CSRFToken': login_page.cookies['csrftoken'],
                       'referer': self.login_url}
    return self.session.post(self.login_url, data=form_fields, headers=request_headers)
victor@7 121
def logout(self):
    """ Logout from the SCC by requesting the logout page.

    Returns
    -------
    The response of the GET request to the logout URL (requested with ``stream=True``).
    """
    logout_response = self.session.get(self.logout_url, stream=True)
    return logout_response
victor@7 125
def upload_file(self, filename, system_id, force_upload, delete_related, delay=0, rs_filename=None,
                ov_filename=None, lr_filename=None):
    """ Upload a file for processing.

    If the upload is successful, it returns the measurement id.

    Parameters
    ----------
    filename : str
       File path of the file to upload
    system_id : int
       System id to be used in the processing
    force_upload : bool
       If True and a measurement with the same ID is found on the server, it is first deleted and the
       current file is uploaded. If False, the file is not uploaded when the measurement ID is
       already present on the SCC server (the program exits).
    delete_related : bool
       Answer to the "delete related" question when deleting existing measurements from the SCC.
    delay : int
       Value submitted in the 'delay' field of the upload form.
    rs_filename, ov_filename, lr_filename : str
       Paths of the ancillary files (sounding, overlap, lidar ratio) to be uploaded.

    Returns
    -------
    str or False
       The measurement id parsed from the page shown after the upload, or False if the request did not
       return status 200 or the server did not redirect away from the upload page.
    """
    # Get the measurement ID from the netcdf file
    measurement_id = self.measurement_id_from_file(filename)

    # Handle possible existing measurements with the same ID on the SCC server.
    logger.debug('Checking if a measurement with the same id already exists on the SCC server.')
    existing_measurement, _ = self.get_measurement(measurement_id)

    if existing_measurement:
        if force_upload:
            logger.info(
                "Measurement with id {} already exists on the SCC. Trying to delete it...".format(measurement_id))
            self.delete_measurement(measurement_id, delete_related)
        else:
            logger.error(
                "Measurement with id {} already exists on the SCC. Use --force_upload flag to overwrite it.".format(
                    measurement_id))
            # TODO: Implement handling at the proper place. Exiting here does not allow the SCC class to be
            # used by external programs. Instead an exception should be raised.
            sys.exit(1)

    # Get submit page (its csrftoken cookie is needed for the POST below)
    upload_page = self.session.get(self.upload_url)

    upload_data = {'system': system_id,
                   'delay': delay}

    logger.debug("Submitted processing parameters - System: {}, Delay: {}".format(system_id, delay))

    # (form field, local path, ancillary type passed to get_ancillary, label used in log messages)
    ancillary_specs = (
        ('sounding_file', rs_filename, 'sounding', 'Sounding'),
        ('overlap_file', ov_filename, 'overlap', 'Overlap'),
        ('lidar_ratio_file', lr_filename, 'lidarratio', 'Lidar ratio'),
    )

    files = {}
    try:
        files['data'] = open(filename, 'rb')

        # Add ancillary files to be uploaded, skipping those that the SCC already has.
        for form_field, path, ancillary_type, label in ancillary_specs:
            if path is None:
                continue

            ancillary_file, _ = self.get_ancillary(path, ancillary_type)

            if ancillary_file.already_on_scc:
                logger.warning(
                    "{1} file {0.filename} already on the SCC with id {0.id}. Ignoring it.".format(
                        ancillary_file, label))
            else:
                logger.debug('Adding %s file %s', label.lower(), path)
                files[form_field] = open(path, 'rb')

        # Upload the files
        logger.info("Uploading of file %s started.", filename)

        upload_submit = self.session.post(self.upload_url,
                                          data=upload_data,
                                          files=files,
                                          headers={'X-CSRFToken': upload_page.cookies['csrftoken'],
                                                   'referer': self.upload_url})
    finally:
        # Close every file handle that was opened, also when the request (or an ancillary check) fails.
        for handle in files.values():
            handle.close()

    if upload_submit.status_code != 200:
        logger.warning("Connection error. Status code: %s", upload_submit.status_code)
        return False

    # Check if there was a redirect to a new page. If not, something went wrong
    if upload_submit.url == self.upload_url:
        measurement_id = False
        logger.error("Uploaded file(s) rejected! Try to upload manually to see the error.")
    else:
        # TODO: Check if this is needed. This was used when the measurement ID was not read from the input file.
        measurement_id = re.findall(regex, upload_submit.text)[0]  # Get the measurement ID from the output page
        logger.info("Successfully uploaded measurement with id %s.", measurement_id)
        logger.info("You can monitor the processing progress online: {}".format(
            self.measurement_page_pattern.format(measurement_id)))

    return measurement_id
ioannis@43 237
@staticmethod
def measurement_id_from_file(filename):
    """ Read the measurement id stored in the input file.

    The id is taken from the ``Measurement_ID`` global attribute of the NetCDF file. The program exits
    with status 1 if the file does not exist or the attribute is missing.

    Parameters
    ----------
    filename : str
       File path of the input file.

    Returns
    -------
    The value of the ``Measurement_ID`` global attribute.
    """
    file_found = os.path.isfile(filename)
    if not file_found:
        logger.error("File {} does not exist.".format(filename))
        sys.exit(1)

    # A private sentinel tells "attribute missing" apart from any real attribute value.
    not_present = object()

    with netcdf.Dataset(filename) as dataset:
        measurement_id = getattr(dataset, 'Measurement_ID', not_present)

    if measurement_id is not_present:
        logger.error(
            "Input file {} does not contain a Measurement_ID global attribute. Wrong file format?".format(
                filename))
        sys.exit(1)

    return measurement_id
victor@7 262
def download_files(self, measurement_id, subdir, download_url):
    """ Download a zip archive from download_url and extract its files to the specified subdir.

    This is a general method used by the other, file-specific, download methods. The files are written
    flat (without the directory structure of the archive) into
    ``<output_dir>/<measurement_id>/<subdir>``.

    Parameters
    ----------
    measurement_id : str
       Measurement id; used for the local directory name and in the error message.
    subdir : str
       Name of the sub-directory to write the extracted files to.
    download_url : str
       URL of the zip archive.

    Raises
    ------
    Exception
       If the server response is not ok.
    """
    # TODO: Make downloading more robust (e.g. in case that files do not exist on server).
    request = self.session.get(download_url, stream=True)

    if not request.ok:
        raise Exception("Could not download files for measurement '%s'" % measurement_id)

    # Create the dir if it does not exist
    local_dir = os.path.join(self.output_dir, measurement_id, subdir)
    if not os.path.exists(local_dir):
        os.makedirs(local_dir)

    # Read the archive chunk by chunk into memory, needed if the file is big.
    memory_file = BytesIO()
    for chunk in request.iter_content(chunk_size=1024):
        if chunk:  # filter out keep-alive new chunks
            memory_file.write(chunk)

    with ZipFile(memory_file) as zip_file:
        for zipped_name in zip_file.namelist():
            basename = os.path.basename(zipped_name)

            # Directory entries end with '/' and have an empty basename; there is nothing to write for them.
            if not basename:
                continue

            local_file = os.path.join(local_dir, basename)

            with open(local_file, 'wb') as f:
                f.write(zip_file.read(zipped_name))
victor@7 299
def download_hirelpp(self, measurement_id):
    """ Fetch the HiRElPP files of a measurement into the 'hirelpp' sub-directory.

    Download failures are logged and not re-raised.
    """
    hirelpp_url = self.download_hirelpp_pattern.format(measurement_id)

    try:
        self.download_files(measurement_id, 'hirelpp', hirelpp_url)
    except Exception as error:
        logger.error("Could not download HiRElPP files. Error message: {}".format(error))
        logger.debug('Download exception:', exc_info=True)
ioannis@43 309
def download_cloudmask(self, measurement_id):
    """ Fetch the cloudmask files of a measurement into the 'cloudscreen' sub-directory.

    Download failures are logged and not re-raised.
    """
    cloudmask_url = self.download_cloudmask_pattern.format(measurement_id)

    try:
        self.download_files(measurement_id, 'cloudscreen', cloudmask_url)
    except Exception as error:
        logger.error("Could not download cloudscreen files. Error message: {}".format(error))
        logger.debug('Download exception:', exc_info=True)
ioannis@43 319
def download_elpp(self, measurement_id):
    """ Fetch the preprocessed (ElPP) files of a measurement into the 'elpp' sub-directory.

    Download failures are logged and not re-raised.
    """
    elpp_url = self.download_elpp_pattern.format(measurement_id)

    try:
        self.download_files(measurement_id, 'elpp', elpp_url)
    except Exception as error:
        logger.error("Could not download ElPP files. Error message: {}".format(error))
        logger.debug('Download exception:', exc_info=True)
victor@7 329
def download_elda(self, measurement_id):
    """ Fetch the optical (ELDA) files of a measurement into the 'elda' sub-directory.

    Download failures are logged and not re-raised.
    """
    elda_url = self.download_elda_pattern.format(measurement_id)

    try:
        self.download_files(measurement_id, 'elda', elda_url)
    except Exception as error:
        logger.error("Could not download ELDA files. Error message: {}".format(error))
        logger.debug('Download exception:', exc_info=True)
victor@7 339
def download_plots(self, measurement_id):
    """ Fetch the profile graphs (ELDA plots) of a measurement into the 'elda_plots' sub-directory.

    Download failures are logged and not re-raised.
    """
    plots_url = self.download_plots_pattern.format(measurement_id)

    try:
        self.download_files(measurement_id, 'elda_plots', plots_url)
    except Exception as error:
        logger.error("Could not download ELDA plots. Error message: {}".format(error))
        logger.debug('Download exception:', exc_info=True)
victor@7 349
def download_elic(self, measurement_id):
    """ Fetch the ELIC files of a measurement into the 'elic' sub-directory.

    Download failures are logged and not re-raised.
    """
    elic_url = self.download_elic_pattern.format(measurement_id)

    try:
        self.download_files(measurement_id, 'elic', elic_url)
    except Exception as error:
        logger.error("Could not download ELIC files. Error message: {}".format(error))
        logger.debug('Download exception:', exc_info=True)
ioannis@43 359
def download_eldec(self, measurement_id):
    """ Download ELDEC files for the measurement id into the 'eldec' sub-directory.

    The files are requested from the ELDA download URL (there is no ELDEC-specific pattern for now).
    Download failures are logged and not re-raised.
    """
    # Construct the download url
    download_url = self.download_elda_pattern.format(measurement_id)  # ELDA pattern is used for now
    try:
        self.download_files(measurement_id, 'eldec', download_url)
    except Exception as e:
        logger.error("Could not download ELDEC files. Error message: {}".format(e))
        logger.debug('Download exception:', exc_info=True)
ioannis@43 369
def rerun_elpp(self, measurement_id, monitor=True):
    """ Ask the SCC to rerun the ElPP step of an existing measurement.

    Nothing is done if the measurement cannot be retrieved.

    Parameters
    ----------
    measurement_id : str
       Id of the measurement to rerun.
    monitor : bool
       If True, the processing is monitored (see monitor_processing) after the rerun request.
    """
    logger.debug("Started rerun_elpp procedure.")

    logger.debug("Getting measurement %s", measurement_id)
    measurement, status = self.get_measurement(measurement_id)

    if measurement:
        # Log the URL that is actually requested (the ElPP one, not the rerun-all one).
        logger.debug("Attempting to rerun ElPP through %s.", measurement.rerun_elpp_url)
        request = self.session.get(measurement.rerun_elpp_url, stream=True)

        if request.status_code != 200:
            logger.error(
                "Could not rerun processing for %s. Status code: %s", measurement_id, request.status_code)
        else:
            logger.info("Rerun-elpp command submitted successfully for id {}.".format(measurement_id))

        # NOTE(review): monitoring starts even if the rerun request failed - confirm this is intended.
        if monitor:
            self.monitor_processing(measurement_id)
victor@7 388
def rerun_all(self, measurement_id, monitor=True):
    """ Ask the SCC to rerun all processing steps of an existing measurement.

    Nothing is done if the measurement cannot be retrieved.

    Parameters
    ----------
    measurement_id : str
       Id of the measurement to rerun.
    monitor : bool
       If True, the processing is monitored (see monitor_processing) after the rerun request.
    """
    logger.debug("Started rerun_all procedure.")

    logger.debug("Getting measurement %s", measurement_id)
    measurement, status = self.get_measurement(measurement_id)

    if measurement:
        logger.debug("Attempting to rerun all processing through %s.", measurement.rerun_all_url)

        request = self.session.get(measurement.rerun_all_url, stream=True)

        if request.status_code != 200:
            # The message names the action that failed (rerun-all, not only the pre-processing).
            logger.error("Could not rerun all processing for %s. Status code: %s",
                         measurement_id, request.status_code)
        else:
            logger.info("Rerun-all command submitted successfully for id {}.".format(measurement_id))

        # NOTE(review): monitoring starts even if the rerun request failed - confirm this is intended.
        if monitor:
            self.monitor_processing(measurement_id)
victor@7 408
def process(self, filename, system_id, monitor, force_upload, delete_related, delay=0, rs_filename=None,
            lr_filename=None, ov_filename=None):
    """ Upload a file for processing and, optionally, wait for the processing to finish.

    The arguments are forwarded to upload_file. Monitoring is only started when ``monitor`` is true,
    no delay was requested and the upload returned a measurement id.

    Returns
    -------
    The result of monitor_processing when monitoring was started, otherwise None.
    """
    logger.info("--- Processing started on %s. ---" % datetime.datetime.now())

    logger.info("Uploading file.")
    upload_options = dict(delay=delay,
                          rs_filename=rs_filename,
                          lr_filename=lr_filename,
                          ov_filename=ov_filename)
    measurement_id = self.upload_file(filename, system_id, force_upload, delete_related, **upload_options)

    if not monitor:
        return None

    if delay > 0:
        # A delayed measurement is not processed right away, so there is nothing to monitor yet.
        logger.warning("Will not start monitoring, since a delay was specified: {} hours.".format(delay))
        return None

    if not measurement_id:
        return None

    logger.info("Monitoring processing.")
    return self.monitor_processing(measurement_id)
victor@7 432
def monitor_processing(self, measurement_id, retry_max=2, time_sleep=2, exit_if_missing=True):
    """ Monitor the processing progress of a measurement id and download its products when finished.

    Parameters
    ----------
    measurement_id : str
       Id of the measurement to monitor.
    retry_max : int
       Number of extra attempts made to find the measurement on the SCC. The same limit is used for
       consecutive failed status refreshes while polling.
    time_sleep : int
       Seconds to wait between the attempts to find the measurement.
    exit_if_missing : bool
       If True, the program exits with status 1 when the measurement cannot be found. If False, None is
       returned instead.

    Returns
    -------
    Measurement or None
       The last retrieved measurement object, or None if it could not be found.
    """
    attempts_count = 0
    max_attempts = retry_max + 1

    # Wait for the measurement to appear in the API. A user has reported that this does not happen immediately.
    measurement = None
    logger.info("Looking for measurement %s on the SCC.", measurement_id)

    while attempts_count < max_attempts:
        attempts_count += 1
        measurement, status = self.get_measurement(measurement_id)
        if status == 200:
            break

        logger.warning("Measurement not found.")
        if attempts_count < max_attempts:
            logger.warning("Waiting %ds.", time_sleep)
            time.sleep(time_sleep)

    # Diagnostic output goes through the logger and not to stdout.
    logger.debug("Measurement: %s", measurement)

    if measurement is None:
        logger.error("Measurement %s doesn't seem to exist.", measurement_id)
        if exit_if_missing:
            sys.exit(1)
        else:
            return measurement

    logger.info('Measurement %s found.', measurement_id)

    failed_refreshes = 0
    while not measurement.has_finished:
        measurement.log_processing_status()
        time.sleep(10)
        refreshed, status = self.get_measurement(measurement_id)

        if refreshed is None:
            # get_measurement returns None for any failed request. Keep the last known state and
            # retry, but give up after max_attempts consecutive failures.
            failed_refreshes += 1
            logger.warning("Could not refresh the status of measurement %s. Status code: %s",
                           measurement_id, status)
            if failed_refreshes >= max_attempts:
                logger.error("Measurement %s doesn't seem to exist.", measurement_id)
                if exit_if_missing:
                    sys.exit(1)
                return None
        else:
            failed_refreshes = 0
            measurement = refreshed

    logger.info("Measurement processing finished.")
    measurement.log_detailed_status()

    # NOTE(review): 127 presumably is the status code of a successfully finished module - confirm.
    if measurement.hirelpp == 127:
        logger.info("Downloading HiRElPP files.")
        self.download_hirelpp(measurement_id)
    if measurement.cloudmask == 127:
        logger.info("Downloading cloud screening files.")
        self.download_cloudmask(measurement_id)
    if measurement.elpp == 127:
        logger.info("Downloading ElPP files.")
        self.download_elpp(measurement_id)
    if measurement.elda == 127:
        logger.info("Downloading ELDA files.")
        self.download_elda(measurement_id)
        logger.info("Downloading ELDA plots.")
        self.download_plots(measurement_id)
    if measurement.elic == 127:
        logger.info("Downloading ELIC files.")
        self.download_elic(measurement_id)
    # NOTE(review): ELDEC is checked against 0 while the other modules are checked against 127 - confirm.
    if measurement.is_calibration and measurement.eldec == 0:
        logger.info("Downloading ELDEC files.")
        self.download_eldec(measurement_id)
    logger.info("--- Processing finished. ---")

    return measurement
victor@7 495
def download_products(self, measurement, dir_name):
    """ Download all the products of a measurement (used only for E-SHAPE).

    The products are written below ``<output_dir>/<dir_name>``. The output directory of the instance is
    changed only for the duration of the call and is always restored afterwards.

    Parameters
    ----------
    measurement : Measurement
       The measurement whose products are downloaded. Its status attributes select the products.
    dir_name : str
       Name of the directory, relative to the output directory, to download the products to.

    Returns
    -------
    Measurement
       The measurement object that was passed in.
    """
    measurement_id = measurement.id
    base_output_dir = self.output_dir
    # Join the paths properly, so that it also works if output_dir has no trailing separator.
    self.output_dir = os.path.join(base_output_dir, dir_name)

    try:
        # NOTE(review): 127 presumably is the status code of a successfully finished module - confirm.
        if measurement.hirelpp == 127:
            logger.info("Downloading HiRElPP files.")
            self.download_hirelpp(measurement_id)
        if measurement.cloudmask == 127:
            logger.info("Downloading cloud screening files.")
            self.download_cloudmask(measurement_id)
        if measurement.elpp == 127:
            logger.info("Downloading ElPP files.")
            self.download_elpp(measurement_id)
        if measurement.elda == 127:
            logger.info("Downloading ELDA files.")
            self.download_elda(measurement_id)
            logger.info("Downloading ELDA plots.")
            self.download_plots(measurement_id)
        if measurement.elic == 127:
            logger.info("Downloading ELIC files.")
            self.download_elic(measurement_id)
        # NOTE(review): ELDEC is checked against 0 while the other modules are checked against 127 - confirm.
        if measurement.is_calibration and measurement.eldec == 0:
            logger.info("Downloading ELDEC files.")
            self.download_eldec(measurement_id)
        logger.info("--- Processing finished. ---")
    finally:
        # Restore the original output directory even if something above raised.
        self.output_dir = base_output_dir

    return measurement
claudio@68 526
def get_measurement(self, measurement_id):
    """ Get a measurement information from the SCC API.

    Parameters
    ----------
    measurement_id : str
       The measurement ID to search.

    Returns
    -------
    measurement : Measurement object or None
       A Measurement object if the API returned data for the measurement, otherwise None.
    status_code : int or None
       The HTTP status code of the API response. None if no request was made because measurement_id
       was None.
    """
    # TODO: Consider to homogenize with get_ancillary method (i.e. always return a Measurement object).

    if measurement_id is None:  # TODO: Is this still required?
        # Always return a pair: every caller unpacks the result as (measurement, status).
        return None, None

    # Access the API
    measurement_url = self.api_measurement_pattern.format(measurement_id)
    logger.debug("Measurement API URL: %s", measurement_url)

    response = self.session.get(measurement_url)

    response_dict = None

    if response.status_code == 200:
        response_dict = response.json()
    elif response.status_code == 404:
        logger.info("No measurement with id %s found on the SCC.", measurement_id)
    else:
        logger.error('Could not access API. Status code %s.', response.status_code)

    # TODO: Implement better handling for status 401.

    measurement = Measurement(self.base_url, response_dict) if response_dict else None

    return measurement, response.status_code
victor@7 568
def delete_measurement(self, measurement_id, delete_related):
    """ Delete the measurement with the given id from the SCC.

    The deletion goes through the delete page of the admin web interface and NOT through the API, so the
    user should have the appropriate permissions (i.e. access to the admin site).

    Parameters
    ----------
    measurement_id : str
       Id of the measurement to delete.
    delete_related : bool
       Selects the 'delete_related' or the 'not_delete_related' option of the confirmation form.

    Returns
    -------
    True if the deletion request succeeded, None otherwise.
    """
    measurement, _ = self.get_measurement(measurement_id)

    if measurement is None:
        logger.warning("Nothing to delete.")
        return None

    # Open the page that asks to confirm the deletion; its csrftoken cookie is needed for the POST.
    delete_url = self.delete_measurement_pattern.format(measurement_id)
    confirm_page = self.session.get(delete_url)

    if confirm_page.status_code != 200:
        logger.warning("Could not open delete page. Status: {0}".format(confirm_page.status_code))
        return None

    delete_related_option = 'delete_related' if delete_related else 'not_delete_related'

    form_fields = {'post': 'yes',
                   'select_delete_related_measurements': delete_related_option}
    request_headers = {'X-CSRFToken': confirm_page.cookies['csrftoken'],
                       'referer': delete_url}

    # Confirm the deletion
    delete_page = self.session.post(delete_url, data=form_fields, headers=request_headers)

    if delete_page.ok:
        logger.info("Deleted measurement {0}".format(measurement_id))
        return True

    logger.warning("Something went wrong. Delete page status: {0}".format(
        delete_page.status_code))
    return None
victor@7 614
def available_measurements(self, start_gte=None, stop_lte=None):
    """ Get the list of measurements available on the SCC as Measurement objects.

    The method is currently not used, could be merged with list_measurements.

    Parameters
    ----------
    start_gte, stop_lte
       Optional values for the 'start__gte' and 'stop__lte' query parameters. Filters that are None
       are not sent.

    Returns
    -------
    list of Measurement or None
       None if the API response is empty.
    """
    optional_filters = (('start__gte', start_gte),
                        ('stop__lte', stop_lte))
    params = {key: value for key, value in optional_filters if value is not None}

    response_dict = self.session.get(self.api_measurements_url, params=params).json()

    if not response_dict:
        logger.warning("No response received from the SCC when asked for available measurements.")
        return None

    measurements = [Measurement(self.base_url, entry) for entry in response_dict['objects']]
    logger.info("Found %s measurements on the SCC." % len(measurements))

    return measurements
victor@7 639
def list_measurements(self, id_exact=None, id_startswith=None,
                      start_exact=None, start_gte=None, start_lte=None,
                      stop_exact=None, stop_gte=None, stop_lte=None,
                      station_exact=None, station_in=None):
    """ Query the measurements API and return the raw response text.

    Only the filters that are not None are sent. Within each group an exact filter wins: id_exact
    over id_startswith, start_exact over start_gte/start_lte, stop_exact over stop_gte/stop_lte and
    station_exact over station_in.

    Returns
    -------
    str
       The text of the API response.
    """
    # TODO: Add some error handling, e.g. as per available_measurements method

    candidates = []

    if id_exact is not None:
        candidates.append(('id__exact', id_exact))
    else:
        candidates.append(('id__startswith', id_startswith))

    if start_exact is not None:
        candidates.append(('start__exact', start_exact))
    else:
        candidates.append(('start__gte', start_gte))
        candidates.append(('start__lte', start_lte))

    if stop_exact is not None:
        candidates.append(('stop__exact', stop_exact))
    else:
        candidates.append(('stop__gte', stop_gte))
        candidates.append(('stop__lte', stop_lte))

    if station_exact is not None:
        candidates.append(('station__exact', station_exact))
    else:
        candidates.append(('station__in', station_in))

    # Filters that were not specified are left out of the query.
    params = {key: value for key, value in candidates if value is not None}

    response = self.session.get(self.api_measurements_url, params=params)
    return response.text
moritz@29 680
def measurement_id_for_date(self, t1, call_sign, base_number=0):
    """ Return the first measurement id that is still free on the SCC for the given date.

    Ids are built as ``<YYYYMMDD><call_sign><NN>``; the search starts at ``base_number`` and
    counts upwards until an id is found that is not in the list returned by the API.

    Returns None if the API response is empty. Raises ValueError if the API returns exactly
    100 measurements for the date / call sign combination.
    """
    # TODO: Check if this method needs updating to handle all measurement_ID formats.
    id_prefix = "%s%s" % (t1.strftime('%Y%m%d'), call_sign)
    query = 'measurements/?id__startswith=%s' % id_prefix

    payload = self.session.get(urlparse.urljoin(self.api_base_url, query)).json()
    if not payload:
        return None

    entries = payload['objects']
    if len(entries) == 100:
        raise ValueError('No available measurement id found.')

    taken_ids = [entry['id'] for entry in entries]

    number = base_number
    while True:
        candidate = "%s%02i" % (id_prefix, number)
        if candidate not in taken_ids:
            return candidate
        number = number + 1
victor@7 712
def get_ancillary(self, file_path, file_type):
    """
    Look up an ancillary file on the SCC API, searching by file name.

    Parameters
    ----------
    file_path : str
       Path of the uploaded file. Only its base name is used in the search.
    file_type : str
       Type of ancillary file. One of 'sounding', 'overlap', 'lidarratio'.

    Returns
    -------
    ancillary_file : AncillaryFile or None
       The api object built from the first search result. If the search returns nothing, an
       empty object is returned (its .exists property is False). None if the API request failed.
    status_code : int
       HTTP status code of the API response.
    """
    assert file_type in ['sounding', 'overlap', 'lidarratio']

    filename = os.path.basename(file_path)

    # Anything that is neither 'sounding' nor 'overlap' uses the lidar ratio search pattern.
    pattern_attribute = {
        'sounding': 'api_sounding_search_pattern',
        'overlap': 'api_overlap_search_pattern',
    }.get(file_type, 'api_lidarratio_search_pattern')
    search_url = getattr(self, pattern_attribute).format(filename)

    response = self.session.get(search_url)

    if not response.ok:
        logger.error('Could not access API. Status code %s.' % response.status_code)
        return None, response.status_code

    matches = response.json()['objects']
    logger.debug("Ancillary file JSON: {0}".format(matches))

    # Assume only one file is returned; no match gives an empty api object.
    first_match = matches[0] if matches else None
    return AncillaryFile(self.api_base_url, first_match), response.status_code
i@38 758
def __enter__(self):
    """ Enter the ``with`` block; the object bound by ``as`` is this same instance. """
    return self
victor@7 761
def __exit__(self, *args):
    """ Close the session when leaving the ``with`` block.

    The exception details received in ``args`` are ignored and nothing is returned, so an
    exception raised inside the block still propagates after the session is closed.
    """
    logger.debug("Closing SCC connection session.")
    self.session.close()
ioannis@43 765
class PageNotAccessibleError(RuntimeError):
    """ Error type for pages that cannot be accessed.

    NOTE(review): the raising code is outside this part of the file; presumably used when an
    SCC web page cannot be reached -- confirm against the callers.
    """
ioannis@43 768
victor@7 769
class ApiObject(object):
    """ Generic wrapper that exposes the fields of an API response as object attributes.

    Parameters
    ----------
    base_url : str
       URL stored on the object as ``base_url``.
    dict_response : dict or None
       Dictionary returned by the API. Every key/value pair becomes an attribute. If it is empty
       or None, no attributes are added and ``exists`` is set to False.
    """

    def __init__(self, base_url, dict_response):
        self.base_url = base_url

        if not dict_response:
            self.exists = False
            return

        # Add the dictionary key value pairs as object properties
        for key, value in dict_response.items():
            try:
                setattr(self, key, value)
            except Exception:
                # Best effort: e.g. a key that clashes with a read-only property of a subclass.
                # Catching Exception (not a bare except) lets KeyboardInterrupt/SystemExit through.
                logger.warning('Could not set attribute {0} to value {1}'.format(key, value))

        # Set last, so a response key named 'exists' cannot override it.
        self.exists = True
victor@7 787
victor@7 788
class Measurement(ApiObject):
    """ This class represents the measurement object as returned in the SCC API.

    All expected attributes are initialised to None and then overwritten with the values found
    in the API response (see ApiObject).
    """

    def __init__(self, base_url, dict_response):

        # Define expected attributes to assist debugging

        # Status and exit code of each processing module
        self.hirelpp = None
        self.hirelpp_exit_code = None
        self.cloudmask = None
        self.cloudmask_exit_code = None
        self.elpp = None
        self.elpp_exit_code = None
        self.elda = None
        self.elda_exit_code = None
        self.elic = None
        self.elic_exit_code = None
        self.eldec = None
        self.eldec_exit_code = None
        self.elquick = None
        self.elquick_exit_code = None

        self.id = None
        self.num_id = None
        self.is_calibration = None
        self.is_running = None
        self.is_queued = None

        self.resource_uri = None
        self.start = None
        self.stop = None
        self.system = None
        self.station = None
        self.upload = None

        super().__init__(base_url, dict_response)

    @property
    def has_finished(self):
        """ Temporary implementation for SCC version 5.2.0, until the API returns a flag indicating if the
        processing measurement has finished.

        True when the measurement is not running and either the HiRElPP or the ElPP status
        differs from 0.
        """
        return (self.is_running is False) and (self.hirelpp != 0 or self.elpp != 0)

    def log_processing_status(self):
        """ Log module status. """
        # Order: upload, hirelpp, cloudmask, elpp, elda, elic, elquick.
        logger.info("Measurement is being processed. Status: ({}, {}, {}, {}, {}, {}, {}). Please wait.".format(
            self.upload,
            self.hirelpp,
            self.cloudmask,
            self.elpp,
            self.elda,
            self.elic,
            self.elquick))

    def log_detailed_status(self):
        """ Log module exit and status codes.

        Calibration measurements report ElPP and ElDEC; all other measurements report
        HiRElPP, CloudScreen, ElPP, ELDA, ELIC and ELQuick.
        """
        # The original message had no placeholder, so the measurement id was silently dropped.
        logger.info("Measurement {} exit status:".format(self.id))

        if self.is_calibration:
            modules = [
                ('ElPP', self.elpp, self.elpp_exit_code),
                ('ElDEC', self.eldec, self.eldec_exit_code),
            ]
        else:
            modules = [
                ('HiRElPP', self.hirelpp, self.hirelpp_exit_code),
                ('CloudScreen', self.cloudmask, self.cloudmask_exit_code),
                ('ElPP', self.elpp, self.elpp_exit_code),
                ('ELDA', self.elda, self.elda_exit_code),
                ('ELIC', self.elic, self.elic_exit_code),
                ('ELQuick', self.elquick, self.elquick_exit_code),
            ]

        for name, status, exit_code in modules:
            self._log_module_status(name, status, exit_code)

    def _log_module_status(self, name, status, exit_code):
        """ Log the exit code of one module; positive exit codes are logged as warnings.

        ``exit_code`` is either empty/None or a mapping with 'exit_code' and 'description' keys.
        ``status`` is accepted for symmetry with the callers but does not appear in the message.
        """
        if not exit_code:
            logger.info("{0} exit code: {2}".format(name, status, exit_code))
            return

        if exit_code['exit_code'] > 0:
            log = logger.warning
        else:
            log = logger.info
        log("{0} exit code: {2[exit_code]} - {2[description]}".format(name, status, exit_code))

    def _rerun_url(self, action):
        """ Build the URL of the 'rerun-<action>' page of this measurement. """
        url_pattern = urlparse.urljoin(self.base_url,
                                       'data_processing/measurements/{0}/rerun-%s/' % action)
        return url_pattern.format(self.id)

    @property
    def rerun_elda_url(self):
        """ URL of the page that reruns ELDA for this measurement. """
        return self._rerun_url('elda')

    @property
    def rerun_elpp_url(self):
        """ URL of the page that reruns ElPP for this measurement. """
        return self._rerun_url('elpp')

    @property
    def rerun_all_url(self):
        """ URL of the page that reruns all processing for this measurement. """
        return self._rerun_url('all')

    def __str__(self):
        return "Measurement {}".format(self.id)
victor@7 887
victor@7 888
class AncillaryFile(ApiObject):
    """ This class represents the ancillary file object as returned in the SCC API.
    """

    @property
    def already_on_scc(self):
        """ True if the API knows the file and its status is anything other than 'missing'. """
        return self.exists is not False and self.status != 'missing'

    def __str__(self):
        # NOTE(review): id, filename and status are only set from the API response, so this
        # presumably fails for an empty object (exists == False) -- confirm before relying on it.
        fields = (self.id, self.filename, self.status)
        return "%s: %s, %s" % fields
i@38 904
i@38 905
ioannis@67 906 # Methods that use the SCC class to perform specific tasks.
def process_file(filename, system_id, settings, force_upload, delete_related,
                 delay=0, monitor=True, rs_filename=None, lr_filename=None, ov_filename=None):
    """ Shortcut function to process a file to the SCC.

    Opens a connection, logs in, hands the file and all options to ``SCC.process`` and logs out.
    Returns whatever ``SCC.process`` returns.
    """
    message = "Processing file %s, using system %s" % (filename, system_id)
    logger.info(message)

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
        scc.login(settings['website_credentials'])

        processing_options = dict(
            force_upload=force_upload,
            delete_related=delete_related,
            delay=delay,
            monitor=monitor,
            rs_filename=rs_filename,
            lr_filename=lr_filename,
            ov_filename=ov_filename,
        )
        measurement = scc.process(filename, system_id, **processing_options)

        scc.logout()

    return measurement
victor@7 924
victor@7 925
def delete_measurements(measurement_ids, delete_related, settings):
    """ Shortcut function to delete measurements from the SCC.

    Logs in once and deletes the given measurement ids one after the other.
    """
    connection = SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url'])
    with connection as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Deleting %s." % measurement_id)
            scc.delete_measurement(measurement_id, delete_related)

        scc.logout()
moritz@29 934
moritz@29 935
def rerun_all(measurement_ids, monitor, settings):
    """ Shortcut function to rerun all products of the given measurements on the SCC.

    ``monitor`` is passed on unchanged to ``SCC.rerun_all`` for every measurement id.
    """
    connection = SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url'])
    with connection as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Rerunning all products for %s." % measurement_id)
            scc.rerun_all(measurement_id, monitor)

        scc.logout()
victor@7 945
victor@7 946
def rerun_processing(measurement_ids, monitor, settings):
    """ Shortcut function to rerun the ElPP processing of the given measurements on the SCC.

    ``monitor`` is passed on unchanged to ``SCC.rerun_elpp`` for every measurement id.
    """
    connection = SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url'])
    with connection as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Rerunning (optical) processing for %s" % measurement_id)
            scc.rerun_elpp(measurement_id, monitor)

        scc.logout()
moritz@29 956
moritz@29 957
def list_measurements(settings, id_exact=None, id_startswith=None,
                      start_exact=None, start_gte=None, start_lte=None,
                      stop_exact=None, stop_gte=None, stop_lte=None,
                      station_exact=None, station_in=None):
    """ Print the measurements registered on the SCC that match the given filters.

    All filters are forwarded unchanged to ``SCC.list_measurements``; the text it returns is
    printed to standard output.
    """
    filters = dict(
        id_exact=id_exact, id_startswith=id_startswith,
        start_exact=start_exact, start_gte=start_gte, start_lte=start_lte,
        stop_exact=stop_exact, stop_gte=stop_gte, stop_lte=stop_lte,
        station_exact=station_exact, station_in=station_in,
    )

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
        scc.login(settings['website_credentials'])
        print(scc.list_measurements(**filters))
        scc.logout()
victor@7 973
victor@7 974
def download_measurements(measurement_ids, max_retries, exit_if_missing, settings):
    """ Run ``SCC.monitor_processing`` for each of the specified measurement IDs.

    ``max_retries`` and ``exit_if_missing`` are forwarded as ``retry_max`` and
    ``exit_if_missing``; the sleep time between checks is fixed to 3.
    """
    monitor_options = dict(retry_max=max_retries, time_sleep=3, exit_if_missing=exit_if_missing)

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            scc.monitor_processing(measurement_id, **monitor_options)

        scc.logout()
i@14 983
i@14 984
def eshape_downloader(settings):
    """ Download the products of recent measurements into the E-SHAPE folders.

    The sub-folders of ``settings['output_dir']`` whose names look like
    ``<6 digits>_<12 digits>`` are inspected. The 12 digits are read as the start time
    (``YYYYmmddHHMM``). For every folder whose start time is at most three days old, the
    measurements between that start time and now are requested from the SCC and each one is
    handed to ``SCC.download_products`` together with the folder name.

    Parameters
    ----------
    settings : dict
       Settings with the keys 'output_dir', 'basic_credentials', 'base_url' and
       'website_credentials'.
    """
    time_format = "%Y-%m-%dT%H:%M:%S"
    eshape_dir = settings['output_dir']

    # Raw string: '\d' inside a normal string literal is an invalid escape sequence.
    folders_pattern = re.compile(r"^(\d{6}_{1}\d{12})+$")
    all_directories = [f.name for f in os.scandir(eshape_dir) if f.is_dir()]
    directories = [dir_name for dir_name in all_directories if folders_pattern.match(dir_name)]

    # Folders that started before this moment are considered too old and are skipped.
    oldest_start = datetime.datetime.now() - datetime.timedelta(days=3)

    for dir_name in directories:
        start_string = dir_name.split("_")[1]
        date_time_start = datetime.datetime.strptime(start_string, '%Y%m%d%H%M')
        if date_time_start < oldest_start:
            continue

        start_parameter = date_time_start.strftime(time_format)
        stop_parameter = datetime.datetime.now().strftime(time_format)

        # NOTE(review): one login per folder is kept from the original; a single shared session
        # looks possible but depends on SCC.download_products not keeping per-folder state.
        with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
            scc.login(settings['website_credentials'])

            measurements = scc.available_measurements(start_gte=start_parameter, stop_lte=stop_parameter)
            # available_measurements returns None when the API gave an empty response.
            for meas in measurements or []:
                scc.download_products(meas, dir_name)

            scc.logout()
claudio@68 1008
claudio@68 1009
def settings_from_path(config_file_path):
    """ Read the configuration file and return its content as a dictionary.

    The file should be in YAML syntax. Any problem locating or parsing the file is reported as
    an ``argparse.ArgumentTypeError``, so the function can be used as an argparse ``type``.
    """
    file_found = os.path.isfile(config_file_path)
    if not file_found:
        raise argparse.ArgumentTypeError("Wrong path for configuration file (%s)" % config_file_path)

    with open(config_file_path) as yaml_file:
        try:
            settings = yaml.safe_load(yaml_file)
            logger.debug("Read settings file(%s)" % config_file_path)
        except Exception:
            raise argparse.ArgumentTypeError("Could not parse YAML file (%s)" % config_file_path)

    # YAML limitation: does not read tuples
    for credentials_key in ('basic_credentials', 'website_credentials'):
        settings[credentials_key] = tuple(settings[credentials_key])

    return settings
i@14 1029
i@14 1030
moritz@29 1031 # Setup for command specific parsers
def setup_delete(parser):
    """ Configure the parser of the 'delete' command.

    Adds the measurement ids argument and registers the function that performs the deletion
    as the parser's ``execute`` default.
    """
    parser.add_argument("IDs", nargs="+", help="measurement IDs to delete.")

    def delete_from_args(parsed):
        # Related measurements are never deleted from the command line.
        delete_measurements(parsed.IDs, delete_related=False, settings=parsed.config)

    parser.set_defaults(execute=delete_from_args)
moritz@29 1040
moritz@29 1041
def setup_rerun_all(parser):
    """ Configure the parser of the 'rerun-all' command.

    Adds the measurement ids and the -p/--process flag, and registers the function that
    triggers the rerun as the parser's ``execute`` default.
    """
    parser.add_argument("IDs", nargs="+", help="Measurement IDs to rerun.")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the results of the processing.")

    def rerun_all_from_args(parsed):
        rerun_all(parsed.IDs, parsed.process, parsed.config)

    parser.set_defaults(execute=rerun_all_from_args)
moritz@29 1050
moritz@29 1051
def setup_rerun_elpp(parser):
    """ Configure the parser of the 'rerun-elpp' command.

    Adds the measurement ids and the -p/--process flag, and registers the function that
    triggers the rerun as the parser's ``execute`` default.
    """
    parser.add_argument("IDs", nargs="+", help="Measurement IDs to rerun the processing on.")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the results of the processing.")

    def rerun_processing_from_args(parsed):
        rerun_processing(parsed.IDs, parsed.process, parsed.config)

    parser.set_defaults(execute=rerun_processing_from_args)
moritz@29 1060
moritz@29 1061
def setup_upload_file(parser):
    """ Configure the parser of the 'upload-file' command.

    Adds the file / system arguments and the upload options, and registers the function that
    submits the file as the parser's ``execute`` default. Processing is only monitored when
    -p/--process is given.
    """

    def delay(arg):
        """ Convert the --delay value to an integer and check it lies between 0 and 96. """
        try:
            hours = int(arg)
        except ValueError:
            raise argparse.ArgumentTypeError("Could not convert delay argument {} to integer.".format(arg))

        if not 0 <= hours <= 96:
            raise argparse.ArgumentTypeError("Delay should be an integer between 0 and 96.")
        return hours

    def upload_file_from_args(parsed):
        options = dict(
            delay=parsed.delay,
            monitor=parsed.process,
            force_upload=parsed.force_upload,
            delete_related=False,  # For now, use this as default
            rs_filename=parsed.radiosounding,
            ov_filename=parsed.overlap,
            lr_filename=parsed.lidarratio,
        )
        process_file(parsed.filename, parsed.system, parsed.config, **options)

    parser.add_argument("filename", help="Measurement file name or path.")
    parser.add_argument("system", help="Processing system id.")
    parser.add_argument("--delay", default=0, type=delay,
                        help="Delay processing by the specified number of hours (0 to 96).")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the processing results.")
    parser.add_argument("--force_upload", action="store_true",
                        help="If measurement ID exists on SCC, delete before uploading.")

    # Optional ancillary files
    parser.add_argument("--radiosounding", default=None, help="Radiosounding file name or path")
    parser.add_argument("--overlap", default=None, help="Overlap file name or path")
    parser.add_argument("--lidarratio", default=None, help="Lidar ratio file name or path")

    parser.set_defaults(execute=upload_file_from_args)
moritz@29 1099
moritz@29 1100
def setup_list_measurements(parser):
    """ Configure the parser of the 'list' command.

    Adds the id, start, stop and station filters and registers the function that prints the
    matching measurements as the parser's ``execute`` default. The two id filters are mutually
    exclusive, and so are the two station filters.
    """

    def list_measurements_from_args(parsed):
        list_measurements(parsed.config, id_exact=parsed.id_exact, id_startswith=parsed.id_startswith,
                          start_exact=parsed.start_exact, start_gte=parsed.start_gte, start_lte=parsed.start_lte,
                          stop_exact=parsed.stop_exact, stop_gte=parsed.stop_gte, stop_lte=parsed.stop_lte,
                          station_exact=parsed.station_exact, station_in=parsed.station_in)

    # Mutually exclusive groups may live inside an argument group, but argument groups must be
    # created on the parser itself: nesting them is deprecated in argparse and was never supported.
    group = parser.add_argument_group()

    group_id = group.add_mutually_exclusive_group()
    group_id.add_argument("--id_exact", help="Exact measurement id.")
    group_id.add_argument("--id_startswith", help="Initial part of measurement id.")

    group_start = parser.add_argument_group()
    group_start.add_argument("--start_exact", help="Exact start date of the measurement.")
    group_start.add_argument("--start_gte", help="Start date of the measurement after the given date.")
    group_start.add_argument("--start_lte", help="Start date of the measurement before the given date.")

    group_stop = parser.add_argument_group()
    group_stop.add_argument("--stop_exact", help="Exact stop date of the measurement.")
    group_stop.add_argument("--stop_gte", help="Stop date of the measurement after the given date.")
    group_stop.add_argument("--stop_lte", help="Stop date of the measurement before the given date.")

    group_station = group.add_mutually_exclusive_group()
    group_station.add_argument("--station_exact", help="Station the performed the measurement.")
    group_station.add_argument("--station_in", help="List of stations (separated by comma) that performed the measurement.")

    parser.set_defaults(execute=list_measurements_from_args)
moritz@29 1129
moritz@29 1130
def setup_download_measurements(parser):
    """ Configure the parser of the 'download' command.

    Adds the measurement ids and the retry / error handling options, and registers the
    function that starts the download as the parser's ``execute`` default.
    """
    parser.add_argument("IDs", nargs="+", help="Measurement IDs that should be downloaded.")
    parser.add_argument("--max_retries", type=int, default=0,
                        help="Number of times to retry in cases of missing measurement id.")
    # store_false: parsed.ignore_errors is True by default and becomes False when the flag is
    # given. The value is therefore used directly as "exit_if_missing" below.
    parser.add_argument("--ignore_errors", action="store_false",
                        help="Ignore errors when downloading multiple measurements.")

    def download_measurements_from_args(parsed):
        download_measurements(parsed.IDs, parsed.max_retries, parsed.ignore_errors, parsed.config)

    parser.set_defaults(execute=download_measurements_from_args)
moritz@29 1141
moritz@29 1142
def setup_eshape_downloader(parser):
    """ Configure the parser of the 'eshape-downloader' command.

    The command takes no arguments of its own; only the function that starts the download is
    registered as the parser's ``execute`` default.
    """
    parser.set_defaults(execute=lambda parsed: eshape_downloader(parsed.config))
claudio@68 1148
claudio@68 1149
def main():
    """ Command line entry point.

    Builds the argument parser with one sub-command per task, reads the configuration file,
    sets up logging and runs the function registered by the selected sub-command. Exits with a
    usage error if no sub-command is given.
    """
    # Define the command line arguments.
    parser = argparse.ArgumentParser()
    subparsers = parser.add_subparsers()

    # Each entry: command name, help text, function that configures the command's parser.
    commands = (
        ("delete", "Deletes a measurement.", setup_delete),
        ("rerun-all", "Rerun all processing steps for the provided measurement IDs.", setup_rerun_all),
        ("rerun-elpp", "Rerun low-resolution processing steps for the provided measurement ID.",
         setup_rerun_elpp),
        ("upload-file", "Submit a file and, optionally, download the output products.", setup_upload_file),
        ("list", "List measurements registered on the SCC.", setup_list_measurements),
        ("download", "Download selected measurements.", setup_download_measurements),
        ("eshape-downloader", "Search and download relevant products for E-SHAPE.", setup_eshape_downloader),
    )
    for command_name, command_help, setup_command in commands:
        setup_command(subparsers.add_parser(command_name, help=command_help))

    # Verbosity settings from http://stackoverflow.com/a/20663028
    parser.add_argument('-d', '--debug', help="Print debugging information.", action="store_const",
                        dest="loglevel", const=logging.DEBUG, default=logging.INFO,
                        )
    parser.add_argument('-s', '--silent', help="Show only warning and error messages.", action="store_const",
                        dest="loglevel", const=logging.WARNING
                        )

    # Setup default config location
    home = os.path.expanduser("~")
    default_config_location = os.path.abspath(os.path.join(home, ".scc_access.yaml"))
    # The config file is read while parsing: settings_from_path is the argument's type.
    parser.add_argument("-c", "--config", help="Path to the config file.", type=settings_from_path,
                        default=default_config_location)

    args = parser.parse_args()

    # Get the logger with the appropriate level
    logging.basicConfig(format='%(levelname)s: %(message)s', level=args.loglevel)

    # Sub-commands are optional in Python 3's argparse; without one there is no "execute"
    # default, so report a usage error instead of failing with an AttributeError.
    if not hasattr(args, 'execute'):
        parser.error("No command specified.")

    # Dispatch to appropriate function
    args.execute(args)
moritz@29 1196
i@14 1197
moritz@29 1198 # When running through terminal
moritz@29 1199 if __name__ == '__main__':
moritz@29 1200 main()

mercurial