scc_access/scc_access.py

Wed, 28 Sep 2022 11:10:08 +0200

author
Claudio Dema <claudio.dema@imaa.cnr.it>
date
Wed, 28 Sep 2022 11:10:08 +0200
changeset 69
cd8bc07f8419
parent 68
70c869fa3242
child 70
4ef6f2102a61
permissions
-rw-r--r--

Option --cloudfree added to upload-file method to manually set a measurement as cloud free during the upload

ioannis@67 1 """ This is a script that allows interaction with the SCC through the command line.
ioannis@67 2
ioannis@67 3 It is based on the requests module for accessing the server.
ioannis@67 4
ioannis@67 5 Most of the interactions are done through the web interface, i.e. by mimicking user interaction with the
ioannis@67 6 SCC website (i.e. user login, data submission, etc.). In few cases, the SCC API is also used.
ioannis@67 7
ioannis@67 8 Most of the functionality is included in the SCC class. The class is used to login into the SCC website and automate
ioannis@67 9 interaction with the site (i.e. upload a file, get measurement status, etc.).
ioannis@67 10
ioannis@67 11 Two other classes (Measurement, AncillaryFile) are used in some cases to handle the output of the SCC API.
ioannis@67 12
ioannis@67 13 Several shortcut functions are defined to perform specific tasks using the SCC class (e.g. process_file, delete_measurements etc).
ioannis@67 14 """
ioannis@43 15 import sys
ioannis@43 16
victor@7 17 import requests
victor@7 18
ioannis@43 19 try:
ioannis@43 20 import urllib.parse as urlparse # Python 3
ioannis@43 21 except ImportError:
ioannis@17 22 import urlparse # Python 2
ioannis@43 23
victor@7 24 import argparse
madrouin@24 25 import datetime
madrouin@24 26 import logging
victor@7 27 import os
victor@7 28 import re
ioannis@32 29 from io import BytesIO
ioannis@45 30
victor@7 31 import time
i@40 32
victor@7 33 from zipfile import ZipFile
madrouin@24 34
i@14 35 import yaml
victor@7 36
ioannis@43 37 import netCDF4 as netcdf
ioannis@43 38
# Silence urllib3 warnings: the SCC session is created with certificate verification switched off.
requests.packages.urllib3.disable_warnings()
logger = logging.getLogger(__name__)

# The regex to find the measurement id from the measurement page returned after an upload.
# The id is also read directly from the input file, see SCC.measurement_id_from_file.
regex = "<h3>Measurement (?P<measurement_id>.{12,15}) <small>" # {12, 15} to handle both old- and new-style measurement ids.
victor@7 45
victor@7 46
victor@7 47 class SCC:
ioannis@67 48 """A class that will attempt to interact SCC server.
i@14 49
ioannis@67 50 Most interactions are by simulating a normal browser session. In the current
ioannis@67 51 version few checks are performed before upload a file, and no feedback is given in case the upload
ioannis@67 52 fails.
victor@7 53 """
victor@7 54
def __init__(self, auth, output_dir, base_url):
    """ Store the connection settings and pre-compute every SCC URL used later.

    Parameters
    ----------
    auth : object
        Value assigned to the ``auth`` attribute of the requests session
        (presumably a (username, password) tuple for HTTP authentication - confirm against callers).
    output_dir : str
        Base directory under which downloaded files are stored.
    base_url : str
        Base URL of the SCC web site. All other URLs are joined onto it.
    """
    self.auth, self.output_dir, self.base_url = auth, output_dir, base_url

    # One session is shared by all requests; certificate verification is disabled.
    session = requests.Session()
    session.auth = auth
    session.verify = False
    self.session = session

    def site(path):
        # URL of a page of the web interface
        return urlparse.urljoin(base_url, path)

    # Account and listing pages
    self.login_url = site('accounts/login/')
    self.logout_url = site('accounts/logout/')
    self.list_measurements_url = site('data_processing/measurements/')
    self.upload_url = site('data_processing/measurements/quick/')

    # Per-measurement pages; '{0}' is filled with the measurement id when used.
    measurement_path = 'data_processing/measurements/{0}/'
    self.measurement_page_pattern = site(measurement_path)
    self.download_hirelpp_pattern = site(measurement_path + 'download-hirelpp/')
    self.download_cloudmask_pattern = site(measurement_path + 'download-cloudmask/')
    self.download_elpp_pattern = site(measurement_path + 'download-preprocessed/')
    self.download_elda_pattern = site(measurement_path + 'download-optical/')
    self.download_plots_pattern = site(measurement_path + 'download-plots/')
    self.download_elic_pattern = site(measurement_path + 'download-elic/')
    self.delete_measurement_pattern = site('admin/database/measurements/{0}/delete/')

    # API endpoints, all relative to the API root
    api_root = site('api/v1/')

    def api(path):
        return urlparse.urljoin(api_root, path)

    self.api_base_url = api_root
    self.api_measurement_pattern = api('measurements/{0}/')
    self.api_measurements_url = api('measurements')
    self.api_sounding_search_pattern = api('sounding_files/?filename={0}')
    self.api_lidarratio_search_pattern = api('lidarratio_files/?filename={0}')
    self.api_overlap_search_pattern = api('overlap_files/?filename={0}')
ioannis@43 93
def login(self, credentials):
    """ Login to the SCC through the web login form.

    Parameters
    ----------
    credentials : tuple or list
        A list or tuple in the form (username, password).

    Returns
    -------
    : response object
        The response of the session to the submitted login form.
    """
    logger.debug("Attempting to login to SCC, username %s.", credentials[0])
    form_data = dict(username=credentials[0], password=credentials[1])

    logger.debug("Accessing login page at %s.", self.login_url)

    # The login page is fetched first because its cookie carries the CSRF token.
    login_page = self.session.get(self.login_url)
    if not login_page.ok:
        raise self.PageNotAccessibleError('Could not access login pages. Status code %s' % login_page.status_code)

    logger.debug("Submitting credentials.")
    request_headers = {'X-CSRFToken': login_page.cookies['csrftoken'],
                       'referer': self.login_url}
    return self.session.post(self.login_url, data=form_data, headers=request_headers)
victor@7 121
def logout(self):
    """ Logout from the SCC and return the response of the logout page. """
    logout_response = self.session.get(self.logout_url, stream=True)
    return logout_response
victor@7 125
def upload_file(self, filename, system_id, force_upload, delete_related, delay=0, cloudfree=False,
                rs_filename=None, ov_filename=None, lr_filename=None):
    """ Upload a file for processing.

    If the upload is successful, it returns the measurement id.

    Parameters
    ----------
    filename : str
        File path of the file to upload
    system_id : int
        System id to be used in the processing
    force_upload : bool
        If True, if a measurement with the same ID is found on the server, it will be first deleted and the
        current file will be uploaded. If False, the file will not be uploaded if the measurement ID is
        already present on the SCC server.
    delete_related : bool
        Answer to delete related question when deleting existing measurements from the SCC.
    delay : int
        Value submitted in the 'delay' field of the upload form (reported in hours by the process method).
    cloudfree : bool
        Manually set the measurement as cloud free
    rs_filename, ov_filename, lr_filename : str
        Ancillary files paths to be uploaded (sounding, overlap and lidar ratio file respectively).

    Returns
    -------
    : str or False
        The measurement id if the upload succeeded, False if the connection failed or the file was rejected.
        If the measurement already exists and force_upload is False, the program exits with status 1.
    """
    # Get the measurement ID from the netcdf file
    measurement_id = self.measurement_id_from_file(filename)

    # Handle possible existing measurements with the same ID on the SCC server.
    logger.debug('Checking if a measurement with the same id already exists on the SCC server.')
    existing_measurement, _ = self.get_measurement(measurement_id)

    if existing_measurement:
        if force_upload:
            logger.info(
                "Measurement with id {} already exists on the SCC. Trying to delete it...".format(measurement_id))
            self.delete_measurement(measurement_id, delete_related)
        else:
            logger.error(
                "Measurement with id {} already exists on the SCC. Use --force_upload flag to overwrite it.".format(
                    measurement_id))
            # TODO: Implement handling at the proper place. Exiting here does not allow the SCC class to be
            # used by external programs. Instead an exception should be raised.
            sys.exit(1)

    # Get submit page (its cookie provides the CSRF token)
    upload_page = self.session.get(self.upload_url)

    upload_data = {'system': system_id,
                   'delay': delay,
                   'manually_cloud_free': cloudfree, }

    logger.debug("Submitted processing parameters - System: {}, Delay: {}, Manually Cloud Free: {}".format(
        system_id, delay, cloudfree))

    # (file path, type name used by get_ancillary, label used in log messages, name of the form field)
    ancillary_inputs = (
        (rs_filename, 'sounding', 'sounding', 'sounding_file'),
        (ov_filename, 'overlap', 'overlap', 'overlap_file'),
        (lr_filename, 'lidarratio', 'lidar ratio', 'lidar_ratio_file'),
    )

    # Every opened handle is registered here, so that all of them are closed whatever happens below.
    files = {}
    try:
        files['data'] = open(filename, 'rb')

        # Add ancillary files to be uploaded, skipping those that are already on the server
        for ancillary_path, file_type, label, form_field in ancillary_inputs:
            if ancillary_path is None:
                continue

            ancillary_file, _ = self.get_ancillary(ancillary_path, file_type)

            if ancillary_file.already_on_scc:
                logger.warning(
                    "{0} file {1.filename} already on the SCC with id {1.id}. Ignoring it.".format(
                        label.capitalize(), ancillary_file))
            else:
                logger.debug('Adding %s file %s', label, ancillary_path)
                files[form_field] = open(ancillary_path, 'rb')

        # Upload the files
        logger.info("Uploading of file %s started.", filename)

        upload_submit = self.session.post(self.upload_url,
                                          data=upload_data,
                                          files=files,
                                          headers={'X-CSRFToken': upload_page.cookies['csrftoken'],
                                                   'referer': self.upload_url})
    finally:
        for file_handle in files.values():
            file_handle.close()

    if upload_submit.status_code != 200:
        logger.warning("Connection error. Status code: %s", upload_submit.status_code)
        return False

    # Check if there was a redirect to a new page. If not, something went wrong
    if upload_submit.url == self.upload_url:
        measurement_id = False
        logger.error("Uploaded file(s) rejected! Try to upload manually to see the error.")
    else:
        # Prefer the id shown on the output page; keep the id read from the input file if the page
        # does not have the expected layout (previously this case raised an IndexError).
        id_match = re.search(regex, upload_submit.text)
        if id_match:
            measurement_id = id_match.group('measurement_id')
        else:
            logger.warning("Could not read the measurement id from the response page. "
                           "Using the id %s read from the input file.", measurement_id)

        logger.info("Successfully uploaded measurement with id %s.", measurement_id)
        logger.info("You can monitor the processing progress online: {}".format(
            self.measurement_page_pattern.format(measurement_id)))

    return measurement_id
ioannis@43 240
@staticmethod
def measurement_id_from_file(filename):
    """ Read the measurement id stored in the input netCDF file.

    The program exits with status 1 if the file does not exist or if it has no
    Measurement_ID global attribute.

    Parameters
    ----------
    filename : str
        File path of the input file.

    Returns
    -------
    : str
        The value of the Measurement_ID global attribute.
    """
    file_is_missing = not os.path.isfile(filename)
    if file_is_missing:
        logger.error("File {} does not exist.".format(filename))
        sys.exit(1)

    with netcdf.Dataset(filename) as dataset:
        try:
            found_id = dataset.Measurement_ID
        except AttributeError:
            message = "Input file {} does not contain a Measurement_ID global attribute. Wrong file format?".format(
                filename)
            logger.error(message)
            sys.exit(1)

    return found_id
victor@7 265
def download_files(self, measurement_id, subdir, download_url):
    """ Downloads the zip archive found at download_url and extracts its files to the specified subdir.

    This is a general method used to download preprocessed file, optical
    files by other, file-specific, methods. The files are written directly in
    <output_dir>/<measurement_id>/<subdir>; any folder structure inside the archive is ignored.

    Parameters
    ----------
    measurement_id : str
        Measurement id, used as the name of the directory that receives the files.
    subdir : str
        Name of the sub-directory (inside the measurement directory) where the files are saved.
    download_url : str
        URL of the zip archive to download.

    Raises
    ------
    Exception
        If the server does not answer the download request successfully.
    """
    # TODO: Make downloading more robust (e.g. in case that files do not exist on server).
    request = self.session.get(download_url, stream=True)

    if not request.ok:
        raise Exception("Could not download files for measurement '%s'" % measurement_id)

    # Create the dir if it does not exist
    local_dir = os.path.join(self.output_dir, measurement_id, subdir)
    if not os.path.exists(local_dir):
        os.makedirs(local_dir)

    # Read the archive by chunk, needed if the file is big.
    memory_file = BytesIO()
    for chunk in request.iter_content(chunk_size=1024):
        if chunk:  # filter out keep-alive new chunks
            memory_file.write(chunk)

    with ZipFile(memory_file) as zip_file:
        for zipped_name in zip_file.namelist():
            basename = os.path.basename(zipped_name)

            # Directory entries end with '/' and have no base name; trying to write them as
            # files would fail, so they are skipped.
            if not basename:
                continue

            local_file = os.path.join(local_dir, basename)
            with open(local_file, 'wb') as f:
                f.write(zip_file.read(zipped_name))
victor@7 302
def download_hirelpp(self, measurement_id):
    """ Fetch the HiRElPP files of the measurement id into the 'hirelpp' sub-directory.

    A failed download is logged and not propagated to the caller.
    """
    hirelpp_url = self.download_hirelpp_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'hirelpp', hirelpp_url)
    except Exception as error:
        message = "Could not download HiRElPP files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
ioannis@43 312
def download_cloudmask(self, measurement_id):
    """ Fetch the cloudmask files of the measurement id into the 'cloudscreen' sub-directory.

    A failed download is logged and not propagated to the caller.
    """
    cloudmask_url = self.download_cloudmask_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'cloudscreen', cloudmask_url)
    except Exception as error:
        message = "Could not download cloudscreen files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
ioannis@43 322
def download_elpp(self, measurement_id):
    """ Fetch the preprocessed (ElPP) files of the measurement id into the 'elpp' sub-directory.

    A failed download is logged and not propagated to the caller.
    """
    elpp_url = self.download_elpp_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elpp', elpp_url)
    except Exception as error:
        message = "Could not download ElPP files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
victor@7 332
def download_elda(self, measurement_id):
    """ Fetch the optical (ELDA) files of the measurement id into the 'elda' sub-directory.

    A failed download is logged and not propagated to the caller.
    """
    elda_url = self.download_elda_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elda', elda_url)
    except Exception as error:
        message = "Could not download ELDA files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
victor@7 342
def download_plots(self, measurement_id):
    """ Fetch the profile graphs of the measurement id into the 'elda_plots' sub-directory.

    A failed download is logged and not propagated to the caller.
    """
    plots_url = self.download_plots_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elda_plots', plots_url)
    except Exception as error:
        message = "Could not download ELDA plots. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
victor@7 352
def download_elic(self, measurement_id):
    """ Fetch the ELIC files of the measurement id into the 'elic' sub-directory.

    A failed download is logged and not propagated to the caller.
    """
    elic_url = self.download_elic_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elic', elic_url)
    except Exception as error:
        message = "Could not download ELIC files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
ioannis@43 362
def download_eldec(self, measurement_id):
    """ Download ELDEC files for the measurement id into the 'eldec' sub-directory.

    The files are requested from the ELDA (optical) download URL. A failed download is
    logged and not propagated to the caller.
    """
    # Construct the download url
    download_url = self.download_elda_pattern.format(measurement_id)  # ELDA pattern is used for now
    try:
        self.download_files(measurement_id, 'eldec', download_url)
    except Exception as e:
        # The product name was misspelled ("EDELC") in this message.
        logger.error("Could not download ELDEC files. Error message: {}".format(e))
        logger.debug('Download exception:', exc_info=True)
ioannis@43 372
def rerun_elpp(self, measurement_id, monitor=True):
    """ Ask the SCC to rerun the ElPP processing of an existing measurement.

    Parameters
    ----------
    measurement_id : str
        The id of the measurement to reprocess.
    monitor : bool
        If True, the processing is monitored (see monitor_processing) after the request.
    """
    logger.debug("Started rerun_elpp procedure.")

    logger.debug("Getting measurement %s", measurement_id)
    measurement, status = self.get_measurement(measurement_id)

    if measurement:
        # Log the URL that is actually requested (the rerun-all URL was logged here by mistake).
        logger.debug("Attempting to rerun ElPP through %s.", measurement.rerun_elpp_url)
        request = self.session.get(measurement.rerun_elpp_url, stream=True)

        if request.status_code != 200:
            logger.error(
                "Could not rerun processing for %s. Status code: %s" % (measurement_id, request.status_code))
        else:
            logger.info("Rerun-elpp command submitted successfully for id {}.".format(measurement_id))

        # NOTE(review): the monitoring step is assumed to belong to the "measurement found" branch;
        # confirm against the indentation of the original file.
        if monitor:
            self.monitor_processing(measurement_id)
victor@7 391
def rerun_all(self, measurement_id, monitor=True):
    """ Ask the SCC to rerun the whole processing chain of an existing measurement.

    Parameters
    ----------
    measurement_id : str
        The id of the measurement to reprocess.
    monitor : bool
        If True, the processing is monitored (see monitor_processing) after the request.
    """
    logger.debug("Started rerun_all procedure.")

    logger.debug("Getting measurement %s", measurement_id)
    measurement, _status = self.get_measurement(measurement_id)

    # Nothing to do when the measurement could not be retrieved.
    if not measurement:
        return

    logger.debug("Attempting to rerun all processing through %s.", measurement.rerun_all_url)
    response = self.session.get(measurement.rerun_all_url, stream=True)

    if response.status_code == 200:
        logger.info("Rerun-all command submitted successfully for id {}.".format(measurement_id))
    else:
        logger.error("Could not rerun pre processing for %s. Status code: %s" %
                     (measurement_id, response.status_code))

    # NOTE(review): the monitoring step is assumed to belong to the "measurement found" branch;
    # confirm against the indentation of the original file.
    if monitor:
        self.monitor_processing(measurement_id)
victor@7 411
def process(self, filename, system_id, monitor, force_upload, delete_related, delay=0, cloudfree=False,
            rs_filename=None, lr_filename=None, ov_filename=None):
    """ Upload a file and, if requested, follow its processing until it finishes.

    All arguments except monitor are passed on to upload_file. Monitoring is skipped when monitor
    is False, when a positive delay is given or when the upload did not return a measurement id.

    Returns
    -------
    : object or None
        The value returned by monitor_processing, or None when no monitoring took place.
    """
    logger.info("--- Processing started on %s. ---" % datetime.datetime.now())

    logger.info("Uploading file.")
    upload_options = dict(delay=delay,
                          cloudfree=cloudfree,
                          rs_filename=rs_filename,
                          lr_filename=lr_filename,
                          ov_filename=ov_filename)
    measurement_id = self.upload_file(filename, system_id, force_upload, delete_related, **upload_options)

    if not monitor:
        return None

    if delay > 0:
        logger.warning("Will not start monitoring, since a delay was specified: {} hours.".format(delay))
        return None

    if not measurement_id:
        return None

    logger.info("Monitoring processing.")
    return self.monitor_processing(measurement_id)
victor@7 436
def monitor_processing(self, measurement_id, retry_max=2, time_sleep=2, exit_if_missing=True):
    """ Monitor the processing progress of a measurement id and download its products when it finishes.

    Parameters
    ----------
    measurement_id : str
        The id of the measurement to follow.
    retry_max : int
        Number of additional lookups that are tried after a failed one. The same limit is used for
        consecutive failed status updates while the processing is being followed.
    time_sleep : int or float
        Seconds to wait between two lookups of the measurement.
    exit_if_missing : bool
        If True, the program exits with status 1 when the measurement cannot be retrieved. If False,
        None is returned instead.

    Returns
    -------
    : Measurement object or None
        The measurement in its final state, or None if it could not be retrieved.
    """
    max_attempts = retry_max + 1

    # try to wait for measurement to appear in API. A user has reported that this does not happen immediately.
    measurement = None
    logger.info("Looking for measurement %s on the SCC.", measurement_id)

    attempts_count = 0
    while attempts_count < max_attempts:
        attempts_count += 1
        measurement, status = self.get_measurement(measurement_id)
        if status == 200:
            break

        logger.warning("Measurement not found.")
        if attempts_count < max_attempts:
            logger.warning("Waiting %ds.", time_sleep)
            time.sleep(time_sleep)

    # This used to be a print statement; library code reports through the logger instead.
    logger.debug("Measurement: %s", measurement)

    if measurement is None:
        logger.error("Measurement %s doesn't seem to exist.", measurement_id)
        if exit_if_missing:
            sys.exit(1)
        else:
            return measurement

    logger.info('Measurement %s found.', measurement_id)

    # get_measurement returns None when the API call fails. A failed update must not replace the
    # last known state (that would crash on the next has_finished check), but the polling is
    # abandoned after max_attempts failures in a row.
    failed_updates = 0
    while not measurement.has_finished:
        measurement.log_processing_status()
        time.sleep(10)
        updated_measurement, status = self.get_measurement(measurement_id)

        if updated_measurement is None:
            failed_updates += 1
            logger.warning("Could not update the status of measurement %s (status code %s).",
                           measurement_id, status)
            if failed_updates >= max_attempts:
                logger.error("Measurement %s doesn't seem to exist.", measurement_id)
                if exit_if_missing:
                    sys.exit(1)
                return None
            continue

        failed_updates = 0
        measurement = updated_measurement

    logger.info("Measurement processing finished.")
    measurement.log_detailed_status()

    # A module status of 127 is the value that triggers the download of the module products.
    if measurement.hirelpp == 127:
        logger.info("Downloading HiRElPP files.")
        self.download_hirelpp(measurement_id)
    if measurement.cloudmask == 127:
        logger.info("Downloading cloud screening files.")
        self.download_cloudmask(measurement_id)
    if measurement.elpp == 127:
        logger.info("Downloading ElPP files.")
        self.download_elpp(measurement_id)
    if measurement.elda == 127:
        logger.info("Downloading ELDA files.")
        self.download_elda(measurement_id)
        logger.info("Downloading ELDA plots.")
        self.download_plots(measurement_id)
    if measurement.elic == 127:
        logger.info("Downloading ELIC files.")
        self.download_elic(measurement_id)
    # NOTE(review): ELDEC is checked against 0 and not 127 like the other modules - confirm this is intended.
    if measurement.is_calibration and measurement.eldec == 0:
        logger.info("Downloading ELDEC files.")
        self.download_eldec(measurement_id)
    logger.info("--- Processing finished. ---")

    return measurement
victor@7 499
def download_products(self, measurement, dir_name):
    """ Download all the products of a measurement (used only for E-SHAPE).

    The files are saved as by the other download methods, but with dir_name appended to the
    output directory for the duration of the call.

    Parameters
    ----------
    measurement : Measurement object
        The measurement whose products are downloaded. Its id and module statuses are read.
    dir_name : str
        Name appended to the output directory, followed by "/".
        NOTE(review): plain string concatenation is used, so the output directory is expected
        to end with a path separator - confirm against callers.

    Returns
    -------
    : Measurement object
        The measurement received as input.
    """
    measurement_id = measurement.id
    base_output_dir = self.output_dir
    self.output_dir = self.output_dir + dir_name + "/"

    # The output directory is changed only temporarily: restore it even if something fails.
    try:
        if measurement.hirelpp == 127:
            logger.info("Downloading HiRElPP files.")
            self.download_hirelpp(measurement_id)
        if measurement.cloudmask == 127:
            logger.info("Downloading cloud screening files.")
            self.download_cloudmask(measurement_id)
        if measurement.elpp == 127:
            logger.info("Downloading ElPP files.")
            self.download_elpp(measurement_id)
        if measurement.elda == 127:
            logger.info("Downloading ELDA files.")
            self.download_elda(measurement_id)
            logger.info("Downloading ELDA plots.")
            self.download_plots(measurement_id)
        if measurement.elic == 127:
            logger.info("Downloading ELIC files.")
            self.download_elic(measurement_id)
        if measurement.is_calibration and measurement.eldec == 0:
            logger.info("Downloading ELDEC files.")
            self.download_eldec(measurement_id)
        logger.info("--- Processing finished. ---")
    finally:
        self.output_dir = base_output_dir

    return measurement
claudio@68 530
def get_measurement(self, measurement_id):
    """ Get a measurement information from the SCC API.

    Parameters
    ----------
    measurement_id : str
        The measurement ID to search.

    Returns
    -------
    measurement : Measurement object or None
        If the measurement is found, a Measurement object is returned. If not, it is None.
    status_code : int or None
        The HTTP status code of the API response. It is None if no request was made because
        measurement_id is None.
    """
    # TODO: Consider to homogenize with get_ancillary method (i.e. always return a Measurement object).

    # Callers unpack two values, so a pair is returned also when there is nothing to search for.
    if measurement_id is None:  # TODO: Is this still required?
        return None, None

    # Access the API
    measurement_url = self.api_measurement_pattern.format(measurement_id)
    logger.debug("Measurement API URL: %s", measurement_url)

    response = self.session.get(measurement_url)

    response_dict = None

    if response.status_code == 200:
        response_dict = response.json()
    elif response.status_code == 404:
        logger.info("No measurement with id %s found on the SCC.", measurement_id)
    else:
        logger.error('Could not access API. Status code %s.', response.status_code)

    # TODO: Implement better handling for status 401.

    measurement = Measurement(self.base_url, response_dict) if response_dict else None

    return measurement, response.status_code
victor@7 572
def delete_measurement(self, measurement_id, delete_related):
    """ Delete the measurement with the provided id through the admin pages of the web interface.

    The API is used only to check that the measurement exists; the deletion itself is done by
    submitting the confirmation form of the admin site, so the user needs access to it.

    Parameters
    ----------
    measurement_id : str
        The id of the measurement to delete.
    delete_related : bool
        Selects the 'delete_related' (True) or 'not_delete_related' (False) option of the form.

    Returns
    -------
    : True or None
        True if the measurement was deleted, None if it was not found or a page request failed.
    """
    measurement, _ = self.get_measurement(measurement_id)
    if measurement is None:
        logger.warning("Nothing to delete.")
        return None

    # Open the page asking to confirm the deletion; its cookie carries the CSRF token.
    delete_url = self.delete_measurement_pattern.format(measurement_id)
    confirm_page = self.session.get(delete_url)
    if confirm_page.status_code != 200:
        logger.warning("Could not open delete page. Status: {0}".format(confirm_page.status_code))
        return None

    related_choice = 'delete_related' if delete_related else 'not_delete_related'
    form_data = {'post': 'yes',
                 'select_delete_related_measurements': related_choice}
    request_headers = {'X-CSRFToken': confirm_page.cookies['csrftoken'],
                       'referer': delete_url}

    # Confirm the deletion
    delete_page = self.session.post(delete_url, data=form_data, headers=request_headers)
    if delete_page.ok:
        logger.info("Deleted measurement {0}".format(measurement_id))
        return True

    logger.warning("Something went wrong. Delete page status: {0}".format(
        delete_page.status_code))
    return None
victor@7 618
def available_measurements(self, start_gte=None, stop_lte=None):
    """ Get the measurements available on the SCC as a list of Measurement objects.

    Parameters
    ----------
    start_gte, stop_lte : object or None
        Optional values sent as the 'start__gte' and 'stop__lte' query parameters of the API request.
        Parameters that are None are not sent.

    Returns
    -------
    : list of Measurement objects or None
        None is returned if the API response is empty.
    """
    optional_filters = (('start__gte', start_gte), ('stop__lte', stop_lte))
    params = {key: value for key, value in optional_filters if value is not None}

    response_dict = self.session.get(self.api_measurements_url, params=params).json()

    if not response_dict:
        logger.warning("No response received from the SCC when asked for available measurements.")
        return None

    measurements = []
    for measurement_dict in response_dict['objects']:
        measurements.append(Measurement(self.base_url, measurement_dict))
    logger.info("Found %s measurements on the SCC." % len(measurements))

    return measurements
victor@7 643
def list_measurements(self, id_exact=None, id_startswith=None,
                      start_exact=None, start_gte=None, start_lte=None,
                      stop_exact=None, stop_gte=None, stop_lte=None,
                      station_exact=None, station_in=None):
    """ Query the measurements API and return the text of the response.

    Only the arguments that are not None are sent as query parameters. Inside each group an
    exact value takes precedence: id_exact over id_startswith, start_exact over start_gte and
    start_lte, stop_exact over stop_gte and stop_lte, station_exact over station_in.
    """
    # TODO: Add some error handling, e.g. as per available_measurements method

    params = {}

    def add(key, value):
        # Register a filter if it was given; tell the caller whether it was.
        if value is None:
            return False
        params[key] = value
        return True

    if not add('id__exact', id_exact):
        add('id__startswith', id_startswith)

    if not add('start__exact', start_exact):
        add('start__gte', start_gte)
        add('start__lte', start_lte)

    if not add('stop__exact', stop_exact):
        add('stop__gte', stop_gte)
        add('stop__lte', stop_lte)

    if not add('station__exact', station_exact):
        add('station__in', station_in)

    response = self.session.get(self.api_measurements_url, params=params)
    return response.text
moritz@29 684
def measurement_id_for_date(self, t1, call_sign, base_number=0):
    """ Return the first measurement id that is not yet used on the SCC for the given date.

    Candidate ids consist of the date (YYYYMMDD), the call sign and a two-digit number that starts
    at `base_number` and is increased until an id is found that the API did not return.

    Returns None if the API response is empty. Raises ValueError if the API returns exactly
    100 measurements for the date and call sign (presumably all two-digit numbers are then
    taken -- to be confirmed).
    """
    # TODO: Check if this method needs updating to handle all measurement_ID formats.
    base_id = "%s%s" % (t1.strftime('%Y%m%d'), call_sign)
    search_url = urlparse.urljoin(self.api_base_url, 'measurements/?id__startswith=%s' % base_id)

    response_dict = self.session.get(search_url).json()
    if not response_dict:
        return None

    measurement_list = response_dict['objects']
    if len(measurement_list) == 100:
        raise ValueError('No available measurement id found.')

    existing_ids = [entry['id'] for entry in measurement_list]

    measurement_number = base_number
    while True:
        candidate_id = "%s%02i" % (base_id, measurement_number)
        if candidate_id not in existing_ids:
            return candidate_id
        measurement_number += 1
victor@7 716
def get_ancillary(self, file_path, file_type):
    """
    Look up an ancillary file on the SCC API by its file name.

    Parameters
    ----------
    file_path : str
       Path of the uploaded file. Only its base name is used in the search.
    file_type : str
       Type of ancillary file. One of 'sounding', 'overlap', 'lidarratio'.

    Returns
    -------
    ancillary_file : AncillaryFile or None
       The api object built from the first search result. If the search returns nothing, an empty
       AncillaryFile (with .exists set to False) is returned. None if the API could not be accessed.
    status_code : int
       HTTP status code of the API response.
    """
    assert file_type in ['sounding', 'overlap', 'lidarratio']

    filename = os.path.basename(file_path)

    # Each file type has its own search URL pattern; anything else falls back to the lidar ratio one.
    pattern_names = {'sounding': 'api_sounding_search_pattern',
                     'overlap': 'api_overlap_search_pattern'}
    search_pattern = getattr(self, pattern_names.get(file_type, 'api_lidarratio_search_pattern'))

    response = self.session.get(search_pattern.format(filename))
    status_code = response.status_code

    if not response.ok:
        logger.error('Could not access API. Status code %s.' % status_code)
        return None, status_code

    object_list = response.json()['objects']
    logger.debug("Ancillary file JSON: {0}".format(object_list))

    # Assume only one file is returned; no result gives an empty object.
    file_dict = object_list[0] if object_list else None
    return AncillaryFile(self.api_base_url, file_dict), status_code
i@38 762
def __enter__(self):
    """ Return the object itself, so that it can be bound by ``with ... as``. """
    return self
victor@7 765
def __exit__(self, *args):
    """ Close the session when leaving the ``with`` block.

    The exception details passed in `args` are ignored and nothing is returned, so an exception
    raised inside the block propagates.
    """
    logger.debug("Closing SCC connection session.")
    self.session.close()
ioannis@43 769
class PageNotAccessibleError(RuntimeError):
    """ Error for a page that cannot be accessed.

    NOTE(review): the places that raise it are outside this section -- confirm the exact conditions there.
    """
ioannis@43 772
victor@7 773
class ApiObject(object):
    """ Generic object exposing the key/value pairs of an API response as attributes.

    Parameters
    ----------
    base_url : str
       Stored as the `base_url` attribute.
    dict_response : dict or None
       Dictionary describing the object. If it is empty or None, no attributes are added and
       `exists` is set to False; otherwise `exists` is set to True.
    """

    def __init__(self, base_url, dict_response):
        self.base_url = base_url

        if dict_response:
            # Add the dictionary key value pairs as object properties
            for key, value in dict_response.items():
                try:
                    setattr(self, key, value)
                except Exception:
                    # Best effort: e.g. a key clashing with a read-only property is skipped.
                    # KeyboardInterrupt and SystemExit are deliberately not caught here.
                    logger.warning('Could not set attribute {0} to value {1}'.format(key, value))
            self.exists = True
        else:
            self.exists = False
victor@7 791
victor@7 792
class Measurement(ApiObject):
    """ This class represents the measurement object as returned in the SCC API.

    The attributes listed in __init__ are first set to None, so that they always exist. They are
    then overwritten by the values found in the API response, when the parent constructor is called.
    """

    def __init__(self, base_url, dict_response):

        # Define expected attributes to assist debugging

        # Status and exit code of each processing module
        self.hirelpp = None
        self.hirelpp_exit_code = None
        self.cloudmask = None
        self.cloudmask_exit_code = None
        self.elpp = None
        self.elpp_exit_code = None
        self.elda = None
        self.elda_exit_code = None
        self.elic = None
        self.elic_exit_code = None
        self.eldec = None
        self.eldec_exit_code = None
        self.elquick = None
        self.elquick_exit_code = None

        # Identification and processing state
        self.id = None
        self.num_id = None
        self.is_calibration = None
        self.is_running = None
        self.is_queued = None

        # Remaining fields of the API response
        self.resource_uri = None
        self.start = None
        self.stop = None
        self.system = None
        self.station = None
        self.upload = None

        super().__init__(base_url, dict_response)

    @property
    def has_finished(self):
        """ Temporary implementation for SCC version 5.2.0, until the API returns a flag indicating if the
        processing measurement has finished.

        True when `is_running` is False and at least one of `hirelpp`, `elpp` differs from 0.
        """
        return (self.is_running is False) and (self.hirelpp != 0 or self.elpp != 0)

    def log_processing_status(self):
        """ Log module status. """
        logger.info("Measurement is being processed. Status: ({}, {}, {}, {}, {}, {}, {}). Please wait.".format(
            self.upload,
            self.hirelpp,
            self.cloudmask,
            self.elpp,
            self.elda,
            self.elic,
            self.elquick))

    def log_detailed_status(self):
        """ Log module exit and status codes.

        For calibration measurements only ElPP and ElDEC are reported; otherwise HiRElPP, CloudScreen,
        ElPP, ELDA, ELIC and ELQuick are reported.
        """
        logger.info("Measurement {0} exit status:".format(self.id))
        if self.is_calibration:
            self._log_module_status('ElPP', self.elpp, self.elpp_exit_code)
            self._log_module_status('ElDEC', self.eldec, self.eldec_exit_code)
        else:
            self._log_module_status('HiRElPP', self.hirelpp, self.hirelpp_exit_code)
            self._log_module_status('CloudScreen', self.cloudmask, self.cloudmask_exit_code)
            self._log_module_status('ElPP', self.elpp, self.elpp_exit_code)
            self._log_module_status('ELDA', self.elda, self.elda_exit_code)
            self._log_module_status('ELIC', self.elic, self.elic_exit_code)
            self._log_module_status('ELQuick', self.elquick, self.elquick_exit_code)

    def _log_module_status(self, name, status, exit_code):
        """ Log the exit code of one module.

        A positive exit code is logged as a warning, anything else as info. `status` is accepted but
        not part of the logged message.
        """
        if exit_code:
            log = logger.warning if exit_code['exit_code'] > 0 else logger.info
            log("{0} exit code: {2[exit_code]} - {2[description]}".format(name, status, exit_code))
        else:
            logger.info("{0} exit code: {2}".format(name, status, exit_code))

    def _rerun_url(self, action):
        """ Return the website URL of the given rerun action (e.g. 'rerun-all') for this measurement. """
        url_pattern = urlparse.urljoin(self.base_url, 'data_processing/measurements/{0}/' + action + '/')
        return url_pattern.format(self.id)

    @property
    def rerun_elda_url(self):
        """ URL of the 'rerun-elda' page of this measurement. """
        return self._rerun_url('rerun-elda')

    @property
    def rerun_elpp_url(self):
        """ URL of the 'rerun-elpp' page of this measurement. """
        return self._rerun_url('rerun-elpp')

    @property
    def rerun_all_url(self):
        """ URL of the 'rerun-all' page of this measurement. """
        return self._rerun_url('rerun-all')

    def __str__(self):
        return "Measurement {}".format(self.id)
victor@7 891
victor@7 892
class AncillaryFile(ApiObject):
    """ This class represents the ancillary file object as returned in the SCC API.
    """

    @property
    def already_on_scc(self):
        """ True if the API returned the file and its status is not 'missing'. """
        if self.exists is False:
            return False

        return self.status != 'missing'

    def __str__(self):
        # An empty object (no API data) has none of these attributes; show None instead of failing.
        return "%s: %s, %s" % (getattr(self, 'id', None),
                               getattr(self, 'filename', None),
                               getattr(self, 'status', None))
i@38 908
i@38 909
ioannis@67 910 # Methods that use the SCC class to perform specific tasks.
# Methods that use the SCC class to perform specific tasks.
def process_file(filename, system_id, settings, force_upload, delete_related,
                 delay=0, cloudfree=False, monitor=True, rs_filename=None, lr_filename=None, ov_filename=None):
    """ Shortcut function to process a file to the SCC.

    Opens an SCC session with the credentials found in `settings`, logs in, passes the file and all
    options to SCC.process, logs out and returns what SCC.process returned.
    """
    logger.info("Processing file %s, using system %s" % (filename, system_id))

    processing_options = {
        'force_upload': force_upload,
        'delete_related': delete_related,
        'delay': delay,
        'cloudfree': cloudfree,
        'monitor': monitor,
        'rs_filename': rs_filename,
        'lr_filename': lr_filename,
        'ov_filename': ov_filename,
    }

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
        scc.login(settings['website_credentials'])
        measurement = scc.process(filename, system_id, **processing_options)
        scc.logout()

    return measurement
victor@7 929
victor@7 930
def delete_measurements(measurement_ids, delete_related, settings):
    """ Shortcut function to delete measurements from the SCC.

    All ids are deleted, one after the other, within a single login session.
    """
    basic_credentials = settings['basic_credentials']
    output_dir = settings['output_dir']
    base_url = settings['base_url']

    with SCC(basic_credentials, output_dir, base_url) as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Deleting %s." % measurement_id)
            scc.delete_measurement(measurement_id, delete_related)

        scc.logout()
moritz@29 939
moritz@29 940
def rerun_all(measurement_ids, monitor, settings):
    """ Shortcut function to rerun all processing steps of measurements on the SCC.

    All ids are handled, one after the other, within a single login session. `monitor` is
    passed on to SCC.rerun_all.
    """
    basic_credentials = settings['basic_credentials']
    output_dir = settings['output_dir']
    base_url = settings['base_url']

    with SCC(basic_credentials, output_dir, base_url) as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Rerunning all products for %s." % measurement_id)
            scc.rerun_all(measurement_id, monitor)

        scc.logout()
victor@7 950
victor@7 951
def rerun_processing(measurement_ids, monitor, settings):
    """ Shortcut function to rerun the ELPP processing of measurements on the SCC.

    All ids are handled, one after the other, within a single login session. `monitor` is
    passed on to SCC.rerun_elpp.
    """
    basic_credentials = settings['basic_credentials']
    output_dir = settings['output_dir']
    base_url = settings['base_url']

    with SCC(basic_credentials, output_dir, base_url) as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Rerunning (optical) processing for %s" % measurement_id)
            scc.rerun_elpp(measurement_id, monitor)

        scc.logout()
moritz@29 961
moritz@29 962
def list_measurements(settings, id_exact=None, id_startswith=None,
                      start_exact=None, start_gte=None, start_lte=None,
                      stop_exact=None, stop_gte=None, stop_lte=None,
                      station_exact=None, station_in=None):
    """ Print the measurements that match the given filters.

    The filters are passed unchanged to SCC.list_measurements and the text it returns is printed.
    """
    filters = {
        'id_exact': id_exact, 'id_startswith': id_startswith,
        'start_exact': start_exact, 'start_gte': start_gte, 'start_lte': start_lte,
        'stop_exact': stop_exact, 'stop_gte': stop_gte, 'stop_lte': stop_lte,
        'station_exact': station_exact, 'station_in': station_in,
    }

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
        scc.login(settings['website_credentials'])
        print(scc.list_measurements(**filters))
        scc.logout()
victor@7 978
victor@7 979
def download_measurements(measurement_ids, max_retries, exit_if_missing, settings):
    """ Download all measurements for the specified IDs.

    Each id is passed to SCC.monitor_processing (with a sleep time of 3), within a single login session.
    """
    basic_credentials = settings['basic_credentials']
    output_dir = settings['output_dir']
    base_url = settings['base_url']

    with SCC(basic_credentials, output_dir, base_url) as scc:
        scc.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            scc.monitor_processing(measurement_id,
                                   retry_max=max_retries,
                                   time_sleep=3,
                                   exit_if_missing=exit_if_missing)

        scc.logout()
i@14 988
i@14 989
def eshape_downloader(settings):
    """ Download the SCC products that correspond to recent E-SHAPE folders.

    The sub-folders of settings['output_dir'] are scanned. Only folder names made of six digits,
    an underscore and twelve digits are considered; the part after the underscore is read as the
    start time (format YYYYmmddHHMM). For every folder whose start time is not older than three
    days, the measurements starting at or after that time and stopping up to now are requested
    from the SCC, and the products of each one are downloaded by SCC.download_products, which
    receives the folder name as second argument.
    """
    eshape_dir = settings['output_dir']
    folders_pattern = re.compile(r"^(\d{6}_{1}\d{12})+$")  # Raw string: \d is not a valid str escape
    max_age = datetime.timedelta(days=3)

    # List the folders before any download starts, so folders created meanwhile are not picked up.
    directories = [entry.name for entry in os.scandir(eshape_dir)
                   if entry.is_dir() and folders_pattern.match(entry.name)]

    for dir_name in directories:
        start_string = dir_name.split("_")[1]
        date_time_start = datetime.datetime.strptime(start_string, '%Y%m%d%H%M')

        # Use a single "now" for both the age check and the stop limit of the query.
        now = datetime.datetime.now()
        if date_time_start < now - max_age:
            continue

        start_parameter = date_time_start.strftime("%Y-%m-%dT%H:%M:%S")
        stop_parameter = now.strftime("%Y-%m-%dT%H:%M:%S")

        with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
            scc.login(settings['website_credentials'])

            measurements = scc.available_measurements(start_gte=start_parameter, stop_lte=stop_parameter)
            if measurements is not None:
                for meas in measurements:
                    scc.download_products(meas, dir_name)

            scc.logout()
claudio@68 1013
claudio@68 1014
def settings_from_path(config_file_path):
    """ Read the configuration file.

    The file should be in YAML syntax.

    Parameters
    ----------
    config_file_path : str
       Path of the configuration file.

    Returns
    -------
    : dict
       The settings, with 'basic_credentials' and 'website_credentials' converted to tuples.

    Raises
    ------
    argparse.ArgumentTypeError
       If the path is not a file, or if the file cannot be parsed. In the second case the
       original error is kept as the cause of the exception.
    """
    if not os.path.isfile(config_file_path):
        raise argparse.ArgumentTypeError("Wrong path for configuration file (%s)" % config_file_path)

    with open(config_file_path) as yaml_file:
        try:
            settings = yaml.safe_load(yaml_file)
        except Exception as err:
            raise argparse.ArgumentTypeError("Could not parse YAML file (%s)" % config_file_path) from err

    logger.debug("Read settings file(%s)" % config_file_path)

    # YAML limitation: does not read tuples
    settings['basic_credentials'] = tuple(settings['basic_credentials'])
    settings['website_credentials'] = tuple(settings['website_credentials'])
    return settings
i@14 1034
i@14 1035
moritz@29 1036 # Setup for command specific parsers
def setup_delete(parser):
    """ Configure the parser of the "delete" command: one or more measurement IDs. """
    parser.add_argument("IDs", nargs="+", help="measurement IDs to delete.")

    def run_delete(parsed):
        # Related measurements are never deleted when called from the command line.
        delete_measurements(parsed.IDs, delete_related=False, settings=parsed.config)

    parser.set_defaults(execute=run_delete)
moritz@29 1045
moritz@29 1046
def setup_rerun_all(parser):
    """ Configure the parser of the "rerun-all" command: measurement IDs and the -p/--process flag. """
    parser.add_argument("IDs", nargs="+", help="Measurement IDs to rerun.")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the results of the processing.")

    def run_rerun_all(parsed):
        rerun_all(parsed.IDs, parsed.process, parsed.config)

    parser.set_defaults(execute=run_rerun_all)
moritz@29 1055
moritz@29 1056
def setup_rerun_elpp(parser):
    """ Configure the parser of the "rerun-elpp" command: measurement IDs and the -p/--process flag. """
    parser.add_argument("IDs", nargs="+", help="Measurement IDs to rerun the processing on.")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the results of the processing.")

    def run_rerun_elpp(parsed):
        rerun_processing(parsed.IDs, parsed.process, parsed.config)

    parser.set_defaults(execute=run_rerun_elpp)
moritz@29 1065
moritz@29 1066
def setup_upload_file(parser):
    """ Configure the parser of the "upload-file" command.

    The processing is monitored only if the -p/--process flag is given.
    """

    def delay(arg):
        # Argparse type: an integer number of hours in the range 0 to 96.
        try:
            hours = int(arg)
        except ValueError:
            raise argparse.ArgumentTypeError("Could not convert delay argument {} to integer.".format(arg))

        if not 0 <= hours <= 96:
            raise argparse.ArgumentTypeError("Delay should be an integer between 0 and 96.")

        return hours

    def upload_file_from_args(parsed):
        process_file(parsed.filename, parsed.system, parsed.config,
                     force_upload=parsed.force_upload,
                     delete_related=False,  # For now, use this as default
                     delay=parsed.delay,
                     cloudfree=parsed.cloudfree,
                     monitor=parsed.process,
                     rs_filename=parsed.radiosounding,
                     lr_filename=parsed.lidarratio,
                     ov_filename=parsed.overlap)

    # Positional arguments
    parser.add_argument("filename", help="Measurement file name or path.")
    parser.add_argument("system", help="Processing system id.")

    # Processing options
    parser.add_argument("--delay", default=0, type=delay,
                        help="Delay processing by the specified number of hours (0 to 96).")
    parser.add_argument("--cloudfree", action="store_true", default=False,
                        help="Manually assume this measurement as cloud free.")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the processing results.")
    parser.add_argument("--force_upload", action="store_true",
                        help="If measurement ID exists on SCC, delete before uploading.")

    # Optional ancillary files
    parser.add_argument("--radiosounding", default=None, help="Radiosounding file name or path")
    parser.add_argument("--overlap", default=None, help="Overlap file name or path")
    parser.add_argument("--lidarratio", default=None, help="Lidar ratio file name or path")

    parser.set_defaults(execute=upload_file_from_args)
moritz@29 1107
moritz@29 1108
def setup_list_measurements(parser):
    """ Configure the parser of the "list" command.

    All filters are optional. The two id filters are mutually exclusive, and so are the two
    station filters.
    """

    def list_measurements_from_args(parsed):
        list_measurements(parsed.config, id_exact=parsed.id_exact, id_startswith=parsed.id_startswith,
                          start_exact=parsed.start_exact, start_gte=parsed.start_gte, start_lte=parsed.start_lte,
                          stop_exact=parsed.stop_exact, stop_gte=parsed.stop_gte, stop_lte=parsed.stop_lte,
                          station_exact=parsed.station_exact, station_in=parsed.station_in)

    group = parser.add_argument_group()

    group_id = group.add_mutually_exclusive_group()
    group_id.add_argument("--id_exact", help="Exact measurement id.")
    group_id.add_argument("--id_startswith", help="Initial part of measurement id.")

    # The start and stop filters are added directly to the group: calling add_argument_group()
    # on an argument group is deprecated in argparse, and options added that way are left out
    # of the help text.
    group.add_argument("--start_exact", help="Exact start date of the measurement.")
    group.add_argument("--start_gte", help="Start date of the measurement after the given date.")
    group.add_argument("--start_lte", help="Start date of the measurement before the given date.")

    group.add_argument("--stop_exact", help="Exact stop date of the measurement.")
    group.add_argument("--stop_gte", help="Stop date of the measurement after the given date.")
    group.add_argument("--stop_lte", help="Stop date of the measurement before the given date.")

    group_station = group.add_mutually_exclusive_group()
    group_station.add_argument("--station_exact", help="Station the performed the measurement.")
    group_station.add_argument("--station_in", help="List of stations (separated by comma) that performed the measurement.")

    parser.set_defaults(execute=list_measurements_from_args)
moritz@29 1137
moritz@29 1138
def setup_download_measurements(parser):
    """ Configure the parser of the "download" command: measurement IDs, --max_retries, --ignore_errors. """
    parser.add_argument("IDs", nargs="+", help="Measurement IDs that should be downloaded.")
    parser.add_argument("--max_retries", type=int, default=0,
                        help="Number of times to retry in cases of missing measurement id.")
    # store_false: the attribute is True by default and False when the flag is given.
    # Its value is passed to download_measurements as exit_if_missing.
    parser.add_argument("--ignore_errors", action="store_false",
                        help="Ignore errors when downloading multiple measurements.")

    def run_download(parsed):
        download_measurements(parsed.IDs, parsed.max_retries, parsed.ignore_errors, parsed.config)

    parser.set_defaults(execute=run_download)
moritz@29 1149
moritz@29 1150
def setup_eshape_downloader(parser):
    """ Configure the parser of the "eshape-downloader" command, which takes no arguments of its own. """

    def run_from_args(parsed):
        eshape_downloader(parsed.config)

    parser.set_defaults(execute=run_from_args)
claudio@68 1156
claudio@68 1157
def main():
    """ Command line entry point.

    Builds the argument parser with one sub-command per task, reads the configuration file,
    sets up logging and runs the function registered by the selected sub-command. If no
    sub-command is given, a usage error is reported.
    """
    # Define the command line arguments.
    parser = argparse.ArgumentParser()
    subparsers = parser.add_subparsers()

    # (command name, help text, function that configures the sub-parser)
    commands = (
        ("delete", "Deletes a measurement.", setup_delete),
        ("rerun-all", "Rerun all processing steps for the provided measurement IDs.", setup_rerun_all),
        ("rerun-elpp", "Rerun low-resolution processing steps for the provided measurement ID.",
         setup_rerun_elpp),
        ("upload-file", "Submit a file and, optionally, download the output products.", setup_upload_file),
        ("list", "List measurements registered on the SCC.", setup_list_measurements),
        ("download", "Download selected measurements.", setup_download_measurements),
        ("eshape-downloader", "Search and download relevant products for E-SHAPE.", setup_eshape_downloader),
    )
    for command_name, command_help, setup_command in commands:
        setup_command(subparsers.add_parser(command_name, help=command_help))

    # Verbosity settings from http://stackoverflow.com/a/20663028
    parser.add_argument('-d', '--debug', help="Print debugging information.", action="store_const",
                        dest="loglevel", const=logging.DEBUG, default=logging.INFO,
                        )
    parser.add_argument('-s', '--silent', help="Show only warning and error messages.", action="store_const",
                        dest="loglevel", const=logging.WARNING
                        )

    # Setup default config location
    home = os.path.expanduser("~")
    default_config_location = os.path.abspath(os.path.join(home, ".scc_access.yaml"))
    parser.add_argument("-c", "--config", help="Path to the config file.", type=settings_from_path,
                        default=default_config_location)

    args = parser.parse_args()

    # Get the logger with the appropriate level
    logging.basicConfig(format='%(levelname)s: %(message)s', level=args.loglevel)

    # Dispatch to appropriate function. "execute" is set only by the sub-parsers, so it is
    # missing when the script is called without a command.
    execute = getattr(args, 'execute', None)
    if execute is None:
        parser.error("No command specified. Use -h to list the available commands.")

    execute(args)
moritz@29 1204
i@14 1205
# Run the command line interface only when the file is executed as a script, not when it is imported.
if __name__ == "__main__":
    main()

mercurial