scc_access/scc_access.py

Tue, 26 Sep 2023 16:56:35 +0200

author
Claudio Dema <claudio.dema@imaa.cnr.it>
date
Tue, 26 Sep 2023 16:56:35 +0200
changeset 70
4ef6f2102a61
parent 69
cd8bc07f8419
child 71
bf545d90784d
permissions
-rw-r--r--

Filter available measurements for is_being_processed and is_queued parameters

ioannis@67 1 """ This is a script that allows interaction with the SCC through the command line.
ioannis@67 2
ioannis@67 3 It is based on the requests module for accessing the server.
ioannis@67 4
ioannis@67 5 Most of the interactions are done through the web interface, i.e. by mimicking user interaction with the
ioannis@67 6 SCC website (i.e. user login, data submission, etc.). In few cases, the SCC API is also used.
ioannis@67 7
ioannis@67 8 Most of the functionality is included in the SCC class. The class is used to login into the SCC website and automate
ioannis@67 9 interaction with the site (i.e. upload a file, get measurement status, etc.).
ioannis@67 10
ioannis@67 11 Two other classes (Measurement, AncillaryFile) are used in some cases to handle the output of the SCC API.
ioannis@67 12
ioannis@67 13 Several shortcut functions are defined to perform specific tasks using the SCC class (e.g. process_file, delete_measurements etc).
ioannis@67 14 """
ioannis@43 15 import sys
ioannis@43 16
victor@7 17 import requests
victor@7 18
ioannis@43 19 try:
ioannis@43 20 import urllib.parse as urlparse # Python 3
ioannis@43 21 except ImportError:
ioannis@17 22 import urlparse # Python 2
ioannis@43 23
victor@7 24 import argparse
madrouin@24 25 import datetime
madrouin@24 26 import logging
victor@7 27 import os
victor@7 28 import re
ioannis@32 29 from io import BytesIO
ioannis@45 30
victor@7 31 import time
i@40 32
victor@7 33 from zipfile import ZipFile
madrouin@24 34
i@14 35 import yaml
victor@7 36
ioannis@43 37 import netCDF4 as netcdf
ioannis@43 38
# Silence urllib3 warnings for the whole process (presumably those caused by the
# unverified HTTPS requests made by the SCC session -- TODO confirm).
requests.packages.urllib3.disable_warnings()
logger = logging.getLogger(__name__)

# Regular expression that extracts the measurement id from the HTML of the measurement page.
# The id is captured by the named group "measurement_id".
regex = "<h3>Measurement (?P<measurement_id>.{12,15}) <small>" # {12,15} handles both old- and new-style measurement ids.
victor@7 45
victor@7 46
victor@7 47 class SCC:
ioannis@67 48 """A class that will attempt to interact with the SCC server.
i@14 49
ioannis@67 50 Most interactions are done by simulating a normal browser session. In the current
ioannis@67 51 version few checks are performed before uploading a file, and no feedback is given in case the upload
ioannis@67 52 fails.
victor@7 53 """
victor@7 54
def __init__(self, auth, output_dir, base_url):
    """ Store the connection settings and pre-compute every SCC URL used later.

    Parameters
    ----------
    auth
        Value assigned to the ``auth`` attribute of the requests session
        (presumably a (username, password) pair -- confirm with callers).
    output_dir : str
        Directory under which downloaded products are stored.
    base_url : str
        Root URL of the SCC site; all other URLs are joined onto it.
    """
    self.auth = auth
    self.output_dir = output_dir
    self.base_url = base_url

    # A single session is reused for all requests; certificate verification is disabled.
    session = requests.Session()
    session.auth = auth
    session.verify = False
    self.session = session

    join = urlparse.urljoin
    measurements_path = 'data_processing/measurements/'

    # Web-interface URLs
    self.login_url = join(base_url, 'accounts/login/')
    self.logout_url = join(base_url, 'accounts/logout/')
    self.list_measurements_url = join(base_url, measurements_path)
    self.upload_url = join(base_url, measurements_path + 'quick/')
    self.measurement_page_pattern = join(base_url, measurements_path + '{0}/')
    self.delete_measurement_pattern = join(base_url, 'admin/database/measurements/{0}/delete/')

    # Product download URLs; "{0}" is later replaced by the measurement id.
    self.download_hirelpp_pattern = join(base_url, measurements_path + '{0}/download-hirelpp/')
    self.download_cloudmask_pattern = join(base_url, measurements_path + '{0}/download-cloudmask/')
    self.download_elpp_pattern = join(base_url, measurements_path + '{0}/download-preprocessed/')
    self.download_elda_pattern = join(base_url, measurements_path + '{0}/download-optical/')
    self.download_plots_pattern = join(base_url, measurements_path + '{0}/download-plots/')
    self.download_elic_pattern = join(base_url, measurements_path + '{0}/download-elic/')

    # API URLs
    api_base_url = join(base_url, 'api/v1/')
    self.api_base_url = api_base_url
    self.api_measurement_pattern = join(api_base_url, 'measurements/{0}/')
    self.api_measurements_url = join(api_base_url, 'measurements')
    self.api_sounding_search_pattern = join(api_base_url, 'sounding_files/?filename={0}')
    self.api_lidarratio_search_pattern = join(api_base_url, 'lidarratio_files/?filename={0}')
    self.api_overlap_search_pattern = join(api_base_url, 'overlap_files/?filename={0}')
ioannis@43 93
def login(self, credentials):
    """ Login to the SCC through the web login form.

    Parameters
    ----------
    credentials : tuple or list
        A list or tuple in the form (username, password).

    Returns
    -------
    : response object
        The response of the request that submitted the credentials.

    Raises
    ------
    PageNotAccessibleError
        If the login page cannot be retrieved.
    """
    username = credentials[0]
    logger.debug("Attempting to login to SCC, username %s." % username)
    form_data = {'username': username,
                 'password': credentials[1]}

    login_url = self.login_url
    logger.debug("Accessing login page at %s." % login_url)

    # The login form is fetched first because its cookie carries the CSRF token.
    login_page = self.session.get(login_url)
    if not login_page.ok:
        raise self.PageNotAccessibleError('Could not access login pages. Status code %s' % login_page.status_code)

    logger.debug("Submitting credentials.")
    request_headers = {'X-CSRFToken': login_page.cookies['csrftoken'],
                       'referer': login_url}
    return self.session.post(login_url, data=form_data, headers=request_headers)
victor@7 121
def logout(self):
    """ Logout from the SCC by requesting the logout page; the response is returned. """
    response = self.session.get(self.logout_url, stream=True)
    return response
victor@7 125
def upload_file(self, filename, system_id, force_upload, delete_related, delay=0, cloudfree=False,
                rs_filename=None, ov_filename=None, lr_filename=None):
    """ Upload a file for processing.

    Parameters
    ----------
    filename : str
        File path of the file to upload
    system_id : int
        System id to be used in the processing
    force_upload : bool
        If True and a measurement with the same ID is found on the server, it is deleted first and
        the current file is uploaded. If False, the file is not uploaded when the measurement ID is
        already present on the SCC server (the program exits with status 1).
    delete_related : bool
        Answer to the "delete related" question when deleting existing measurements from the SCC.
    delay : int
        Processing delay submitted with the upload form.
    cloudfree : bool
        Manually set the measurement as cloud free
    rs_filename, ov_filename, lr_filename : str
        Paths of the ancillary files (sounding, overlap, lidar ratio) to be uploaded.

    Returns
    -------
    : str or bool
        The measurement id if the upload succeeded, False otherwise.
    """
    # Get the measurement ID from the netcdf file
    measurement_id = self.measurement_id_from_file(filename)

    # Handle possible existing measurements with the same ID on the SCC server.
    logger.debug('Checking if a measurement with the same id already exists on the SCC server.')
    existing_measurement, _ = self.get_measurement(measurement_id)

    if existing_measurement:
        if force_upload:
            logger.info(
                "Measurement with id {} already exists on the SCC. Trying to delete it...".format(measurement_id))
            self.delete_measurement(measurement_id, delete_related)
        else:
            logger.error(
                "Measurement with id {} already exists on the SCC. Use --force_upload flag to overwrite it.".format(
                    measurement_id))
            # TODO: Implement handling at the proper place. Exiting here does not allow the SCC class to be
            # used by external programs. Instead an exception should be raised.
            sys.exit(1)

    # Get the submit page; its cookie carries the CSRF token needed for the upload.
    upload_page = self.session.get(self.upload_url)

    upload_data = {'system': system_id,
                   'delay': delay,
                   'manually_cloud_free': cloudfree, }

    logger.debug("Submitted processing parameters - System: {}, Delay: {}, Manually Cloud Free: {}".format(
        system_id, delay, cloudfree))

    # (local path, ancillary type for get_ancillary, upload form field, label used in log messages)
    ancillary_inputs = (
        (rs_filename, 'sounding', 'sounding_file', 'sounding'),
        (ov_filename, 'overlap', 'overlap_file', 'overlap'),
        (lr_filename, 'lidarratio', 'lidar_ratio_file', 'lidar ratio'),
    )

    files = {}
    try:
        files['data'] = open(filename, 'rb')

        # Add ancillary files that are not yet on the SCC
        for path, ancillary_type, form_field, label in ancillary_inputs:
            if path is None:
                continue

            ancillary_file, _ = self.get_ancillary(path, ancillary_type)

            if ancillary_file.already_on_scc:
                logger.warning(
                    "{0} file {1.filename} already on the SCC with id {1.id}. Ignoring it.".format(
                        label.capitalize(), ancillary_file))
            else:
                logger.debug('Adding %s file %s' % (label, path))
                files[form_field] = open(path, 'rb')

        # Upload the files
        logger.info("Uploading of file %s started." % filename)

        upload_submit = self.session.post(self.upload_url,
                                          data=upload_data,
                                          files=files,
                                          headers={'X-CSRFToken': upload_page.cookies['csrftoken'],
                                                   'referer': self.upload_url})
    finally:
        # Always release the file handles, whether or not the upload succeeded.
        for file_handle in files.values():
            file_handle.close()

    if upload_submit.status_code != 200:
        logger.warning("Connection error. Status code: %s" % upload_submit.status_code)
        return False

    # Check if there was a redirect to a new page. If not, something went wrong
    if upload_submit.url == self.upload_url:
        logger.error("Uploaded file(s) rejected! Try to upload manually to see the error.")
        return False

    # Prefer the ID shown on the result page; fall back to the ID read from the input file
    # if the page layout does not match the expected pattern.
    match = re.search(regex, upload_submit.text)
    if match:
        measurement_id = match.group('measurement_id')
    else:
        logger.warning("Could not read the measurement id from the SCC response. "
                       "Using the id of the input file: %s", measurement_id)

    logger.info("Successfully uploaded measurement with id %s." % measurement_id)
    logger.info("You can monitor the processing progress online: {}".format(
        self.measurement_page_pattern.format(measurement_id)))
    return measurement_id
ioannis@43 240
@staticmethod
def measurement_id_from_file(filename):
    """ Read the measurement id stored in the input file.

    The id is taken from the ``Measurement_ID`` global attribute of the netCDF file. If the
    file does not exist or lacks this attribute, an error is logged and the program exits
    with status 1.

    Parameters
    ----------
    filename : str
        File path of the input file.
    """
    file_exists = os.path.isfile(filename)
    if not file_exists:
        logger.error("File {} does not exist.".format(filename))
        sys.exit(1)

    with netcdf.Dataset(filename) as dataset:
        try:
            return dataset.Measurement_ID
        except AttributeError:
            message = "Input file {} does not contain a Measurement_ID global attribute. Wrong file format?".format(
                filename)
            logger.error(message)
            sys.exit(1)
victor@7 265
def download_files(self, measurement_id, subdir, download_url):
    """ Download a zip archive from download_url and extract its files to the specified subdir.

    This is a general method used by the product-specific download methods. The files are
    written, without their in-archive directory structure, to
    ``<output_dir>/<measurement_id>/<subdir>``.

    Parameters
    ----------
    measurement_id : str
        Measurement id; used for the local directory name and in the error message.
    subdir : str
        Name of the sub-directory that receives the extracted files.
    download_url : str
        URL of the zip archive.

    Raises
    ------
    Exception
        If the server does not answer with a successful status.
    """
    # TODO: Make downloading more robust (e.g. in case that files do not exist on server).
    response = self.session.get(download_url, stream=True)

    if not response.ok:
        raise Exception("Could not download files for measurement '%s'" % measurement_id)

    # Create the dir if it does not exist
    local_dir = os.path.join(self.output_dir, measurement_id, subdir)
    if not os.path.exists(local_dir):
        os.makedirs(local_dir)

    # Collect the archive chunk by chunk, needed if the file is big.
    memory_file = BytesIO()
    for chunk in response.iter_content(chunk_size=1024):
        if chunk:  # filter out keep-alive new chunks
            memory_file.write(chunk)

    with ZipFile(memory_file) as zip_file:
        for zipped_name in zip_file.namelist():
            basename = os.path.basename(zipped_name)

            # Directory entries have an empty basename; there is nothing to write for them.
            if not basename:
                continue

            with open(os.path.join(local_dir, basename), 'wb') as f:
                f.write(zip_file.read(zipped_name))
victor@7 302
def download_hirelpp(self, measurement_id):
    """ Fetch the HiRElPP files of a measurement into the 'hirelpp' sub-directory.

    Download problems are logged and not propagated to the caller.
    """
    url = self.download_hirelpp_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'hirelpp', url)
    except Exception as error:  # best effort: report the problem and carry on
        message = "Could not download HiRElPP files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
ioannis@43 312
def download_cloudmask(self, measurement_id):
    """ Fetch the cloudmask files of a measurement into the 'cloudscreen' sub-directory.

    Download problems are logged and not propagated to the caller.
    """
    url = self.download_cloudmask_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'cloudscreen', url)
    except Exception as error:  # best effort: report the problem and carry on
        message = "Could not download cloudscreen files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
ioannis@43 322
def download_elpp(self, measurement_id):
    """ Fetch the preprocessed (ElPP) files of a measurement into the 'elpp' sub-directory.

    Download problems are logged and not propagated to the caller.
    """
    url = self.download_elpp_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elpp', url)
    except Exception as error:  # best effort: report the problem and carry on
        message = "Could not download ElPP files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
victor@7 332
def download_elda(self, measurement_id):
    """ Fetch the optical (ELDA) files of a measurement into the 'elda' sub-directory.

    Download problems are logged and not propagated to the caller.
    """
    url = self.download_elda_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elda', url)
    except Exception as error:  # best effort: report the problem and carry on
        message = "Could not download ELDA files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
victor@7 342
def download_plots(self, measurement_id):
    """ Fetch the profile graphs (ELDA plots) of a measurement into the 'elda_plots' sub-directory.

    Download problems are logged and not propagated to the caller.
    """
    url = self.download_plots_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elda_plots', url)
    except Exception as error:  # best effort: report the problem and carry on
        message = "Could not download ELDA plots. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
victor@7 352
def download_elic(self, measurement_id):
    """ Fetch the ELIC files of a measurement into the 'elic' sub-directory.

    Download problems are logged and not propagated to the caller.
    """
    url = self.download_elic_pattern.format(measurement_id)
    try:
        self.download_files(measurement_id, 'elic', url)
    except Exception as error:  # best effort: report the problem and carry on
        message = "Could not download ELIC files. Error message: {}".format(error)
        logger.error(message)
        logger.debug('Download exception:', exc_info=True)
ioannis@43 362
def download_eldec(self, measurement_id):
    """ Download ELDEC files for the measurement id into the 'eldec' sub-directory.

    The ELDA download URL pattern is used for now. Download problems are logged and not
    propagated to the caller.
    """
    # Construct the download url
    download_url = self.download_elda_pattern.format(measurement_id)  # ELDA pattern is used for now
    try:
        self.download_files(measurement_id, 'eldec', download_url)
    except Exception as e:  # best effort: report the problem and carry on
        logger.error("Could not download ELDEC files. Error message: {}".format(e))
        logger.debug('Download exception:', exc_info=True)
ioannis@43 372
def rerun_elpp(self, measurement_id, monitor=True):
    """ Ask the SCC to rerun the ElPP processing of a measurement.

    Nothing is submitted (and nothing is monitored) if the measurement is not found.

    Parameters
    ----------
    measurement_id : str
        The ID of the measurement to reprocess.
    monitor : bool
        If True, monitor_processing is called after the rerun request.
    """
    logger.debug("Started rerun_elpp procedure.")

    logger.debug("Getting measurement %s" % measurement_id)
    measurement, _ = self.get_measurement(measurement_id)

    if not measurement:
        return

    # Log the URL that is actually requested.
    logger.debug("Attempting to rerun ElPP through %s." % measurement.rerun_elpp_url)
    request = self.session.get(measurement.rerun_elpp_url, stream=True)

    if request.status_code != 200:
        logger.error(
            "Could not rerun processing for %s. Status code: %s" % (measurement_id, request.status_code))
    else:
        logger.info("Rerun-elpp command submitted successfully for id {}.".format(measurement_id))

    if monitor:
        self.monitor_processing(measurement_id)
victor@7 391
def rerun_all(self, measurement_id, monitor=True):
    """ Ask the SCC to rerun all processing steps of a measurement.

    Parameters
    ----------
    measurement_id : str
        The ID of the measurement to reprocess.
    monitor : bool
        If True, monitor_processing is called after the rerun request.
    """
    logger.debug("Started rerun_all procedure.")
    logger.debug("Getting measurement %s" % measurement_id)

    measurement, _ = self.get_measurement(measurement_id)
    if not measurement:
        return None

    rerun_url = measurement.rerun_all_url
    logger.debug("Attempting to rerun all processing through %s." % rerun_url)
    response = self.session.get(rerun_url, stream=True)

    if response.status_code == 200:
        logger.info("Rerun-all command submitted successfully for id {}.".format(measurement_id))
    else:
        logger.error("Could not rerun pre processing for %s. Status code: %s" %
                     (measurement_id, response.status_code))

    if monitor:
        self.monitor_processing(measurement_id)
victor@7 411
def process(self, filename, system_id, monitor, force_upload, delete_related, delay=0, cloudfree=False,
            rs_filename=None, lr_filename=None, ov_filename=None):
    """ Upload a file and, if requested, follow its processing until it finishes.

    Monitoring (which also downloads the produced files) is started only when `monitor` is
    True, no processing delay was requested and the upload returned a measurement id.
    In that case the result of monitor_processing is returned, otherwise None.
    """
    logger.info("--- Processing started on %s. ---" % datetime.datetime.now())

    logger.info("Uploading file.")
    upload_options = {'delay': delay,
                      'cloudfree': cloudfree,
                      'rs_filename': rs_filename,
                      'lr_filename': lr_filename,
                      'ov_filename': ov_filename}
    measurement_id = self.upload_file(filename, system_id, force_upload, delete_related, **upload_options)

    if not monitor:
        return None

    if delay > 0:
        logger.warning("Will not start monitoring, since a delay was specified: {} hours.".format(delay))
        return None

    if not measurement_id:
        return None

    logger.info("Monitoring processing.")
    return self.monitor_processing(measurement_id)
victor@7 436
def monitor_processing(self, measurement_id, retry_max=2, time_sleep=2, exit_if_missing=True, poll_interval=10):
    """ Monitor the processing progress of a measurement id and download its products.

    Parameters
    ----------
    measurement_id : str
        The measurement ID to monitor.
    retry_max : int
        Number of additional attempts made when the measurement cannot be retrieved from the API.
    time_sleep : int or float
        Seconds to wait between the attempts to find the measurement.
    exit_if_missing : bool
        If True, the program exits with status 1 when the measurement cannot be retrieved.
        If False, None is returned instead.
    poll_interval : int or float
        Seconds to wait between two status checks while the measurement is being processed.

    Returns
    -------
    : Measurement object or None
        The measurement in its final state, or None if it could not be retrieved.
    """
    max_attempts = retry_max + 1

    # Wait for the measurement to appear in the API. A user has reported that this does not
    # happen immediately after the upload.
    measurement = None
    logger.info("Looking for measurement %s on the SCC.", measurement_id)

    for attempt in range(1, max_attempts + 1):
        measurement, status = self.get_measurement(measurement_id)
        if status == 200:
            break
        logger.warning("Measurement not found.")
        if attempt < max_attempts:
            logger.warning("Waiting %ds.", time_sleep)
            time.sleep(time_sleep)

    logger.debug("Measurement: %s", measurement)

    if measurement is None:
        logger.error("Measurement %s doesn't seem to exist.", measurement_id)
        if exit_if_missing:
            sys.exit(1)
        return None

    logger.info('Measurement %s found.', measurement_id)

    failed_refreshes = 0
    while not measurement.has_finished:
        measurement.log_processing_status()
        time.sleep(poll_interval)
        refreshed, status = self.get_measurement(measurement_id)

        if refreshed is None:
            # A failed status request must not crash the monitoring; retry a few times first.
            failed_refreshes += 1
            if failed_refreshes > retry_max:
                logger.error("Could not refresh the status of measurement %s (last status code: %s).",
                             measurement_id, status)
                if exit_if_missing:
                    sys.exit(1)
                return None
            logger.warning("Could not refresh the status of measurement %s. Retrying.", measurement_id)
            continue

        failed_refreshes = 0
        measurement = refreshed

    logger.info("Measurement processing finished.")
    measurement.log_detailed_status()

    # A module status of 127 triggers the download of the corresponding products.
    if measurement.hirelpp == 127:
        logger.info("Downloading HiRElPP files.")
        self.download_hirelpp(measurement_id)
    if measurement.cloudmask == 127:
        logger.info("Downloading cloud screening files.")
        self.download_cloudmask(measurement_id)
    if measurement.elpp == 127:
        logger.info("Downloading ElPP files.")
        self.download_elpp(measurement_id)
    if measurement.elda == 127:
        logger.info("Downloading ELDA files.")
        self.download_elda(measurement_id)
        logger.info("Downloading ELDA plots.")
        self.download_plots(measurement_id)
    if measurement.elic == 127:
        logger.info("Downloading ELIC files.")
        self.download_elic(measurement_id)
    # NOTE(review): ELDEC is checked against 0 while all other modules are checked against 127 -- confirm.
    if measurement.is_calibration and measurement.eldec == 0:
        logger.info("Downloading ELDEC files.")
        self.download_eldec(measurement_id)
    logger.info("--- Processing finished. ---")

    return measurement
victor@7 499
def download_products(self, measurement, dir_name):
    """ Download all the products of a measurement (used only for E-SHAPE).

    During the download, ``self.output_dir`` is temporarily extended with `dir_name`; the
    original value is always restored, even if an error occurs.

    Parameters
    ----------
    measurement : Measurement object
        The measurement whose products are downloaded; its module status attributes decide
        which products are fetched.
    dir_name : str
        Text appended (followed by "/") to the current output directory.

    Returns
    -------
    : Measurement object
        The measurement passed as input.
    """
    measurement_id = measurement.id
    base_output_dir = self.output_dir
    # NOTE(review): plain string concatenation -- this appears to rely on output_dir ending
    # with a path separator; confirm with the callers.
    self.output_dir = base_output_dir + dir_name + "/"

    try:
        if measurement.hirelpp == 127:
            logger.info("Downloading HiRElPP files.")
            self.download_hirelpp(measurement_id)
        if measurement.cloudmask == 127:
            logger.info("Downloading cloud screening files.")
            self.download_cloudmask(measurement_id)
        if measurement.elpp == 127:
            logger.info("Downloading ElPP files.")
            self.download_elpp(measurement_id)
        if measurement.elda == 127:
            logger.info("Downloading ELDA files.")
            self.download_elda(measurement_id)
            logger.info("Downloading ELDA plots.")
            self.download_plots(measurement_id)
        if measurement.elic == 127:
            logger.info("Downloading ELIC files.")
            self.download_elic(measurement_id)
        if measurement.is_calibration and measurement.eldec == 0:
            logger.info("Downloading ELDEC files.")
            self.download_eldec(measurement_id)
        logger.info("--- Processing finished. ---")
    finally:
        # Never leave the instance pointing to the temporary output directory.
        self.output_dir = base_output_dir

    return measurement
claudio@68 530
def get_measurement(self, measurement_id):
    """ Get a measurement information from the SCC API.

    Parameters
    ----------
    measurement_id : str
        The measurement ID to search.

    Returns
    -------
    measurement : Measurement object or None
        If the measurement is found, a Measurement object is returned. If not, it is None.
    status_code : int or None
        The HTTP status code of the API response, or None if no request was made
        (i.e. when measurement_id is None).
    """
    # TODO: Consider to homogenize with get_ancillary method (i.e. always return a Measurement object).

    if measurement_id is None:
        # Callers unpack two values, so a pair is returned also when no request is made.
        return None, None

    # Access the API
    measurement_url = self.api_measurement_pattern.format(measurement_id)
    logger.debug("Measurement API URL: %s" % measurement_url)

    response = self.session.get(measurement_url)
    status_code = response.status_code

    measurement = None

    if status_code == 200:
        response_dict = response.json()
        if response_dict:
            measurement = Measurement(self.base_url, response_dict)
    elif status_code == 404:
        logger.info("No measurement with id %s found on the SCC." % measurement_id)
    else:
        # TODO: Implement better handling for status 401.
        logger.error('Could not access API. Status code %s.' % status_code)

    return measurement, status_code
victor@7 572
def delete_measurement(self, measurement_id, delete_related):
    """ Delete the measurement with the provided measurement id.

    The deletion is done through the admin pages of the web interface and NOT through the
    API, so the user should have the appropriate permissions (i.e. access to the admin site).

    Parameters
    ----------
    measurement_id : str
        The ID of the measurement to delete.
    delete_related : bool
        Answer submitted to the "delete related measurements" question of the confirmation form.

    Returns
    -------
    : True or None
        True if the measurement was deleted, None in all other cases.
    """
    measurement, _ = self.get_measurement(measurement_id)
    if measurement is None:
        logger.warning("Nothing to delete.")
        return None

    delete_url = self.delete_measurement_pattern.format(measurement_id)

    # The confirmation page must be opened first; its cookie carries the CSRF token.
    confirm_page = self.session.get(delete_url)
    if confirm_page.status_code != 200:
        logger.warning("Could not open delete page. Status: {0}".format(confirm_page.status_code))
        return None

    delete_related_option = 'delete_related' if delete_related else 'not_delete_related'
    form_data = {'post': 'yes',
                 'select_delete_related_measurements': delete_related_option}
    request_headers = {'X-CSRFToken': confirm_page.cookies['csrftoken'],
                       'referer': delete_url}

    delete_page = self.session.post(delete_url, data=form_data, headers=request_headers)
    if delete_page.ok:
        logger.info("Deleted measurement {0}".format(measurement_id))
        return True

    logger.warning("Something went wrong. Delete page status: {0}".format(
        delete_page.status_code))
    return None
victor@7 618
def available_measurements(self, start_gte=None, stop_lte=None, is_being_processed=None, is_queued=None):
    """ Get a list of available measurements on the SCC.

    Only the filters that are not None are sent to the API.

    Parameters
    ----------
    start_gte, stop_lte
        Values sent as the ``start__gte`` and ``stop__lte`` API filters.
    is_being_processed, is_queued
        Values sent as the ``is_being_processed`` and ``is_queued`` API filters.

    Returns
    -------
    : list of Measurement objects or None
        The measurements returned by the API, or None if no usable response was received.
    """
    filters = (('start__gte', start_gte),
               ('stop__lte', stop_lte),
               ('is_being_processed', is_being_processed),
               ('is_queued', is_queued))
    params = {key: value for key, value in filters if value is not None}

    response = self.session.get(self.api_measurements_url, params=params)

    if not response.ok:
        logger.error('Could not access API. Status code %s.' % response.status_code)
        return None

    try:
        response_dict = response.json()
    except ValueError:
        # The body was not valid JSON (e.g. an HTML error or login page).
        logger.warning("Invalid response received from the SCC when asked for available measurements.")
        return None

    if not response_dict:
        logger.warning("No response received from the SCC when asked for available measurements.")
        return None

    measurements = [Measurement(self.base_url, measurement_dict)
                    for measurement_dict in response_dict['objects']]
    logger.info("Found %s measurements on the SCC." % len(measurements))
    return measurements
victor@7 648
def list_measurements(self, id_exact=None, id_startswith=None,
                      start_exact=None, start_gte=None, start_lte=None,
                      stop_exact=None, stop_gte=None, stop_lte=None,
                      station_exact=None, station_in=None):
    """ Query the measurements API and return the raw response text.

    For each field (id, start, stop, station) an exact filter takes precedence: the other
    filters of the same field are sent only when the exact one is None. Filters that are
    None are not sent at all.
    """
    # TODO: Add some error handling, e.g. as per available_measurements method

    # Each entry: (exact filter, filters used only when the exact one is missing)
    filter_groups = (
        (('id__exact', id_exact), (('id__startswith', id_startswith),)),
        (('start__exact', start_exact), (('start__gte', start_gte), ('start__lte', start_lte))),
        (('stop__exact', stop_exact), (('stop__gte', stop_gte), ('stop__lte', stop_lte))),
        (('station__exact', station_exact), (('station__in', station_in),)),
    )

    params = {}
    for (exact_key, exact_value), fallbacks in filter_groups:
        if exact_value is not None:
            params[exact_key] = exact_value
            continue
        for key, value in fallbacks:
            if value is not None:
                params[key] = value

    response = self.session.get(self.api_measurements_url, params=params)
    return response.text
moritz@29 689
def measurement_id_for_date(self, t1, call_sign, base_number=0):
    """ Give the first available measurement id on the SCC for the specific date.

    Candidate ids are built as ``<YYYYMMDD><call_sign><NN>``, with NN a two-digit counter that starts
    at ``base_number``.

    Parameters
    ----------
    t1 : datetime-like
       Only its ``strftime('%Y%m%d')`` output is used.
    call_sign : str
       Appended to the date to form the id prefix.
    base_number : int
       First value of the counter to try.

    Returns
    -------
    : str or None
       The first id that is not in the list returned by the API, or None if the API answer is empty.

    Raises
    ------
    ValueError
       If the API returns 100 measurements for the prefix, or if no counter value up to 99 is free.
    """
    # TODO: Check if this method needs updating to handle all measurement_ID formats.
    base_id = "%s%s" % (t1.strftime('%Y%m%d'), call_sign)
    search_url = urlparse.urljoin(self.api_base_url, 'measurements/?id__startswith=%s' % base_id)

    response_dict = self.session.get(search_url).json()

    if not response_dict:
        return None

    measurement_list = response_dict['objects']

    if len(measurement_list) == 100:
        raise ValueError('No available measurement id found.')

    existing_ids = {measurement_dict['id'] for measurement_dict in measurement_list}

    # The counter has two digits only; never hand out an id with a longer suffix.
    for measurement_number in range(base_number, 100):
        measurement_id = "%s%02i" % (base_id, measurement_number)
        if measurement_id not in existing_ids:
            return measurement_id

    raise ValueError('No available measurement id found.')
victor@7 721
def get_ancillary(self, file_path, file_type):
    """
    Look up an ancillary file on the SCC API, searching by the base name of the given path.

    Parameters
    ----------
    file_path : str
       Path of the uploaded file. Only its base name is used in the search.
    file_type : str
       Type of ancillary file. One of 'sounding', 'overlap', 'lidarratio'.

    Returns
    -------
    ancillary_file : AncillaryFile or None
       The api object built from the first search result, or an empty AncillaryFile (built from None)
       if the search returned nothing. None if the API could not be accessed.
    status_code : int
       The HTTP status code of the API response.
    """
    assert file_type in ['sounding', 'overlap', 'lidarratio']

    base_name = os.path.basename(file_path)

    # Anything that is not 'sounding' or 'overlap' is searched as a lidar ratio file
    pattern_names = {'sounding': 'api_sounding_search_pattern',
                     'overlap': 'api_overlap_search_pattern'}
    search_pattern = getattr(self, pattern_names.get(file_type, 'api_lidarratio_search_pattern'))
    file_url = search_pattern.format(base_name)

    response = self.session.get(file_url)

    if not response.ok:
        logger.error('Could not access API. Status code %s.' % response.status_code)
        return None, response.status_code

    object_list = response.json()['objects']

    logger.debug("Ancillary file JSON: {0}".format(object_list))

    # Assume only one file is returned; with no result an empty object is created
    first_match = object_list[0] if object_list else None
    ancillary_file = AncillaryFile(self.api_base_url, first_match)

    return ancillary_file, response.status_code
i@38 767
def __enter__(self):
    """ Enter the ``with`` block; the object itself is bound to the ``as`` target. """
    return self
victor@7 770
def __exit__(self, *args):
    """ Leave the ``with`` block: close the session. The exception details in ``args`` are ignored. """
    logger.debug("Closing SCC connection session.")
    session = self.session
    session.close()
ioannis@43 774
class PageNotAccessibleError(RuntimeError):
    """ RuntimeError subclass with no behaviour of its own; the name suggests a page that could not be reached. """
ioannis@43 777
victor@7 778
class ApiObject(object):
    """ A generic class object.

    Every key/value pair of the API response dictionary becomes an attribute of the instance. The ``exists``
    attribute is True when a non-empty dictionary was supplied and False otherwise.
    """

    def __init__(self, base_url, dict_response):
        """
        Parameters
        ----------
        base_url : str
           Stored as ``self.base_url``.
        dict_response : dict or None
           The dictionary describing the object; None (or an empty dictionary) creates an empty object.
        """
        self.base_url = base_url

        if dict_response:
            # Add the dictionary key value pairs as object properties
            for key, value in dict_response.items():
                try:
                    setattr(self, key, value)
                except (AttributeError, TypeError):
                    # E.g. the key collides with a read-only property of a subclass. Only these errors are
                    # tolerated, so that KeyboardInterrupt / SystemExit are no longer swallowed.
                    logger.warning('Could not set attribute {0} to value {1}'.format(key, value))
            self.exists = True
        else:
            self.exists = False
victor@7 796
victor@7 797
class Measurement(ApiObject):
    """ This class represents the measurement object as returned in the SCC API.

    The attributes listed in __init__ are pre-set to None and then overwritten with the values
    of the API response dictionary by the parent class.
    """

    def __init__(self, base_url, dict_response):

        # Define expected attributes to assist debugging

        self.hirelpp = None
        self.hirelpp_exit_code = None
        self.cloudmask = None
        self.cloudmask_exit_code = None
        self.elpp = None
        self.elpp_exit_code = None
        self.elda = None
        self.elda_exit_code = None
        self.elic = None
        self.elic_exit_code = None
        self.eldec = None
        self.eldec_exit_code = None
        self.elquick = None
        self.elquick_exit_code = None

        self.id = None
        self.num_id = None
        self.is_calibration = None
        self.is_running = None
        self.is_queued = None

        self.resource_uri = None
        self.start = None
        self.stop = None
        self.system = None
        self.station = None
        self.upload = None

        super().__init__(base_url, dict_response)

    @property
    def has_finished(self):
        """ Temporary implementation for SCC version 5.2.0, until the API returns a flag indicating if the
        processing measurement has finished.

        True when ``is_running`` is False and at least one of ``hirelpp`` / ``elpp`` differs from 0.
        """
        return (self.is_running is False) and (self.hirelpp != 0 or self.elpp != 0)

    def log_processing_status(self):
        """ Log module status. """
        # The stray closing parenthesis of the original message has been removed.
        logger.info("Measurement is being processed. Status: {}, {}, {}, {}, {}, {}, {}. Please wait.".format(
            self.upload,
            self.hirelpp,
            self.cloudmask,
            self.elpp,
            self.elda,
            self.elic,
            self.elquick))

    def log_detailed_status(self):
        """ Log module exit and status codes.

        Calibration measurements report ElPP and ElDEC; all other measurements report
        HiRElPP, CloudScreen, ElPP, ELDA, ELIC and ELQuick.
        """
        # The id was passed to format() but the message had no placeholder for it.
        logger.info("Measurement {0} exit status:".format(self.id))
        if self.is_calibration:
            self._log_module_status('ElPP', self.elpp, self.elpp_exit_code)
            self._log_module_status('ElDEC', self.eldec, self.eldec_exit_code)
        else:
            self._log_module_status('HiRElPP', self.hirelpp, self.hirelpp_exit_code)
            self._log_module_status('CloudScreen', self.cloudmask, self.cloudmask_exit_code)
            self._log_module_status('ElPP', self.elpp, self.elpp_exit_code)
            self._log_module_status('ELDA', self.elda, self.elda_exit_code)
            self._log_module_status('ELIC', self.elic, self.elic_exit_code)
            self._log_module_status('ELQuick', self.elquick, self.elquick_exit_code)

    def _log_module_status(self, name, status, exit_code):
        """ Log the exit code of one module; exit codes above 0 are logged as warnings.

        ``exit_code`` is indexed with the 'exit_code' and 'description' keys when it is truthy.
        ``status`` is accepted but does not appear in the message.
        """
        if exit_code:
            if exit_code['exit_code'] > 0:
                logger.warning("{0} exit code: {2[exit_code]} - {2[description]}".format(name, status, exit_code))
            else:
                logger.info("{0} exit code: {2[exit_code]} - {2[description]}".format(name, status, exit_code))
        else:
            logger.info("{0} exit code: {2}".format(name, status, exit_code))

    @property
    def rerun_elda_url(self):
        """ URL of the rerun-elda page of this measurement, relative to ``base_url``. """
        url_pattern = urlparse.urljoin(self.base_url, 'data_processing/measurements/{0}/rerun-elda/')
        return url_pattern.format(self.id)

    @property
    def rerun_elpp_url(self):
        """ URL of the rerun-elpp page of this measurement, relative to ``base_url``. """
        url_pattern = urlparse.urljoin(self.base_url, 'data_processing/measurements/{0}/rerun-elpp/')
        return url_pattern.format(self.id)

    @property
    def rerun_all_url(self):
        """ URL of the rerun-all page of this measurement, relative to ``base_url``. """
        url_pattern = urlparse.urljoin(self.base_url, 'data_processing/measurements/{0}/rerun-all/')
        return url_pattern.format(self.id)

    def __str__(self):
        return "Measurement {}".format(self.id)
victor@7 896
victor@7 897
class AncillaryFile(ApiObject):
    """ This class represents the ancillary file object as returned in the SCC API.
    """

    @property
    def already_on_scc(self):
        """ False for an empty object or when ``status`` equals 'missing', True otherwise. """
        return (self.exists is not False) and (not self.status == 'missing')

    def __str__(self):
        fields = (self.id, self.filename, self.status)
        return "%s: %s, %s" % fields
i@38 913
i@38 914
# Shortcut functions that use the SCC class to perform specific tasks.
def process_file(filename, system_id, settings, force_upload, delete_related,
                 delay=0, cloudfree=False, monitor=True, rs_filename=None, lr_filename=None, ov_filename=None):
    """ Shortcut function to process a file to the SCC.

    Opens an SCC connection with the given settings, logs in, hands the file and all options to ``SCC.process``,
    logs out and returns whatever ``SCC.process`` returned.
    """
    logger.info("Processing file %s, using system %s" % (filename, system_id))

    processing_options = dict(force_upload=force_upload,
                              delete_related=delete_related,
                              delay=delay,
                              cloudfree=cloudfree,
                              monitor=monitor,
                              rs_filename=rs_filename,
                              lr_filename=lr_filename,
                              ov_filename=ov_filename)

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as connection:
        connection.login(settings['website_credentials'])
        measurement = connection.process(filename, system_id, **processing_options)
        connection.logout()

    return measurement
victor@7 934
victor@7 935
def delete_measurements(measurement_ids, delete_related, settings):
    """ Shortcut function to delete measurements from the SCC.

    Logs in once and calls ``SCC.delete_measurement`` for every id, in the given order.
    """
    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as connection:
        connection.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Deleting %s." % measurement_id)
            connection.delete_measurement(measurement_id, delete_related)

        connection.logout()
moritz@29 944
moritz@29 945
def rerun_all(measurement_ids, monitor, settings):
    """ Shortcut function to rerun measurements from the SCC.

    Logs in once and calls ``SCC.rerun_all`` for every id, in the given order.
    """
    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as connection:
        connection.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Rerunning all products for %s." % measurement_id)
            connection.rerun_all(measurement_id, monitor)

        connection.logout()
victor@7 955
victor@7 956
def rerun_processing(measurement_ids, monitor, settings):
    """ Shortcut function to rerun the ElPP processing of measurements on the SCC.

    Logs in once and calls ``SCC.rerun_elpp`` for every id, in the given order.
    """
    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as connection:
        connection.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            logger.info("Rerunning (optical) processing for %s" % measurement_id)
            connection.rerun_elpp(measurement_id, monitor)

        connection.logout()
moritz@29 966
moritz@29 967
def list_measurements(settings, id_exact=None, id_startswith=None,
                      start_exact=None, start_gte=None, start_lte=None,
                      stop_exact=None, stop_gte=None, stop_lte=None,
                      station_exact=None, station_in=None):
    """ Print the API response text for the measurements matching the given filters.

    All filters are forwarded unchanged to ``SCC.list_measurements``.
    """
    filters = dict(id_exact=id_exact, id_startswith=id_startswith,
                   start_exact=start_exact, start_gte=start_gte, start_lte=start_lte,
                   stop_exact=stop_exact, stop_gte=stop_gte, stop_lte=stop_lte,
                   station_exact=station_exact, station_in=station_in)

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as connection:
        connection.login(settings['website_credentials'])

        print(connection.list_measurements(**filters))

        connection.logout()
victor@7 983
victor@7 984
def download_measurements(measurement_ids, max_retries, exit_if_missing, settings):
    """ Call ``SCC.monitor_processing`` for each of the specified IDs.

    ``max_retries`` is passed as ``retry_max`` and ``exit_if_missing`` is passed through;
    the sleep time between checks is fixed to 3.
    """
    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as connection:
        connection.login(settings['website_credentials'])

        for measurement_id in measurement_ids:
            connection.monitor_processing(measurement_id,
                                          retry_max=max_retries,
                                          time_sleep=3,
                                          exit_if_missing=exit_if_missing)

        connection.logout()
i@14 993
i@14 994
def eshape_downloader(settings):
    """ Download the products of recent measurements into the matching E-SHAPE folders.

    The sub-folders of ``settings['output_dir']`` whose names match ``<6 digits>_<12 digits>`` are scanned.
    The 12 digits are read as a start time (``%Y%m%d%H%M``). For every folder whose start time is not older
    than three days, the measurements between that start time and now are requested from the SCC and
    ``SCC.download_products`` is called for each of them with the folder name.

    Folders whose name matches the pattern but does not contain a valid start time are skipped with a warning.
    """
    eshape_dir = settings['output_dir']
    # Raw string: '\d' in a normal string literal is an invalid escape sequence.
    folders_pattern = re.compile(r"^(\d{6}_{1}\d{12})+$")

    # The context manager releases the directory handle as soon as the listing is done.
    with os.scandir(eshape_dir) as entries:
        directories = [entry.name for entry in entries
                       if entry.is_dir() and folders_pattern.match(entry.name)]

    time_format = "%Y-%m-%dT%H:%M:%S"

    for dir_name in directories:
        start_string = dir_name.split("_")[1]
        try:
            date_time_start = datetime.datetime.strptime(start_string, '%Y%m%d%H%M')
        except ValueError:
            # One badly named folder should not stop the download for all the others.
            logger.warning("Skipping folder %s: no valid start time in its name." % dir_name)
            continue

        date_time_stop = datetime.datetime.now()
        if date_time_start < date_time_stop - datetime.timedelta(days=3):
            continue

        start_parameter = date_time_start.strftime(time_format)
        stop_parameter = date_time_stop.strftime(time_format)

        with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as scc:
            scc.login(settings['website_credentials'])

            measurements = scc.available_measurements(start_gte=start_parameter, stop_lte=stop_parameter)
            if measurements is not None:
                for meas in measurements:
                    scc.download_products(meas, dir_name)

            scc.logout()
claudio@68 1018
claudio@68 1019
def automatic_upload(settings):
    """ Download the products of the measurements of the last day that are neither queued nor being processed.

    The measurements between one day ago and now are requested from the SCC with ``is_queued=False`` and
    ``is_being_processed=False``; ``SCC.download_products`` is called for each of them with an empty
    second argument.
    """
    time_format = "%Y-%m-%dT%H:%M:%S"
    one_day_ago = datetime.datetime.now() - datetime.timedelta(days=1)
    start_parameter = one_day_ago.strftime(time_format)
    stop_parameter = datetime.datetime.now().strftime(time_format)

    with SCC(settings['basic_credentials'], settings['output_dir'], settings['base_url']) as connection:
        connection.login(settings['website_credentials'])

        found = connection.available_measurements(start_gte=start_parameter,
                                                  stop_lte=stop_parameter,
                                                  is_queued=False,
                                                  is_being_processed=False)
        if found is not None:
            for measurement in found:
                connection.download_products(measurement, "")

        connection.logout()
claudio@70 1035
claudio@70 1036
def settings_from_path(config_file_path):
    """ Load the settings dictionary from a configuration file in YAML syntax.

    The 'basic_credentials' and 'website_credentials' entries are converted to tuples.

    Raises
    ------
    argparse.ArgumentTypeError
       If the path is not an existing file, or if the file cannot be parsed.
    """
    if os.path.isfile(config_file_path) is False:
        raise argparse.ArgumentTypeError("Wrong path for configuration file (%s)" % config_file_path)

    with open(config_file_path) as config_file:
        try:
            settings = yaml.safe_load(config_file)
            logger.debug("Read settings file(%s)" % config_file_path)
        except Exception:
            raise argparse.ArgumentTypeError("Could not parse YAML file (%s)" % config_file_path)

    # YAML limitation: does not read tuples
    for credentials_key in ('basic_credentials', 'website_credentials'):
        settings[credentials_key] = tuple(settings[credentials_key])

    return settings
i@14 1056
i@14 1057
moritz@29 1058 # Setup for command specific parsers
def setup_delete(parser):
    """ Configure the parser of the "delete" command: one or more measurement IDs. """

    def delete_from_args(parsed):
        # Related files are never deleted from the command line
        delete_measurements(parsed.IDs,
                            delete_related=False,
                            settings=parsed.config)

    parser.set_defaults(execute=delete_from_args)
    parser.add_argument("IDs", nargs="+", help="measurement IDs to delete.")
moritz@29 1067
moritz@29 1068
def setup_rerun_all(parser):
    """ Configure the parser of the "rerun-all" command: measurement IDs and the -p/--process flag. """

    def rerun_all_from_args(parsed):
        measurement_ids, monitor, settings = parsed.IDs, parsed.process, parsed.config
        rerun_all(measurement_ids, monitor, settings)

    parser.add_argument("IDs", nargs="+", help="Measurement IDs to rerun.")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the results of the processing.")
    parser.set_defaults(execute=rerun_all_from_args)
moritz@29 1077
moritz@29 1078
def setup_rerun_elpp(parser):
    """ Configure the parser of the "rerun-elpp" command: measurement IDs and the -p/--process flag. """

    def rerun_processing_from_args(parsed):
        measurement_ids, monitor, settings = parsed.IDs, parsed.process, parsed.config
        rerun_processing(measurement_ids, monitor, settings)

    parser.add_argument("IDs", nargs="+", help="Measurement IDs to rerun the processing on.")
    parser.add_argument("-p", "--process", action="store_true",
                        help="Wait for the results of the processing.")
    parser.set_defaults(execute=rerun_processing_from_args)
moritz@29 1087
moritz@29 1088
def setup_upload_file(parser):
    """ Configure the parser of the "upload-file" command.

    The file is uploaded through process_file; processing is monitored only if -p/--process is given.
    """

    def upload_file_from_args(parsed):
        process_file(parsed.filename, parsed.system, parsed.config,
                     delay=parsed.delay,
                     cloudfree=parsed.cloudfree,
                     monitor=parsed.process,
                     force_upload=parsed.force_upload,
                     delete_related=False,  # For now, use this as default
                     rs_filename=parsed.radiosounding,
                     ov_filename=parsed.overlap,
                     lr_filename=parsed.lidarratio)

    def delay(arg):
        # argparse type converter: an integer number of hours within [0, 96]
        try:
            hours = int(arg)
        except ValueError:
            raise argparse.ArgumentTypeError("Could not convert delay argument {} to integer.".format(arg))

        if hours < 0 or hours > 96:
            raise argparse.ArgumentTypeError("Delay should be an integer between 0 and 96.")

        return hours

    add = parser.add_argument

    add("filename", help="Measurement file name or path.")
    add("system", help="Processing system id.")
    add("--delay", default=0, type=delay,
        help="Delay processing by the specified number of hours (0 to 96).")
    add("--cloudfree", action="store_true", default=False,
        help="Manually assume this measurement as cloud free.")
    add("-p", "--process", action="store_true",
        help="Wait for the processing results.")
    add("--force_upload", action="store_true",
        help="If measurement ID exists on SCC, delete before uploading.")
    add("--radiosounding", default=None, help="Radiosounding file name or path")
    add("--overlap", default=None, help="Overlap file name or path")
    add("--lidarratio", default=None, help="Lidar ratio file name or path")

    parser.set_defaults(execute=upload_file_from_args)
moritz@29 1129
moritz@29 1130
def setup_list_measurements(parser):
    """ Configure the parser of the "list" command.

    All options are optional filters that are forwarded to list_measurements. The two id options exclude
    each other, and so do the two station options.
    """

    def list_measurements_from_args(parsed):
        list_measurements(parsed.config, id_exact=parsed.id_exact, id_startswith=parsed.id_startswith,
                          start_exact=parsed.start_exact, start_gte=parsed.start_gte, start_lte=parsed.start_lte,
                          stop_exact=parsed.stop_exact, stop_gte=parsed.stop_gte, stop_lte=parsed.stop_lte,
                          station_exact=parsed.station_exact, station_in=parsed.station_in)

    group = parser.add_argument_group()

    group_id = group.add_mutually_exclusive_group()
    group_id.add_argument("--id_exact", help="Exact measurement id.")
    group_id.add_argument("--id_startswith", help="Initial part of measurement id.")

    # Argument groups are created on the parser itself: calling add_argument_group() on another argument
    # group is deprecated since Python 3.11 and is rejected by newer versions of argparse.
    group_start = parser.add_argument_group()
    group_start.add_argument("--start_exact", help="Exact start date of the measurement.")
    group_start.add_argument("--start_gte", help="Start date of the measurement after the given date.")
    group_start.add_argument("--start_lte", help="Start date of the measurement before the given date.")

    group_stop = parser.add_argument_group()
    group_stop.add_argument("--stop_exact", help="Exact stop date of the measurement.")
    group_stop.add_argument("--stop_gte", help="Stop date of the measurement after the given date.")
    group_stop.add_argument("--stop_lte", help="Stop date of the measurement before the given date.")

    group_station = group.add_mutually_exclusive_group()
    group_station.add_argument("--station_exact", help="Station the performed the measurement.")
    group_station.add_argument("--station_in",
                               help="List of stations (separated by comma) that performed the measurement.")

    parser.set_defaults(execute=list_measurements_from_args)
moritz@29 1159
moritz@29 1160
def setup_download_measurements(parser):
    """ Configure the parser of the "download" command.

    Note that --ignore_errors is a "store_false" flag: the parsed value is True unless the flag is given,
    and it is handed to download_measurements as its ``exit_if_missing`` argument.
    """

    def download_measurements_from_args(parsed):
        exit_if_missing = parsed.ignore_errors
        download_measurements(parsed.IDs, parsed.max_retries, exit_if_missing, parsed.config)

    parser.add_argument("IDs", nargs="+", help="Measurement IDs that should be downloaded.")
    parser.add_argument("--max_retries", type=int, default=0,
                        help="Number of times to retry in cases of missing measurement id.")
    parser.add_argument("--ignore_errors", action="store_false",
                        help="Ignore errors when downloading multiple measurements.")
    parser.set_defaults(execute=download_measurements_from_args)
moritz@29 1171
moritz@29 1172
def setup_eshape_downloader(parser):
    """ Configure the parser of the "eshape-downloader" command, which takes no arguments of its own. """

    def run_eshape_downloader(parsed):
        settings = parsed.config
        eshape_downloader(settings)

    parser.set_defaults(execute=run_eshape_downloader)
claudio@68 1178
claudio@68 1179
def setup_automatic_upload(parser):
    """ Configure the parser of the "automatic-upload" command, which takes no arguments of its own. """

    def run_automatic_upload(parsed):
        settings = parsed.config
        automatic_upload(settings)

    parser.set_defaults(execute=run_automatic_upload)
claudio@70 1185
claudio@70 1186
def main():
    """ Command line entry point: parse the arguments, configure logging and run the selected command.

    Every command has its own sub-parser, configured by the matching setup_* function, which stores the
    function to run as the ``execute`` default. If no command is given, the parser exits with a usage error.
    """
    # Define the command line arguments.
    parser = argparse.ArgumentParser()
    subparsers = parser.add_subparsers()

    commands = (
        ("delete", "Deletes a measurement.", setup_delete),
        ("rerun-all", "Rerun all processing steps for the provided measurement IDs.", setup_rerun_all),
        ("rerun-elpp", "Rerun low-resolution processing steps for the provided measurement ID.",
         setup_rerun_elpp),
        ("upload-file", "Submit a file and, optionally, download the output products.", setup_upload_file),
        ("list", "List measurements registered on the SCC.", setup_list_measurements),
        ("download", "Download selected measurements.", setup_download_measurements),
        ("eshape-downloader", "Search and download relevant products for E-SHAPE.", setup_eshape_downloader),
        ("automatic-upload", "Select and download products available for the upload to EARLINET db.",
         setup_automatic_upload),
    )
    for command_name, command_help, setup_command in commands:
        setup_command(subparsers.add_parser(command_name, help=command_help))

    # Verbosity settings from http://stackoverflow.com/a/20663028
    parser.add_argument('-d', '--debug', help="Print debugging information.", action="store_const",
                        dest="loglevel", const=logging.DEBUG, default=logging.INFO,
                        )
    parser.add_argument('-s', '--silent', help="Show only warning and error messages.", action="store_const",
                        dest="loglevel", const=logging.WARNING
                        )

    # Setup default config location
    home = os.path.expanduser("~")
    default_config_location = os.path.abspath(os.path.join(home, ".scc_access.yaml"))
    parser.add_argument("-c", "--config", help="Path to the config file.", type=settings_from_path,
                        default=default_config_location)

    args = parser.parse_args()

    # Get the logger with the appropriate level
    logging.basicConfig(format='%(levelname)s: %(message)s', level=args.loglevel)

    # Sub-commands are optional for argparse, so 'execute' is missing when none was given.
    execute = getattr(args, 'execute', None)
    if execute is None:
        parser.error("No command specified. Use -h to list the available commands.")

    # Dispatch to appropriate function
    execute(args)
moritz@29 1235
i@14 1236
# Run the command line interface when the module is executed as a script
if __name__ == "__main__":
    main()

mercurial