Source code for casaconfig.private.get_data_info

# Copyright 2023 AUI, Inc. Washington DC, USA
#
#   Licensed under the Apache License, Version 2.0 (the "License");
#   you may not use this file except in compliance with the License.
#   You may obtain a copy of the License at
#
#       http://www.apache.org/licenses/LICENSE-2.0
#
#   Unless required by applicable law or agreed to in writing, software
#   distributed under the License is distributed on an "AS IS" BASIS,
#   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#   See the License for the specific language governing permissions and
#   limitations under the License.
"""
this module will be included in the api
"""

[docs]def get_data_info(path=None, logger=None, type=None): """ Get the summary information on the 3 types of data managed by casaconfig. The return value is a dictionary by type of data : 'casarundata', 'measures', and 'release'. Each type is itself a dictionary as described below. The path is the location to use to search for the installed release information. The path argument defaults to config.measurespath when not set. The return value can be limited to just a specific type using the type argument ('casarundata', 'measures', 'release'). In that case the returned value is the dictionary for just the requested type. When type is None (the default) the full set of dictionaries is returned. The 'casarundata' and 'measures' dictionaries contain 'version' and 'date' where version is the version string and date is the date when it was installed. These values are taken from the readme.txt file for each type. For 'casarundata' an additional field of 'manifest' is present which is the list of files that have been installed for that specific version (this will be empty for an unknown or invalid version). The measures dictionary also contains a 'site' field which holds the URL of the site that supplied that version. For older readme files that lack any site infromation the site is assumed to be the astron site. The 'release' dictionary comes from the release_data_readme.txt file which is copied into place when a modular CASA is built. It consists of 'casarundata' and 'measures' dictionaries where each dictionary contains the 'version' string and 'date' that that version was created for the described release. This allows casaconfig to install that casarundata version for testing purposes. The release information does not depend on the path argument since it is found in the casaconfig module. If path is empty or does not exist then the return value for the 'casarundata' and 'measures' types is None. If no readme.txt file can be found at path but the contents of path have the directories expected for casarundata then the version returned for 'casarundata' is 'unknown' and the date is an empty string. In that case the path may contain casarundata from a legacy installation of CASA data. CASA will be able to use the files at this location but they can not be maintained by casaconfig. If the path is not empty (except for a possible lock file while it's in use but does not appear to contain legacy casarundata or the readme.txt file found there can not be read as expected then the version is 'invalid'. If no readme.txt file can be found for the measures at path/geodetic but both the geodetic and ephemeris directories are present in path then the version returned for 'measures' is 'unknown' and the date is an empty string. The path location may contain measures data from a legacy installation of CASA data. CASA will be able to use any measures tables at this location by they can not be maintained by casaconfig. If the path is not empty but does not appear to contain legacy measures data or the readme.txt file found in path/geodetic can not be read as expected then the version is 'invalid'. If no casadata release information is found or the contents are unexpected the returned value for 'release' is None and the "--reference-testing" option will not do anything for this installation of casaconfig. This will be the case for a modular installation. If path has not been set (has a value of None) then the returned value will be None. This likely means that a casasiteconfig.py exists but has not yet been edited to set measurespath. Parameters - path (str) - Folder path to find the casarundata and measures data information. If not set then config.measurespath is used. - logger (casatools.logsink=None) - Instance of the casalogger to use for writing messages. Default None writes messages to the terminal. - type (str) - the specific type of data info to return (None, 'casarundata', 'measures', 'release'; None returns a dictionary of all types) Returns - a dictionary by type, 'casarundata', 'measures', 'release' where each type is a dictionary containing 'version' and 'date'. A return value of None indicates path is unset. A value of None for that type means no information could be found about that type. If a specific type is requested then only the dictionary for that type is returned (or None if that type can not be found). Raises - casaconfig.UnsetMeasurespath - path is None and has not been set in config - ValueError - raised when type has an invalid value """ result = None import os import time import importlib.resources from .print_log_messages import print_log_messages from .read_readme import read_readme from casaconfig import UnsetMeasurespath from casaconfig import BadReadme currentTime = time.time() secondsPerDay = 24. * 60. * 60. if path is None: from .. import config as _config path = _config.measurespath if path is None: raise UnsetMeasurespath('get_data_info: path is None and has not been set in config.measurespath. Provide a valid path and retry.') path = os.path.abspath(os.path.expanduser(path)) result = {'casarundata':None, 'measures':None, 'release':None} if type is not None and type not in result: raise ValueError("invalid type %s; must be one of None, 'casarundata', 'measures', 'release'" % type) # casarundata and measures if os.path.isdir(path) and (len(os.listdir(path))>0): # if the only thing at path is the lock file then proceed as if path is empty - skip this section pathfiles = os.listdir(path) if len(pathfiles) == 1 and pathfiles[0] == "data_update.lock": pass else: # there's something at path, look for the casarundata readme if type is None or type=='casarundata': datareadme_path = os.path.join(path,'readme.txt') if os.path.exists(datareadme_path): # the readme exists, get the info result['casarundata'] = {'version':'error', 'date':'', 'manifest':[], 'age':None} try: readmeContents = read_readme(datareadme_path) if readmeContents is not None: currentAge = (currentTime - os.path.getmtime(datareadme_path)) / secondsPerDay currentVersion = readmeContents['version'] currentDate = readmeContents['date'] # the manifest ('extra') must exist with at least 1 entry, otherwise this is no a valid readme file and the version should be 'error' if len(readmeContents['extra']) > 0: result['casarundata'] = {'version':currentVersion, 'date':currentDate, 'manifest':readmeContents['extra'], 'age':currentAge} except BadReadme as exc: # put the exception string into the version so it shows up in the summary resulte['casarundata']['version'] = "error: " + str(exc) else: # does it look like it's probably casarundata? expected_dirs = ['alma','catalogs','demo','ephemerides','geodetic','gui','nrao'] ok = True for d in expected_dirs: if not os.path.isdir(os.path.join(path,d)): ok = False if ok: # probably casarundata result['casarundata'] = {'version':'unknown', 'date':'', 'manifest': None,'age':None} else: # probably not casarundata # this is invalid, unexpected things are happening there result['casarundata'] = {'version':'invalid', 'date':'', 'manifest': None, 'age':None} if type is None or type=='measures': # look for the measures readme measuresreadme_path = os.path.join(path,'geodetic/readme.txt') if os.path.exists(measuresreadme_path): # the readme exists, get the info result['measures'] = {'site':'', 'version':'error', 'date':'', 'age':None} try: readmeContents = read_readme(measuresreadme_path) if readmeContents is not None: currentSite = readmeContents['site'] if currentSite is None: currentSite = 'https://www.astron.nl/iers/' currentVersion = readmeContents['version'] currentDate = readmeContents['date'] currentAge = (currentTime - os.path.getmtime(measuresreadme_path)) / secondsPerDay result['measures'] = {'site':currentSite,'version':currentVersion,'date':currentDate,'age':currentAge} except BadReadme as exc: # put the exception string into the version so it shows up in the summary result['measures']['version'] = "error: " + str(exc) else: # does it look like it's probably measuresdata? # path should have ephemerides and geodetic directories if os.path.isdir(os.path.join(path,'ephemerides')) and os.path.isdir(os.path.join(path,'geodetic')): result['measures'] = {'site':'unknown', 'version':'unknown', 'date':'', 'age':None} else: # probably not measuresdata result['measures'] = {'site':'', 'version':'invalid', 'date':'', 'age':None} if type is None or type=='release': # release data versions if importlib.resources.files('casaconfig').joinpath('release_data_readme.txt').is_file(): try: casarundataVersion = None measuresVersion = None ok = True reason = None readme_lines = importlib.resources.read_text('casaconfig','release_data_readme.txt').split('\n') for readmeLine in readme_lines: # lines must contain something and not start with # if len(readmeLine) > 0 and readmeLine[0] != '#': splitLine = readmeLine.split(':') if len(splitLine) == 2: lineType = splitLine[0].strip() lineVers = splitLine[1].strip() if lineType == 'casarundata': if casarundataVersion is not None: ok = False reason = "duplicate casarundata lines" break casarundataVersion = lineVers elif lineType == 'measures': if measuresVersion is not None: ok = False reason = "duplicate measures line" break measuresVersion = lineVers else: ok = False reason = "Unexpected type : %s" % lineType break else: ok = False reason = "Missing or too many ':' separators" if (casarundataVersion is None or measuresVersion is None) and ok: ok = False reason = "missing one or more version strings for expected casarundata and measures types" if not ok: print_log_messages("Incorrectly formatted release_data_readme.txt. %s" % reason, logger, True) # leave 'release' as None else: result['release'] = {'casarundata':casarundataVersion, 'measures':measuresVersion} except: print("Unexpected error reading release_data_readme.txt") # leave 'release' as None else: # no release information available, probably a modular install only # leave 'release' as None pass if type is not None: result = result[type] return result