diff options
Diffstat (limited to 'weather-2.3/weather.py')
-rw-r--r-- | weather-2.3/weather.py | 2135 |
1 files changed, 2135 insertions, 0 deletions
diff --git a/weather-2.3/weather.py b/weather-2.3/weather.py new file mode 100644 index 0000000..b5b71a1 --- /dev/null +++ b/weather-2.3/weather.py @@ -0,0 +1,2135 @@ +"""Contains various object definitions needed by the weather utility.""" + +weather_copyright = """\ +# Copyright (c) 2006-2016 Jeremy Stanley <fungi@yuggoth.org>. Permission to +# use, copy, modify, and distribute this software is granted under terms +# provided in the LICENSE file distributed with this software. +#""" + +weather_version = "2.3" + +radian_to_km = 6372.795484 +radian_to_mi = 3959.871528 + +def pyversion(ref=None): + """Determine the Python version and optionally compare to a reference.""" + import platform + ver = platform.python_version() + if ref: + return [ + int(x) for x in ver.split(".")[:2] + ] >= [ + int(x) for x in ref.split(".")[:2] + ] + else: return ver + +class Selections: + """An object to contain selection data.""" + def __init__(self): + """Store the config, options and arguments.""" + self.config = get_config() + self.options, self.arguments = get_options(self.config) + if self.get_bool("cache") and self.get_bool("cache_search") \ + and not self.get_bool("longlist"): + integrate_search_cache( + self.config, + self.get("cachedir"), + self.get("setpath") + ) + if not self.arguments: + if "id" in self.options.__dict__ \ + and self.options.__dict__["id"]: + self.arguments.append( self.options.__dict__["id"] ) + del( self.options.__dict__["id"] ) + import sys + message = "WARNING: the --id option is deprecated and will eventually be removed\n" + sys.stderr.write(message) + elif "city" in self.options.__dict__ \ + and self.options.__dict__["city"] \ + and "st" in self.options.__dict__ \ + and self.options.__dict__["st"]: + self.arguments.append( + "^%s city, %s" % ( + self.options.__dict__["city"], + self.options.__dict__["st"] + ) + ) + del( self.options.__dict__["city"] ) + del( self.options.__dict__["st"] ) + import sys + message = "WARNING: the --city/--st options are deprecated and will eventually be removed\n" + sys.stderr.write(message) + def get(self, option, argument=None): + """Retrieve data from the config or options.""" + if argument: + if self.config.has_section(argument) and ( + self.config.has_option(argument, "city") \ + or self.config.has_option(argument, "id") \ + or self.config.has_option(argument, "st") + ): + self.config.remove_section(argument) + import sys + message = "WARNING: the city/id/st options are now unsupported in aliases\n" + sys.stderr.write(message) + if not self.config.has_section(argument): + guessed = guess( + argument, + path=self.get("setpath"), + info=self.get("info"), + cache_search=( + self.get("cache") and self.get("cache_search") + ), + cachedir=self.get("cachedir"), + quiet=self.get_bool("quiet") + ) + self.config.add_section(argument) + for item in guessed.items(): + self.config.set(argument, *item) + if self.config.has_option(argument, option): + return self.config.get(argument, option) + if option in self.options.__dict__: + return self.options.__dict__[option] + else: + import os, sys + message = "%s error: no URI defined for %s\n" % ( + os.path.basename( sys.argv[0] ), + option + ) + sys.stderr.write(message) + exit(1) + def get_bool(self, option, argument=None): + """Get data and coerce to a boolean if necessary.""" + return bool(self.get(option, argument)) + def getint(self, option, argument=None): + """Get data and coerce to an integer if necessary.""" + value = self.get(option, argument) + if value: return int(value) + else: return 0 + +def average(coords): + """Average a list of coordinates.""" + x = 0 + y = 0 + for coord in coords: + x += coord[0] + y += coord[1] + count = len(coords) + return (x/count, y/count) + +def filter_units(line, units="imperial"): + """Filter or convert units in a line of text between US/UK and metric.""" + import re + # filter lines with both pressures in the form of "X inches (Y hPa)" or + # "X in. Hg (Y hPa)" + dual_p = re.match( + "(.* )(\d*(\.\d+)? (inches|in\. Hg)) \((\d*(\.\d+)? hPa)\)(.*)", + line + ) + if dual_p: + preamble, in_hg, i_fr, i_un, hpa, h_fr, trailer = dual_p.groups() + if units == "imperial": line = preamble + in_hg + trailer + elif units == "metric": line = preamble + hpa + trailer + # filter lines with both temperatures in the form of "X F (Y C)" + dual_t = re.match( + "(.* )(-?\d*(\.\d+)? F) \((-?\d*(\.\d+)? C)\)(.*)", + line + ) + if dual_t: + preamble, fahrenheit, f_fr, celsius, c_fr, trailer = dual_t.groups() + if units == "imperial": line = preamble + fahrenheit + trailer + elif units == "metric": line = preamble + celsius + trailer + # if metric is desired, convert distances in the form of "X mile(s)" to + # "Y kilometer(s)" + if units == "metric": + imperial_d = re.match( + "(.* )(\d+)( mile\(s\))(.*)", + line + ) + if imperial_d: + preamble, mi, m_u, trailer = imperial_d.groups() + line = preamble + str(int(round(int(mi)*1.609344))) \ + + " kilometer(s)" + trailer + # filter speeds in the form of "X MPH (Y KT)" to just "X MPH"; if metric is + # desired, convert to "Z KPH" + imperial_s = re.match( + "(.* )(\d+)( MPH)( \(\d+ KT\))(.*)", + line + ) + if imperial_s: + preamble, mph, m_u, kt, trailer = imperial_s.groups() + if units == "imperial": line = preamble + mph + m_u + trailer + elif units == "metric": + line = preamble + str(int(round(int(mph)*1.609344))) + " KPH" + \ + trailer + imperial_s = re.match( + "(.* )(\d+)( MPH)( \(\d+ KT\))(.*)", + line + ) + if imperial_s: + preamble, mph, m_u, kt, trailer = imperial_s.groups() + if units == "imperial": line = preamble + mph + m_u + trailer + elif units == "metric": + line = preamble + str(int(round(int(mph)*1.609344))) + " KPH" + \ + trailer + # if imperial is desired, qualify given forcast temperatures like "X F"; if + # metric is desired, convert to "Y C" + imperial_t = re.match( + "(.* )(High |high |Low |low )(\d+)(\.|,)(.*)", + line + ) + if imperial_t: + preamble, parameter, fahrenheit, sep, trailer = imperial_t.groups() + if units == "imperial": + line = preamble + parameter + fahrenheit + " F" + sep + trailer + elif units == "metric": + line = preamble + parameter \ + + str(int(round((int(fahrenheit)-32)*5/9))) + " C" + sep \ + + trailer + # hand off the resulting line + return line + +def get_uri( + uri, + ignore_fail=False, + cache_data=False, + cacheage=900, + cachedir="." +): + """Return a string containing the results of a URI GET.""" + if pyversion("3"): + import urllib, urllib.error, urllib.request + URLError = urllib.error.URLError + urlopen = urllib.request.urlopen + else: + import urllib2 as urllib + URLError = urllib.URLError + urlopen = urllib.urlopen + import os, time + if cache_data: + dcachedir = os.path.join( os.path.expanduser(cachedir), "datacache" ) + if not os.path.exists(dcachedir): + try: os.makedirs(dcachedir) + except (IOError, OSError): pass + dcache_fn = os.path.join( + dcachedir, + uri.split(":")[1].replace("/","_") + ) + now = time.time() + if cache_data and os.access(dcache_fn, os.R_OK) \ + and now-cacheage < os.stat(dcache_fn).st_mtime <= now: + dcache_fd = open(dcache_fn) + data = dcache_fd.read() + dcache_fd.close() + else: + try: + if pyversion("3"): data = urlopen(uri).read().decode("utf-8") + else: data = urlopen(uri).read() + except URLError: + if ignore_fail: return "" + else: + import os, sys, traceback + message = "%s error: failed to retrieve\n %s\n %s" % ( + os.path.basename( sys.argv[0] ), + uri, + traceback.format_exception_only( + sys.exc_type, + sys.exc_value + )[0] + ) + sys.stderr.write(message) + sys.exit(1) + if cache_data: + try: + import codecs + dcache_fd = codecs.open(dcache_fn, "w", "utf-8") + dcache_fd.write(data) + dcache_fd.close() + except (IOError, OSError): pass + return data + +def get_metar( + uri=None, + verbose=False, + quiet=False, + headers=None, + imperial=False, + metric=False, + cache_data=False, + cacheage=900, + cachedir="." +): + """Return a summarized METAR for the specified station.""" + if not uri: + import os, sys + message = "%s error: METAR URI required for conditions\n" % \ + os.path.basename( sys.argv[0] ) + sys.stderr.write(message) + sys.exit(1) + metar = get_uri( + uri, + cache_data=cache_data, + cacheage=cacheage, + cachedir=cachedir + ) + if pyversion("3") and type(metar) is bytes: metar = metar.decode("utf-8") + if verbose: return metar + else: + import re + lines = metar.split("\n") + if not headers: + headers = \ + "relative_humidity," \ + + "precipitation_last_hour," \ + + "sky conditions," \ + + "temperature," \ + + "heat index," \ + + "windchill," \ + + "weather," \ + + "wind" + headerlist = headers.lower().replace("_"," ").split(",") + output = [] + if not quiet: + title = "Current conditions at %s" + place = lines[0].split(", ") + if len(place) > 1: + place = "%s, %s" % ( place[0].title(), place[1] ) + else: place = "<UNKNOWN>" + output.append(title%place) + output.append("Last updated " + lines[1]) + header_match = False + for header in headerlist: + for line in lines: + if line.lower().startswith(header + ":"): + if re.match(r".*:\d+$", line): line = line[:line.rfind(":")] + if imperial: line = filter_units(line, units="imperial") + elif metric: line = filter_units(line, units="metric") + if quiet: output.append(line) + else: output.append(" " + line) + header_match = True + if not header_match: + output.append( + "(no conditions matched your header list, try with --verbose)" + ) + return "\n".join(output) + +def get_alert( + uri=None, + verbose=False, + quiet=False, + cache_data=False, + cacheage=900, + cachedir="." +): + """Return alert notice for the specified URI.""" + if not uri: + import os, sys + message = "%s error: Alert URI required for alerts\n" % \ + os.path.basename( sys.argv[0] ) + sys.stderr.write(message) + sys.exit(1) + alert = get_uri( + uri, + ignore_fail=True, + cache_data=cache_data, + cacheage=cacheage, + cachedir=cachedir + ).strip() + if pyversion("3") and type(alert) is bytes: alert = alert.decode("utf-8") + if alert: + if verbose: return alert + else: + if alert.find("\nNATIONAL WEATHER SERVICE") == -1: + muted = False + else: + muted = True + lines = alert.split("\n") + import time + valid_time = time.strftime("%Y%m%d%H%M") + output = [] + for line in lines: + if line.startswith("Expires:") \ + and "Expires:" + valid_time > line: + return "" + if muted and line.startswith("NATIONAL WEATHER SERVICE"): + muted = False + line = "" + elif line == "&&": + line = "" + elif line == "$$": + muted = True + if line and not muted: + if quiet: output.append(line) + else: output.append(" " + line) + return "\n".join(output) + +def get_options(config): + """Parse the options passed on the command line.""" + + # for optparse's builtin -h/--help option + usage = \ + "usage: %prog [options] [alias1|search1 [alias2|search2 [...]]]" + + # for optparse's builtin --version option + verstring = "%prog " + weather_version + + # create the parser + import optparse + option_parser = optparse.OptionParser(usage=usage, version=verstring) + # separate options object from list of arguments and return both + + # the -a/--alert option + if config.has_option("default", "alert"): + default_alert = bool(config.get("default", "alert")) + else: default_alert = False + option_parser.add_option("-a", "--alert", + dest="alert", + action="store_true", + default=default_alert, + help="include local alert notices") + + # the --atypes option + if config.has_option("default", "atypes"): + default_atypes = config.get("default", "atypes") + else: + default_atypes = \ + "coastal_flood_statement," \ + + "flash_flood_statement," \ + + "flash_flood_warning," \ + + "flash_flood_watch," \ + + "flood_statement," \ + + "flood_warning," \ + + "marine_weather_statement," \ + + "river_statement," \ + + "severe_thunderstorm_warning," \ + + "severe_weather_statement," \ + + "short_term_forecast," \ + + "special_marine_warning," \ + + "special_weather_statement," \ + + "tornado_warning," \ + + "urgent_weather_message" + option_parser.add_option("--atypes", + dest="atypes", + default=default_atypes, + help="list of alert notification types to display") + + # the --build-sets option + option_parser.add_option("--build-sets", + dest="build_sets", + action="store_true", + default=False, + help="(re)build location correlation sets") + + # the --cacheage option + if config.has_option("default", "cacheage"): + default_cacheage = config.getint("default", "cacheage") + else: default_cacheage = 900 + option_parser.add_option("--cacheage", + dest="cacheage", + default=default_cacheage, + help="duration in seconds to refresh cached data") + + # the --cachedir option + if config.has_option("default", "cachedir"): + default_cachedir = config.get("default", "cachedir") + else: default_cachedir = "~/.weather" + option_parser.add_option("--cachedir", + dest="cachedir", + default=default_cachedir, + help="directory for storing cached searches and data") + + # the -f/--forecast option + if config.has_option("default", "forecast"): + default_forecast = bool(config.get("default", "forecast")) + else: default_forecast = False + option_parser.add_option("-f", "--forecast", + dest="forecast", + action="store_true", + default=default_forecast, + help="include a local forecast") + + # the --headers option + if config.has_option("default", "headers"): + default_headers = config.get("default", "headers") + else: + default_headers = \ + "temperature," \ + + "relative_humidity," \ + + "wind," \ + + "heat_index," \ + + "windchill," \ + + "weather," \ + + "sky_conditions," \ + + "precipitation_last_hour" + option_parser.add_option("--headers", + dest="headers", + default=default_headers, + help="list of conditions headers to display") + + # the --imperial option + if config.has_option("default", "imperial"): + default_imperial = bool(config.get("default", "imperial")) + else: default_imperial = False + option_parser.add_option("--imperial", + dest="imperial", + action="store_true", + default=default_imperial, + help="filter/convert conditions for US/UK units") + + # the --info option + option_parser.add_option("--info", + dest="info", + action="store_true", + default=False, + help="output detailed information for your search") + + # the -l/--list option + option_parser.add_option("-l", "--list", + dest="list", + action="store_true", + default=False, + help="list all configured aliases and cached searches") + + # the --longlist option + option_parser.add_option("--longlist", + dest="longlist", + action="store_true", + default=False, + help="display details of all configured aliases") + + # the -m/--metric option + if config.has_option("default", "metric"): + default_metric = bool(config.get("default", "metric")) + else: default_metric = False + option_parser.add_option("-m", "--metric", + dest="metric", + action="store_true", + default=default_metric, + help="filter/convert conditions for metric units") + + # the -n/--no-conditions option + if config.has_option("default", "conditions"): + default_conditions = bool(config.get("default", "conditions")) + else: default_conditions = True + option_parser.add_option("-n", "--no-conditions", + dest="conditions", + action="store_false", + default=default_conditions, + help="disable output of current conditions") + + # the --no-cache option + if config.has_option("default", "cache"): + default_cache = bool(config.get("default", "cache")) + else: default_cache = True + option_parser.add_option("--no-cache", + dest="cache", + action="store_false", + default=True, + help="disable all caching (searches and data)") + + # the --no-cache-data option + if config.has_option("default", "cache_data"): + default_cache_data = bool(config.get("default", "cache_data")) + else: default_cache_data = True + option_parser.add_option("--no-cache-data", + dest="cache_data", + action="store_false", + default=True, + help="disable retrieved data caching") + + # the --no-cache-search option + if config.has_option("default", "cache_search"): + default_cache_search = bool(config.get("default", "cache_search")) + else: default_cache_search = True + option_parser.add_option("--no-cache-search", + dest="cache_search", + action="store_false", + default=True, + help="disable search result caching") + + # the -q/--quiet option + if config.has_option("default", "quiet"): + default_quiet = bool(config.get("default", "quiet")) + else: default_quiet = False + option_parser.add_option("-q", "--quiet", + dest="quiet", + action="store_true", + default=default_quiet, + help="skip preambles and don't indent") + + # the --setpath option + if config.has_option("default", "setpath"): + default_setpath = config.get("default", "setpath") + else: default_setpath = ".:~/.weather" + option_parser.add_option("--setpath", + dest="setpath", + default=default_setpath, + help="directory search path for correlation sets") + + # the -v/--verbose option + if config.has_option("default", "verbose"): + default_verbose = bool(config.get("default", "verbose")) + else: default_verbose = False + option_parser.add_option("-v", "--verbose", + dest="verbose", + action="store_true", + default=default_verbose, + help="show full decoded feeds") + + # deprecated options + if config.has_option("default", "city"): + default_city = config.get("default", "city") + else: default_city = "" + option_parser.add_option("-c", "--city", + dest="city", + default=default_city, + help=optparse.SUPPRESS_HELP) + if config.has_option("default", "id"): + default_id = config.get("default", "id") + else: default_id = "" + option_parser.add_option("-i", "--id", + dest="id", + default=default_id, + help=optparse.SUPPRESS_HELP) + if config.has_option("default", "st"): + default_st = config.get("default", "st") + else: default_st = "" + option_parser.add_option("-s", "--st", + dest="st", + default=default_st, + help=optparse.SUPPRESS_HELP) + + options, arguments = option_parser.parse_args() + return options, arguments + +def get_config(): + """Parse the aliases and configuration.""" + if pyversion("3"): import configparser + else: import ConfigParser as configparser + config = configparser.ConfigParser() + import os + rcfiles = [ + "/etc/weatherrc", + "/etc/weather/weatherrc", + os.path.expanduser("~/.weather/weatherrc"), + os.path.expanduser("~/.weatherrc"), + "weatherrc" + ] + for rcfile in rcfiles: + if os.access(rcfile, os.R_OK): config.read(rcfile) + for section in config.sections(): + if section != section.lower(): + if config.has_section(section.lower()): + config.remove_section(section.lower()) + config.add_section(section.lower()) + for option,value in config.items(section): + config.set(section.lower(), option, value) + return config + +def integrate_search_cache(config, cachedir, setpath): + """Add cached search results into the configuration.""" + if pyversion("3"): import configparser + else: import ConfigParser as configparser + import os, time + scache_fn = os.path.join( os.path.expanduser(cachedir), "searches" ) + if not os.access(scache_fn, os.R_OK): return config + scache_fd = open(scache_fn) + created = float( scache_fd.readline().split(":")[1].strip().split()[0] ) + scache_fd.close() + now = time.time() + datafiles = data_index(setpath) + if datafiles: + data_freshness = sorted( + [ x[1] for x in datafiles.values() ], + reverse=True + )[0] + else: data_freshness = now + if created < data_freshness <= now: + try: + os.remove(scache_fn) + print( "[clearing outdated %s]" % scache_fn ) + except (IOError, OSError): + pass + return config + scache = configparser.ConfigParser() + scache.read(scache_fn) + for section in scache.sections(): + if not config.has_section(section): + config.add_section(section) + for option,value in scache.items(section): + config.set(section, option, value) + return config + +def list_aliases(config, detail=False): + """Return a formatted list of aliases defined in the config.""" + if detail: + output = "\n# configured alias details..." + for section in sorted(config.sections()): + output += "\n\n[%s]" % section + for item in sorted(config.items(section)): + output += "\n%s = %s" % item + output += "\n" + else: + output = "configured aliases and cached searches..." + for section in sorted(config.sections()): + if config.has_option(section, "description"): + description = config.get(section, "description") + else: description = "(no description provided)" + output += "\n %s: %s" % (section, description) + return output + +def data_index(path): + import os + datafiles = {} + for filename in ("airports", "places", "stations", "zctas", "zones"): + for dirname in path.split(":"): + for extension in ("", ".gz", ".txt"): + candidate = os.path.expanduser( + os.path.join( dirname, "".join( (filename, extension) ) ) + ) + if os.path.exists(candidate): + datafiles[filename] = ( + candidate, + os.stat(candidate).st_mtime + ) + break + if filename in datafiles: + break + return datafiles + +def guess( + expression, + path=".", + max_results=20, + info=False, + cache_search=False, + cacheage=900, + cachedir=".", + quiet=False +): + """Find URIs using airport, gecos, placename, station, ZCTA/ZIP, zone.""" + import codecs, datetime, time, os, re, sys + if pyversion("3"): import configparser + else: import ConfigParser as configparser + datafiles = data_index(path) + if re.match("[A-Za-z]{3}$", expression): searchtype = "airport" + elif re.match("[A-Za-z0-9]{4}$", expression): searchtype = "station" + elif re.match("[A-Za-z]{2}[Zz][0-9]{3}$", expression): searchtype = "zone" + elif re.match("[0-9]{5}$", expression): searchtype = "ZCTA" + elif re.match( + r"[\+-]?\d+(\.\d+)?(-\d+){,2}[ENSWensw]?, *[\+-]?\d+(\.\d+)?(-\d+){,2}[ENSWensw]?$", + expression + ): + searchtype = "coordinates" + elif re.match(r"(FIPS|fips)\d+$", expression): searchtype = "FIPS" + else: + searchtype = "name" + cache_search = False + if cache_search: action = "caching" + else: action = "using" + if info: + scores = [ + (0.005, "bad"), + (0.025, "poor"), + (0.160, "suspect"), + (0.500, "mediocre"), + (0.840, "good"), + (0.975, "great"), + (0.995, "excellent"), + (1.000, "ideal"), + ] + if not quiet: print("Searching via %s..."%searchtype) + stations = configparser.ConfigParser() + dataname = "stations" + if dataname in datafiles: + datafile = datafiles[dataname][0] + if datafile.endswith(".gz"): + import gzip + stations.readfp( gzip.open(datafile) ) + else: + stations.read(datafile) + else: + message = "%s error: can't find \"%s\" data file\n" % ( + os.path.basename( sys.argv[0] ), + dataname + ) + sys.stderr.write(message) + exit(1) + zones = configparser.ConfigParser() + dataname = "zones" + if dataname in datafiles: + datafile = datafiles[dataname][0] + if datafile.endswith(".gz"): + import gzip + zones.readfp( gzip.open(datafile) ) + else: + zones.read(datafile) + else: + message = "%s error: can't find \"%s\" data file\n" % ( + os.path.basename( sys.argv[0] ), + dataname + ) + sys.stderr.write(message) + exit(1) + search = None + station = ("", 0) + zone = ("", 0) + dataset = None + possibilities = [] + uris = {} + if searchtype == "airport": + expression = expression.lower() + airports = configparser.ConfigParser() + dataname = "airports" + if dataname in datafiles: + datafile = datafiles[dataname][0] + if datafile.endswith(".gz"): + import gzip + airports.readfp( gzip.open(datafile) ) + else: + airports.read(datafile) + else: + message = "%s error: can't find \"%s\" data file\n" % ( + os.path.basename( sys.argv[0] ), + dataname + ) + sys.stderr.write(message) + exit(1) + if airports.has_section(expression) \ + and airports.has_option(expression, "station"): + search = (expression, "IATA/FAA airport code %s" % expression) + station = ( airports.get(expression, "station"), 0 ) + if stations.has_option(station[0], "zone"): + zone = eval( stations.get(station[0], "zone") ) + dataset = stations + if not ( info or quiet ) \ + and stations.has_option( station[0], "description" ): + print( + "[%s result %s]" % ( + action, + stations.get(station[0], "description") + ) + ) + else: + message = "No IATA/FAA airport code \"%s\" in the %s file.\n" % ( + expression, + datafiles["airports"][0] + ) + sys.stderr.write(message) + exit(1) + elif searchtype == "station": + expression = expression.lower() + if stations.has_section(expression): + station = (expression, 0) + if not search: + search = (expression, "ICAO station code %s" % expression) + if stations.has_option(expression, "zone"): + zone = eval( stations.get(expression, "zone") ) + dataset = stations + if not ( info or quiet ) \ + and stations.has_option(expression, "description"): + print( + "[%s result %s]" % ( + action, + stations.get(expression, "description") + ) + ) + else: + message = "No ICAO weather station \"%s\" in the %s file.\n" % ( + expression, + datafiles["stations"][0] + ) + sys.stderr.write(message) + exit(1) + elif searchtype == "zone": + expression = expression.lower() + if zones.has_section(expression) \ + and zones.has_option(expression, "station"): + zone = (expression, 0) + station = eval( zones.get(expression, "station") ) + dataset = zones + search = (expression, "NWS/NOAA weather zone %s" % expression) + if not ( info or quiet ) \ + and zones.has_option(expression, "description"): + print( + "[%s result %s]" % ( + action, + zones.get(expression, "description") + ) + ) + else: + message = "No usable NWS weather zone \"%s\" in the %s file.\n" % ( + expression, + datafiles["zones"][0] + ) + sys.stderr.write(message) + exit(1) + elif searchtype == "ZCTA": + zctas = configparser.ConfigParser() + dataname = "zctas" + if dataname in datafiles: + datafile = datafiles[dataname][0] + if datafile.endswith(".gz"): + import gzip + zctas.readfp( gzip.open(datafile) ) + else: + zctas.read(datafile) + else: + message = "%s error: can't find \"%s\" data file\n" % ( + os.path.basename( sys.argv[0] ), + dataname + ) + sys.stderr.write(message) + exit(1) + dataset = zctas + if zctas.has_section(expression) \ + and zctas.has_option(expression, "station"): + station = eval( zctas.get(expression, "station") ) + search = (expression, "Census ZCTA (ZIP code) %s" % expression) + if zctas.has_option(expression, "zone"): + zone = eval( zctas.get(expression, "zone") ) + else: + message = "No census ZCTA (ZIP code) \"%s\" in the %s file.\n" % ( + expression, + datafiles["zctas"][0] + ) + sys.stderr.write(message) + exit(1) + elif searchtype == "coordinates": + search = (expression, "Geographic coordinates %s" % expression) + stationtable = {} + for station in stations.sections(): + if stations.has_option(station, "location"): + stationtable[station] = { + "location": eval( stations.get(station, "location") ) + } + station = closest( gecos(expression), stationtable, "location", 0.1 ) + if not station[0]: + message = "No ICAO weather station found near %s.\n" % expression + sys.stderr.write(message) + exit(1) + zonetable = {} + for zone in zones.sections(): + if zones.has_option(zone, "centroid"): + zonetable[zone] = { + "centroid": eval( zones.get(zone, "centroid") ) + } + zone = closest( gecos(expression), zonetable, "centroid", 0.1 ) + if not zone[0]: + message = "No NWS weather zone near %s; forecasts unavailable.\n" \ + % expression + sys.stderr.write(message) + elif searchtype in ("FIPS", "name"): + places = configparser.ConfigParser() + dataname = "places" + if dataname in datafiles: + datafile = datafiles[dataname][0] + if datafile.endswith(".gz"): + import gzip + places.readfp( gzip.open(datafile) ) + else: + places.read(datafile) + else: + message = "%s error: can't find \"%s\" data file\n" % ( + os.path.basename( sys.argv[0] ), + dataname + ) + sys.stderr.write(message) + exit(1) + dataset = places + place = expression.lower() + if places.has_section(place) and places.has_option(place, "station"): + station = eval( places.get(place, "station") ) + search = (expression, "Census Place %s" % expression) + if places.has_option(place, "description"): + search = ( + search[0], + search[1] + ", %s" % places.get(place, "description") + ) + if places.has_option(place, "zone"): + zone = eval( places.get(place, "zone") ) + if not ( info or quiet ) \ + and places.has_option(place, "description"): + print( + "[%s result %s]" % ( + action, + places.get(place, "description") + ) + ) + else: + for place in places.sections(): + if places.has_option(place, "description") \ + and places.has_option(place, "station") \ + and re.search( + expression, + places.get(place, "description"), + re.I + ): + possibilities.append(place) + for place in stations.sections(): + if stations.has_option(place, "description") \ + and re.search( + expression, + stations.get(place, "description"), + re.I + ): + possibilities.append(place) + for place in zones.sections(): + if zones.has_option(place, "description") \ + and zones.has_option(place, "station") \ + and re.search( + expression, + zones.get(place, "description"), + re.I + ): + possibilities.append(place) + if len(possibilities) == 1: + place = possibilities[0] + if places.has_section(place): + station = eval( places.get(place, "station") ) + description = places.get(place, "description") + if places.has_option(place, "zone"): + zone = eval( places.get(place, "zone" ) ) + search = ( expression, "%s: %s" % (place, description) ) + elif stations.has_section(place): + station = (place, 0.0) + description = stations.get(place, "description") + if stations.has_option(place, "zone"): + zone = eval( stations.get(place, "zone" ) ) + search = ( expression, "ICAO station code %s" % place ) + elif zones.has_section(place): + station = eval( zones.get(place, "station") ) + description = zones.get(place, "description") + zone = (place, 0.0) + search = ( expression, "NWS/NOAA weather zone %s" % place ) + if not ( info or quiet ): + print( "[%s result %s]" % (action, description) ) + if not possibilities and not station[0]: + message = "No FIPS code/census area match in the %s file.\n" % ( + datafiles["places"][0] + ) + sys.stderr.write(message) + exit(1) + if station[0]: + uris["metar"] = stations.get( station[0], "metar" ) + if zone[0]: + for key,value in zones.items( zone[0] ): + if key not in ("centroid", "description", "station"): + uris[key] = value + elif possibilities: + count = len(possibilities) + if count <= max_results: + print( "Your search is ambiguous, returning %s matches:" % count ) + for place in sorted(possibilities): + if places.has_section(place): + print( + " [%s] %s" % ( + place, + places.get(place, "description") + ) + ) + elif stations.has_section(place): + print( + " [%s] %s" % ( + place, + stations.get(place, "description") + ) + ) + elif zones.has_section(place): + print( + " [%s] %s" % ( + place, + zones.get(place, "description") + ) + ) + else: + print( + "Your search is too ambiguous, returning %s matches." % count + ) + exit(0) + if info: + stationlist = [] + zonelist = [] + if dataset: + for section in dataset.sections(): + if dataset.has_option(section, "station"): + stationlist.append( + eval( dataset.get(section, "station") )[1] + ) + if dataset.has_option(section, "zone"): + zonelist.append( eval( dataset.get(section, "zone") )[1] ) + stationlist.sort() + zonelist.sort() + scount = len(stationlist) + zcount = len(zonelist) + sranks = [] + zranks = [] + for score in scores: + if stationlist: + sranks.append( stationlist[ int( (1-score[0]) * scount ) ] ) + if zonelist: + zranks.append( zonelist[ int( (1-score[0]) * zcount ) ] ) + description = search[1] + uris["description"] = description + print( + "%s\n%s" % ( description, "-" * len(description) ) + ) + print( + "%s: %s" % ( + station[0], + stations.get( station[0], "description" ) + ) + ) + km = radian_to_km*station[1] + mi = radian_to_mi*station[1] + if sranks and not description.startswith("ICAO station code "): + for index in range(0, len(scores)): + if station[1] >= sranks[index]: + score = scores[index][1] + break + print( + " (proximity %s, %.3gkm, %.3gmi)" % ( score, km, mi ) + ) + elif searchtype is "coordinates": + print( " (%.3gkm, %.3gmi)" % (km, mi) ) + if zone[0]: + print( + "%s: %s" % ( zone[0], zones.get( zone[0], "description" ) ) + ) + km = radian_to_km*zone[1] + mi = radian_to_mi*zone[1] + if zranks and not description.startswith("NWS/NOAA weather zone "): + for index in range(0, len(scores)): + if zone[1] >= zranks[index]: + score = scores[index][1] + break + print( + " (proximity %s, %.3gkm, %.3gmi)" % ( score, km, mi ) + ) + elif searchtype is "coordinates" and zone[0]: + print( " (%.3gkm, %.3gmi)" % (km, mi) ) + if cache_search: + now = time.time() + nowstamp = "%s (%s)" % ( + now, + datetime.datetime.isoformat( + datetime.datetime.fromtimestamp(now), + " " + ) + ) + search_cache = ["\n"] + search_cache.append( "[%s]\n" % search[0] ) + search_cache.append( "description = cached %s\n" % nowstamp ) + for uriname in sorted(uris.keys()): + search_cache.append( "%s = %s\n" % ( uriname, uris[uriname] ) ) + real_cachedir = os.path.expanduser(cachedir) + if not os.path.exists(real_cachedir): + try: os.makedirs(real_cachedir) + except (IOError, OSError): pass + scache_fn = os.path.join(real_cachedir, "searches") + if not os.path.exists(scache_fn): + then = sorted( + [ x[1] for x in datafiles.values() ], + reverse=True + )[0] + thenstamp = "%s (%s)" % ( + then, + datetime.datetime.isoformat( + datetime.datetime.fromtimestamp(then), + " " + ) + ) + search_cache.insert( + 0, + "# based on data files from: %s\n" % thenstamp + ) + try: + scache_existing = configparser.ConfigParser() + scache_existing.read(scache_fn) + if not scache_existing.has_section(search[0]): + scache_fd = codecs.open(scache_fn, "a", "utf-8") + scache_fd.writelines(search_cache) + scache_fd.close() + except (IOError, OSError): pass + if not info: + return(uris) + +def closest(position, nodes, fieldname, angle=None): + import math + if not angle: angle = 2*math.pi + match = None + for name in nodes: + if fieldname in nodes[name]: + node = nodes[name][fieldname] + if node and abs( position[0]-node[0] ) < angle: + if abs( position[1]-node[1] ) < angle \ + or abs( abs( position[1]-node[1] ) - 2*math.pi ) < angle: + if position == node: + angle = 0 + match = name + else: + candidate = math.acos( + math.sin( position[0] ) * math.sin( node[0] ) \ + + math.cos( position[0] ) \ + * math.cos( node[0] ) \ + * math.cos( position[1] - node[1] ) + ) + if candidate < angle: + angle = candidate + match = name + if match: match = str(match) + return (match, angle) + +def gecos(formatted): + import math, re + coordinates = formatted.split(",") + for coordinate in range(0, 2): + degrees, foo, minutes, bar, seconds, hemisphere = re.match( + r"([\+-]?\d+\.?\d*)(-(\d+))?(-(\d+))?([ensw]?)$", + coordinates[coordinate].strip().lower() + ).groups() + value = float(degrees) + if minutes: value += float(minutes)/60 + if seconds: value += float(seconds)/3600 + if hemisphere and hemisphere in "sw": value *= -1 + coordinates[coordinate] = math.radians(value) + return tuple(coordinates) + +def correlate(): + import codecs, datetime, hashlib, os, re, sys, tarfile, time, zipfile + if pyversion("3"): import configparser + else: import ConfigParser as configparser + gcounties_an = "2015_Gaz_counties_national.zip" + gcounties_fn = "2015_Gaz_counties_national.txt" + gcousubs_an = "2015_Gaz_cousubs_national.zip" + gcousubs_fn = "2015_Gaz_cousubs_national.txt" + gplace_an = "2015_Gaz_place_national.zip" + gplace_fn = "2015_Gaz_place_national.txt" + gzcta_an = "2015_Gaz_zcta_national.zip" + gzcta_fn = "2015_Gaz_zcta_national.txt" + for filename in os.listdir("."): + if re.match("bp[0-9][0-9][a-z][a-z][0-9][0-9].dbx$", filename): + cpfzcf_fn = filename + break + nsdcccc_fn = "nsd_cccc.txt" + zcatalog_an = "zonecatalog.curr.tar" + metartbl_fn = "metar.tbl" + coopstn_fn = "coop-stations.txt" + overrides_fn = "overrides.conf" + overrideslog_fn = "overrides.log" + slist_fn = "slist" + zlist_fn = "zlist" + qalog_fn = "qa.log" + airports_fn = "airports" + places_fn = "places" + stations_fn = "stations" + zctas_fn = "zctas" + zones_fn = "zones" + header = """\ +%s +# generated by %s on %s from these public domain sources: +# +# http://www.census.gov/geo/maps-data/data/gazetteer2015.html +# %s %s %s +# %s %s %s +# %s %s %s +# %s %s %s +# +# http://www.weather.gov/geodata/catalog/wsom/html/cntyzone.htm +# %s %s %s +# +# http://tgftp.nws.noaa.gov/data/nsd_cccc.txt +# %s %s %s +# +# http://tgftp.nws.noaa.gov/data/zonecatalog.curr.tar +# %s %s %s +# +# http://www.nco.ncep.noaa.gov/pmb/codes/nwprod/dictionaries/metar.tbl +# %s %s %s +# +# http://www.ncdc.noaa.gov/homr/reports +# %s %s %s +# +# ...and these manually-generated or hand-compiled adjustments: +# %s %s %s +# %s %s %s +# %s %s %s\ +""" % ( + weather_copyright, + os.path.basename( sys.argv[0] ), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( time.time() ) + ), + hashlib.md5( open(gcounties_an, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(gcounties_an) ) + ), + gcounties_an, + hashlib.md5( open(gcousubs_an, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(gcousubs_an) ) + ), + gcousubs_an, + hashlib.md5( open(gplace_an, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(gplace_an) ) + ), + gplace_an, + hashlib.md5( open(gzcta_an, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(gzcta_an) ) + ), + gzcta_an, + hashlib.md5( open(cpfzcf_fn, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(cpfzcf_fn) ) + ), + cpfzcf_fn, + hashlib.md5( open(nsdcccc_fn, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(nsdcccc_fn) ) + ), + nsdcccc_fn, + hashlib.md5( open(zcatalog_an, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(zcatalog_an) ) + ), + zcatalog_an, + hashlib.md5( open(metartbl_fn, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(metartbl_fn) ) + ), + metartbl_fn, + hashlib.md5( open(coopstn_fn, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(coopstn_fn) ) + ), + coopstn_fn, + hashlib.md5( open(overrides_fn, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(overrides_fn) ) + ), + overrides_fn, + hashlib.md5( open(slist_fn, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(slist_fn) ) + ), + slist_fn, + hashlib.md5( open(zlist_fn, "rb").read() ).hexdigest(), + datetime.date.isoformat( + datetime.datetime.fromtimestamp( os.path.getmtime(zlist_fn) ) + ), + zlist_fn + ) + airports = {} + places = {} + stations = {} + zctas = {} + zones = {} + message = "Reading %s:%s..." % (gcounties_an, gcounties_fn) + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + gcounties = zipfile.ZipFile(gcounties_an).open(gcounties_fn, "rU") + columns = gcounties.readline().decode("latin1").strip().split("\t") + for line in gcounties: + fields = line.decode("latin1").strip().split("\t") + f_geoid = fields[ columns.index("GEOID") ].strip() + f_name = fields[ columns.index("NAME") ].strip() + f_usps = fields[ columns.index("USPS") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_name and f_usps and f_intptlat and f_intptlong: + fips = "fips%s" % f_geoid + if fips not in places: places[fips] = {} + places[fips]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) + ) + places[fips]["description"] = "%s, %s" % (f_name, f_usps) + count += 1 + gcounties.close() + print("done (%s lines)." % count) + message = "Reading %s:%s..." % (gcousubs_an, gcousubs_fn) + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + gcousubs = zipfile.ZipFile(gcousubs_an).open(gcousubs_fn, "rU") + columns = gcousubs.readline().decode("latin1").strip().split("\t") + for line in gcousubs: + fields = line.decode("latin1").strip().split("\t") + f_geoid = fields[ columns.index("GEOID") ].strip() + f_name = fields[ columns.index("NAME") ].strip() + f_usps = fields[ columns.index("USPS") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_name and f_usps and f_intptlat and f_intptlong: + fips = "fips%s" % f_geoid + if fips not in places: places[fips] = {} + places[fips]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) + ) + places[fips]["description"] = "%s, %s" % (f_name, f_usps) + count += 1 + gcousubs.close() + print("done (%s lines)." % count) + message = "Reading %s:%s..." % (gplace_an, gplace_fn) + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + gplace = zipfile.ZipFile(gplace_an).open(gplace_fn, "rU") + columns = gplace.readline().decode("latin1").strip().split("\t") + for line in gplace: + fields = line.decode("latin1").strip().split("\t") + f_geoid = fields[ columns.index("GEOID") ].strip() + f_name = fields[ columns.index("NAME") ].strip() + f_usps = fields[ columns.index("USPS") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_name and f_usps and f_intptlat and f_intptlong: + fips = "fips%s" % f_geoid + if fips not in places: places[fips] = {} + places[fips]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) + ) + places[fips]["description"] = "%s, %s" % (f_name, f_usps) + count += 1 + gplace.close() + print("done (%s lines)." % count) + message = "Reading %s..." % slist_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + slist = codecs.open(slist_fn, "rU") + for line in slist: + icao = line.split("#")[0].strip() + if icao: + stations[icao] = { + "metar": "http://tgftp.nws.noaa.gov/data/observations/"\ + + "metar/decoded/%s.TXT" % icao.upper() + } + count += 1 + slist.close() + print("done (%s lines)." % count) + message = "Reading %s..." % metartbl_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + metartbl = codecs.open(metartbl_fn, "rU") + for line in metartbl: + icao = line[:4].strip().lower() + if icao in stations: + description = [] + name = " ".join( + line[16:48].replace("_", " ").strip().title().split() + ) + if name: description.append(name) + st = line[49:51].strip() + if st: description.append(st) + cn = line[52:54].strip() + if cn: description.append(cn) + if description: + stations[icao]["description"] = ", ".join(description) + lat = line[55:60].strip() + if lat: + lat = int(lat)/100.0 + lon = line[61:67].strip() + if lon: + lon = int(lon)/100.0 + stations[icao]["location"] = gecos( "%s,%s" % (lat, lon) ) + count += 1 + metartbl.close() + print("done (%s lines)." % count) + message = "Reading %s..." % nsdcccc_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + nsdcccc = codecs.open(nsdcccc_fn, "rU", "latin1") + for line in nsdcccc: + line = str(line) + fields = line.split(";") + icao = fields[0].strip().lower() + if icao in stations: + description = [] + name = " ".join( fields[3].strip().title().split() ) + if name: description.append(name) + st = fields[4].strip() + if st: description.append(st) + country = " ".join( fields[5].strip().title().split() ) + if country: description.append(country) + if description: + stations[icao]["description"] = ", ".join(description) + lat, lon = fields[7:9] + if lat and lon: + stations[icao]["location"] = gecos( "%s,%s" % (lat, lon) ) + elif "location" not in stations[icao]: + lat, lon = fields[5:7] + if lat and lon: + stations[icao]["location"] = gecos( "%s,%s" % (lat, lon) ) + count += 1 + nsdcccc.close() + print("done (%s lines)." % count) + message = "Reading %s..." % coopstn_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + coopstn = open(coopstn_fn) + for line in coopstn: + icao = line[33:37].strip().lower() + if icao in stations: + iata = line[22:26].strip().lower() + if len(iata) == 3: airports[iata] = { "station": icao } + if "description" not in stations[icao]: + description = [] + name = " ".join( line[99:129].strip().title().split() ) + if name: description.append(name) + st = line[59:61].strip() + if st: description.append(st) + country = " ".join( line[38:58].strip().title().split() ) + if country: description.append(country) + if description: + stations[icao]["description"] = ", ".join(description) + if "location" not in stations[icao]: + lat = line[130:139].strip() + if lat: + lat = lat.replace(" ", "-") + lon = line[140:150].strip() + if lon: + lon = lon.replace(" ", "-") + stations[icao]["location"] = gecos( + "%s,%s" % (lat, lon) + ) + count += 1 + coopstn.close() + print("done (%s lines)." % count) + message = "Reading %s..." % zlist_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + zlist = codecs.open(zlist_fn, "rU") + for line in zlist: + line = line.split("#")[0].strip() + if line: + zones[line] = {} + count += 1 + zlist.close() + print("done (%s lines)." % count) + message = "Reading %s:*..." % zcatalog_an + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + zcatalog = tarfile.open(zcatalog_an) + for entry in zcatalog.getmembers(): + if entry.isfile(): + fnmatch = re.match( + r"([a-z]+z[0-9]+)\.txt$", + os.path.basename(entry.name) + ) + if fnmatch: + zone = fnmatch.group(1) + if zone in zones: + data = zcatalog.extractfile(entry).readlines() + description = data[0].decode("ascii").strip() + zones[zone]["description"] = description + for line in data[1:]: + line = line.decode("latin1").strip() + urimatch = re.match("/webdocs/pub/(.+):(.+) for ", + line) + if urimatch: + uritype = urimatch.group(2).lower().replace(" ","_") + zones[zone][uritype] = ( + "http://tgftp.nws.noaa.gov/%s" + % urimatch.group(1)) + count += 1 + zcatalog.close() + print("done (%s files)." % count) + message = "Reading %s..." % cpfzcf_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + cpfz = {} + cpfzcf = open(cpfzcf_fn) + for line in cpfzcf: + fields = line.strip().split("|") + if len(fields) == 11 \ + and fields[0] and fields[1] and fields[9] and fields[10]: + zone = "z".join( fields[:2] ).lower() + if zone in zones: + zones[zone]["centroid"] = gecos( ",".join( fields[9:11] ) ) + elif fields[6]: + state = fields[0] + description = fields[3] + county = fields[5] + fips = "fips%s"%fields[6] + possible = [ + "%s, %s" % (county, state), + "%s County, %s" % (county, state), + ] + if description.endswith(" Counties"): + description = description[:-9] + for addition in description.split(" and "): + possible.append( "%s, %s" % (addition, state) ) + possible.append( "%s County, %s" % (addition, state) ) + if fips in places and "centroid" in places[fips]: + for candidate in zones: + if "centroid" not in zones[candidate] and \ + "description" in zones[candidate] and \ + zones[candidate]["description"] in possible: + zones[candidate]["centroid"] = \ + places[fips]["centroid"] + count += 1 + cpfzcf.close() + print("done (%s lines)." % count) + message = "Reading %s:%s..." % (gzcta_an, gzcta_fn) + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + gzcta = zipfile.ZipFile(gzcta_an).open(gzcta_fn, "rU") + columns = gzcta.readline().decode("latin1").strip().split("\t") + for line in gzcta: + fields = line.decode("latin1").strip().split("\t") + f_geoid = fields[ columns.index("GEOID") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_intptlat and f_intptlong: + if f_geoid not in zctas: zctas[f_geoid] = {} + zctas[f_geoid]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) + ) + count += 1 + gzcta.close() + print("done (%s lines)." % count) + message = "Reading %s..." % overrides_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + added = 0 + removed = 0 + changed = 0 + overrides = configparser.ConfigParser() + overrides.readfp( codecs.open(overrides_fn, "r", "utf8") ) + overrideslog = [] + for section in overrides.sections(): + addopt = 0 + chgopt = 0 + if section.startswith("-"): + section = section[1:] + delete = True + else: delete = False + if re.match("[A-Za-z]{3}$", section): + if delete: + if section in airports: + del( airports[section] ) + logact = "removed airport %s" % section + removed += 1 + else: + logact = "tried to remove nonexistent airport %s" % section + else: + if section in airports: + logact = "changed airport %s" % section + changed += 1 + else: + airports[section] = {} + logact = "added airport %s" % section + added += 1 + for key,value in overrides.items(section): + if key in airports[section]: chgopt += 1 + else: addopt += 1 + if key in ("centroid", "location"): + airports[section][key] = eval(value) + else: + airports[section][key] = value + if addopt and chgopt: + logact += " (+%s/!%s options)" % (addopt, chgopt) + elif addopt: logact += " (+%s options)" % addopt + elif chgopt: logact += " (!%s options)" % chgopt + elif re.match("[A-Za-z0-9]{4}$", section): + if delete: + if section in stations: + del( stations[section] ) + logact = "removed station %s" % section + removed += 1 + else: + logact = "tried to remove nonexistent station %s" % section + else: + if section in stations: + logact = "changed station %s" % section + changed += 1 + else: + stations[section] = {} + logact = "added station %s" % section + added += 1 + for key,value in overrides.items(section): + if key in stations[section]: chgopt += 1 + else: addopt += 1 + if key in ("centroid", "location"): + stations[section][key] = eval(value) + else: + stations[section][key] = value + if addopt and chgopt: + logact += " (+%s/!%s options)" % (addopt, chgopt) + elif addopt: logact += " (+%s options)" % addopt + elif chgopt: logact += " (!%s options)" % chgopt + elif re.match("[0-9]{5}$", section): + if delete: + if section in zctas: + del( zctas[section] ) + logact = "removed zcta %s" % section + removed += 1 + else: + logact = "tried to remove nonexistent zcta %s" % section + else: + if section in zctas: + logact = "changed zcta %s" % section + changed += 1 + else: + zctas[section] = {} + logact = "added zcta %s" % section + added += 1 + for key,value in overrides.items(section): + if key in zctas[section]: chgopt += 1 + else: addopt += 1 + if key in ("centroid", "location"): + zctas[section][key] = eval(value) + else: + zctas[section][key] = value + if addopt and chgopt: + logact += " (+%s/!%s options)" % (addopt, chgopt) + elif addopt: logact += " (+%s options)" % addopt + elif chgopt: logact += " (!%s options)" % chgopt + elif re.match("[A-Za-z]{2}[Zz][0-9]{3}$", section): + if delete: + if section in zones: + del( zones[section] ) + logact = "removed zone %s" % section + removed += 1 + else: + logact = "tried to remove nonexistent zone %s" % section + else: + if section in zones: + logact = "changed zone %s" % section + changed += 1 + else: + zones[section] = {} + logact = "added zone %s" % section + added += 1 + for key,value in overrides.items(section): + if key in zones[section]: chgopt += 1 + else: addopt += 1 + if key in ("centroid", "location"): + zones[section][key] = eval(value) + else: + zones[section][key] = value + if addopt and chgopt: + logact += " (+%s/!%s options)" % (addopt, chgopt) + elif addopt: logact += " (+%s options)" % addopt + elif chgopt: logact += " (!%s options)" % chgopt + elif re.match("fips[0-9]+$", section): + if delete: + if section in places: + del( places[section] ) + logact = "removed place %s" % section + removed += 1 + else: + logact = "tried to remove nonexistent place %s" % section + else: + if section in places: + logact = "changed place %s" % section + changed += 1 + else: + places[section] = {} + logact = "added place %s" % section + added += 1 + for key,value in overrides.items(section): + if key in places[section]: chgopt += 1 + else: addopt += 1 + if key in ("centroid", "location"): + places[section][key] = eval(value) + else: + places[section][key] = value + if addopt and chgopt: + logact += " (+%s/!%s options)" % (addopt, chgopt) + elif addopt: logact += " (+%s options)" % addopt + elif chgopt: logact += " (!%s options)" % chgopt + count += 1 + overrideslog.append("%s\n" % logact) + overrideslog.sort() + if os.path.exists(overrideslog_fn): + os.rename(overrideslog_fn, "%s_old"%overrideslog_fn) + overrideslog_fd = codecs.open(overrideslog_fn, "w", "utf8") + overrideslog_fd.writelines(overrideslog) + overrideslog_fd.close() + print("done (%s overridden sections: +%s/-%s/!%s)." % ( + count, + added, + removed, + changed + ) ) + estimate = 2*len(places) + len(stations) + 2*len(zctas) + len(zones) + print( + "Correlating places, stations, ZCTAs and zones (upper bound is %s):" % \ + estimate + ) + count = 0 + milestones = list( range(51) ) + message = " " + sys.stdout.write(message) + sys.stdout.flush() + for fips in places: + centroid = places[fips]["centroid"] + if centroid: + station = closest(centroid, stations, "location", 0.1) + if station[0]: + places[fips]["station"] = station + count += 1 + if not count%100: + level = int(50*count/estimate) + if level in milestones: + for remaining in milestones[:milestones.index(level)+1]: + if remaining%5: + message = "." + sys.stdout.write(message) + sys.stdout.flush() + else: + message = "%s%%" % (remaining*2,) + sys.stdout.write(message) + sys.stdout.flush() + milestones.remove(remaining) + if centroid: + zone = closest(centroid, zones, "centroid", 0.1) + if zone[0]: + places[fips]["zone"] = zone + count += 1 + if not count%100: + level = int(50*count/estimate) + if level in milestones: + for remaining in milestones[:milestones.index(level)+1]: + if remaining%5: + message = "." + sys.stdout.write(message) + sys.stdout.flush() + else: + message = "%s%%" % (remaining*2,) + sys.stdout.write(message) + sys.stdout.flush() + milestones.remove(remaining) + for station in stations: + if "location" in stations[station]: + location = stations[station]["location"] + if location: + zone = closest(location, zones, "centroid", 0.1) + if zone[0]: + stations[station]["zone"] = zone + count += 1 + if not count%100: + level = int(50*count/estimate) + if level in milestones: + for remaining in milestones[:milestones.index(level)+1]: + if remaining%5: + message = "." + sys.stdout.write(message) + sys.stdout.flush() + else: + message = "%s%%" % (remaining*2,) + sys.stdout.write(message) + sys.stdout.flush() + milestones.remove(remaining) + for zcta in zctas.keys(): + centroid = zctas[zcta]["centroid"] + if centroid: + station = closest(centroid, stations, "location", 0.1) + if station[0]: + zctas[zcta]["station"] = station + count += 1 + if not count%100: + level = int(50*count/estimate) + if level in milestones: + for remaining in milestones[ : milestones.index(level)+1 ]: + if remaining%5: + message = "." + sys.stdout.write(message) + sys.stdout.flush() + else: + message = "%s%%" % (remaining*2,) + sys.stdout.write(message) + sys.stdout.flush() + milestones.remove(remaining) + if centroid: + zone = closest(centroid, zones, "centroid", 0.1) + if zone[0]: + zctas[zcta]["zone"] = zone + count += 1 + if not count%100: + level = int(50*count/estimate) + if level in milestones: + for remaining in milestones[:milestones.index(level)+1]: + if remaining%5: + message = "." + sys.stdout.write(message) + sys.stdout.flush() + else: + message = "%s%%" % (remaining*2,) + sys.stdout.write(message) + sys.stdout.flush() + milestones.remove(remaining) + for zone in zones.keys(): + if "centroid" in zones[zone]: + centroid = zones[zone]["centroid"] + if centroid: + station = closest(centroid, stations, "location", 0.1) + if station[0]: + zones[zone]["station"] = station + count += 1 + if not count%100: + level = int(50*count/estimate) + if level in milestones: + for remaining in milestones[:milestones.index(level)+1]: + if remaining%5: + message = "." + sys.stdout.write(message) + sys.stdout.flush() + else: + message = "%s%%" % (remaining*2,) + sys.stdout.write(message) + sys.stdout.flush() + milestones.remove(remaining) + for remaining in milestones: + if remaining%5: + message = "." + sys.stdout.write(message) + sys.stdout.flush() + else: + message = "%s%%" % (remaining*2,) + sys.stdout.write(message) + sys.stdout.flush() + print("\n done (%s correlations)." % count) + message = "Writing %s..." % airports_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + if os.path.exists(airports_fn): + os.rename(airports_fn, "%s_old"%airports_fn) + airports_fd = codecs.open(airports_fn, "w", "utf8") + airports_fd.write(header) + for airport in sorted( airports.keys() ): + airports_fd.write("\n\n[%s]" % airport) + for key, value in sorted( airports[airport].items() ): + if type(value) is float: value = "%.7f"%value + elif type(value) is tuple: + elements = [] + for element in value: + if type(element) is float: elements.append("%.7f"%element) + else: elements.append( repr(element) ) + value = "(%s)"%", ".join(elements) + airports_fd.write( "\n%s = %s" % (key, value) ) + count += 1 + airports_fd.write("\n") + airports_fd.close() + print("done (%s sections)." % count) + message = "Writing %s..." % places_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + if os.path.exists(places_fn): + os.rename(places_fn, "%s_old"%places_fn) + places_fd = codecs.open(places_fn, "w", "utf8") + places_fd.write(header) + for fips in sorted( places.keys() ): + places_fd.write("\n\n[%s]" % fips) + for key, value in sorted( places[fips].items() ): + if type(value) is float: value = "%.7f"%value + elif type(value) is tuple: + elements = [] + for element in value: + if type(element) is float: elements.append("%.7f"%element) + else: elements.append( repr(element) ) + value = "(%s)"%", ".join(elements) + places_fd.write( "\n%s = %s" % (key, value) ) + count += 1 + places_fd.write("\n") + places_fd.close() + print("done (%s sections)." % count) + message = "Writing %s..." % stations_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + if os.path.exists(stations_fn): + os.rename(stations_fn, "%s_old"%stations_fn) + stations_fd = codecs.open(stations_fn, "w", "utf8") + stations_fd.write(header) + for station in sorted( stations.keys() ): + stations_fd.write("\n\n[%s]" % station) + for key, value in sorted( stations[station].items() ): + if type(value) is float: value = "%.7f"%value + elif type(value) is tuple: + elements = [] + for element in value: + if type(element) is float: elements.append("%.7f"%element) + else: elements.append( repr(element) ) + value = "(%s)"%", ".join(elements) + stations_fd.write( "\n%s = %s" % (key, value) ) + count += 1 + stations_fd.write("\n") + stations_fd.close() + print("done (%s sections)." % count) + message = "Writing %s..." % zctas_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + if os.path.exists(zctas_fn): + os.rename(zctas_fn, "%s_old"%zctas_fn) + zctas_fd = codecs.open(zctas_fn, "w", "utf8") + zctas_fd.write(header) + for zcta in sorted( zctas.keys() ): + zctas_fd.write("\n\n[%s]" % zcta) + for key, value in sorted( zctas[zcta].items() ): + if type(value) is float: value = "%.7f"%value + elif type(value) is tuple: + elements = [] + for element in value: + if type(element) is float: elements.append("%.7f"%element) + else: elements.append( repr(element) ) + value = "(%s)"%", ".join(elements) + zctas_fd.write( "\n%s = %s" % (key, value) ) + count += 1 + zctas_fd.write("\n") + zctas_fd.close() + print("done (%s sections)." % count) + message = "Writing %s..." % zones_fn + sys.stdout.write(message) + sys.stdout.flush() + count = 0 + if os.path.exists(zones_fn): + os.rename(zones_fn, "%s_old"%zones_fn) + zones_fd = codecs.open(zones_fn, "w", "utf8") + zones_fd.write(header) + for zone in sorted( zones.keys() ): + zones_fd.write("\n\n[%s]" % zone) + for key, value in sorted( zones[zone].items() ): + if type(value) is float: value = "%.7f"%value + elif type(value) is tuple: + elements = [] + for element in value: + if type(element) is float: elements.append("%.7f"%element) + else: elements.append( repr(element) ) + value = "(%s)"%", ".join(elements) + zones_fd.write( "\n%s = %s" % (key, value) ) + count += 1 + zones_fd.write("\n") + zones_fd.close() + print("done (%s sections)." % count) + message = "Starting QA check..." + sys.stdout.write(message) + sys.stdout.flush() + airports = configparser.ConfigParser() + airports.read(airports_fn) + places = configparser.ConfigParser() + places.read(places_fn) + stations = configparser.ConfigParser() + stations.read(stations_fn) + zctas = configparser.ConfigParser() + zctas.read(zctas_fn) + zones = configparser.ConfigParser() + zones.read(zones_fn) + qalog = [] + places_nocentroid = 0 + places_nodescription = 0 + for place in sorted( places.sections() ): + if not places.has_option(place, "centroid"): + qalog.append("%s: no centroid\n" % place) + places_nocentroid += 1 + if not places.has_option(place, "description"): + qalog.append("%s: no description\n" % place) + places_nodescription += 1 + stations_nodescription = 0 + stations_nolocation = 0 + stations_nometar = 0 + for station in sorted( stations.sections() ): + if not stations.has_option(station, "description"): + qalog.append("%s: no description\n" % station) + stations_nodescription += 1 + if not stations.has_option(station, "location"): + qalog.append("%s: no location\n" % station) + stations_nolocation += 1 + if not stations.has_option(station, "metar"): + qalog.append("%s: no metar\n" % station) + stations_nometar += 1 + airports_badstation = 0 + airports_nostation = 0 + for airport in sorted( airports.sections() ): + if not airports.has_option(airport, "station"): + qalog.append("%s: no station\n" % airport) + airports_nostation += 1 + else: + station = airports.get(airport, "station") + if station not in stations.sections(): + qalog.append( "%s: bad station %s\n" % (airport, station) ) + airports_badstation += 1 + zctas_nocentroid = 0 + for zcta in sorted( zctas.sections() ): + if not zctas.has_option(zcta, "centroid"): + qalog.append("%s: no centroid\n" % zcta) + zctas_nocentroid += 1 + zones_nocentroid = 0 + zones_nodescription = 0 + zones_noforecast = 0 + zones_overlapping = 0 + zonetable = {} + for zone in zones.sections(): + if zones.has_option(zone, "centroid"): + zonetable[zone] = { + "centroid": eval( zones.get(zone, "centroid") ) + } + for zone in sorted( zones.sections() ): + if zones.has_option(zone, "centroid"): + zonetable_local = zonetable.copy() + del( zonetable_local[zone] ) + centroid = eval( zones.get(zone, "centroid") ) + if centroid: + nearest = closest(centroid, zonetable_local, "centroid", 0.1) + if nearest[1]*radian_to_km < 1: + qalog.append( "%s: within one km of %s\n" % ( + zone, + nearest[0] + ) ) + zones_overlapping += 1 + else: + qalog.append("%s: no centroid\n" % zone) + zones_nocentroid += 1 + if not zones.has_option(zone, "description"): + qalog.append("%s: no description\n" % zone) + zones_nodescription += 1 + if not zones.has_option(zone, "zone_forecast"): + qalog.append("%s: no forecast\n" % zone) + zones_noforecast += 1 + if os.path.exists(qalog_fn): + os.rename(qalog_fn, "%s_old"%qalog_fn) + qalog_fd = codecs.open(qalog_fn, "w", "utf8") + qalog_fd.writelines(qalog) + qalog_fd.close() + if qalog: + print("issues found (see %s for details):"%qalog_fn) + if airports_badstation: + print(" %s airports with invalid station"%airports_badstation) + if airports_nostation: + print(" %s airports with no station"%airports_nostation) + if places_nocentroid: + print(" %s places with no centroid"%places_nocentroid) + if places_nodescription: + print(" %s places with no description"%places_nodescription) + if stations_nodescription: + print(" %s stations with no description"%stations_nodescription) + if stations_nolocation: + print(" %s stations with no location"%stations_nolocation) + if stations_nometar: + print(" %s stations with no METAR"%stations_nometar) + if zctas_nocentroid: + print(" %s ZCTAs with no centroid"%zctas_nocentroid) + if zones_nocentroid: + print(" %s zones with no centroid"%zones_nocentroid) + if zones_nodescription: + print(" %s zones with no description"%zones_nodescription) + if zones_noforecast: + print(" %s zones with no forecast"%zones_noforecast) + if zones_overlapping: + print(" %s zones within one km of another"%zones_overlapping) + else: print("no issues found.") + print("Indexing complete!") |