X-Git-Url: https://www.yuggoth.org/gitweb?p=weather.git;a=blobdiff_plain;f=weather.py;h=47870ec51273b455bf6290d0b595d2ef3e727eff;hp=60067f25d4b197eb058c42d9ea9b027fcdb60641;hb=0cfa643cef2fb2594129ea92f16a590b150d1027;hpb=13eb635aca2bbd3c95b4a62e23333959b39ecc38 diff --git a/weather.py b/weather.py index 60067f2..47870ec 100644 --- a/weather.py +++ b/weather.py @@ -1328,15 +1328,21 @@ def correlate(): sys.stdout.flush() count = 0 gcounties = zipfile.ZipFile(gcounties_an).open(gcounties_fn, "rU") + columns = gcounties.readline().decode("latin1").strip().split("\t") for line in gcounties: fields = line.decode("latin1").strip().split("\t") - if len(fields) == 10 and fields[0] != "STUSPS": - fips = "fips%s" % fields[1] - description = "%s, %s" % ( fields[3], fields[0] ) - centroid = gecos( ",".join( fields[8:10] ) ) + f_geoid = fields[ columns.index("GEOID") ].strip() + f_name = fields[ columns.index("NAME") ].strip() + f_usps = fields[ columns.index("USPS") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_name and f_usps and f_intptlat and f_intptlong: + fips = "fips%s" % f_geoid if fips not in places: places[fips] = {} - places[fips]["centroid"] = centroid - places[fips]["description"] = description + places[fips]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) + ) + places[fips]["description"] = "%s, %s" % (f_name, f_usps) count += 1 gcounties.close() print("done (%s lines)." % count) @@ -1345,15 +1351,21 @@ def correlate(): sys.stdout.flush() count = 0 gcousubs = zipfile.ZipFile(gcousubs_an).open(gcousubs_fn, "rU") + columns = gcousubs.readline().decode("latin1").strip().split("\t") for line in gcousubs: fields = line.decode("latin1").strip().split("\t") - if len(fields) == 10 and fields[0] != "STUSPS": - fips = "fips%s" % fields[1] - description = "%s, %s" % ( fields[3], fields[0] ) - centroid = gecos( ",".join( fields[8:10] ) ) + f_geoid = fields[ columns.index("GEOID") ].strip() + f_name = fields[ columns.index("NAME") ].strip() + f_usps = fields[ columns.index("USPS") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_name and f_usps and f_intptlat and f_intptlong: + fips = "fips%s" % f_geoid if fips not in places: places[fips] = {} - places[fips]["centroid"] = centroid - places[fips]["description"] = description + places[fips]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) + ) + places[fips]["description"] = "%s, %s" % (f_name, f_usps) count += 1 gcousubs.close() print("done (%s lines)." % count) @@ -1362,15 +1374,21 @@ def correlate(): sys.stdout.flush() count = 0 gplaces = zipfile.ZipFile(gplaces_an).open(gplaces_fn, "rU") + columns = gplaces.readline().decode("latin1").strip().split("\t") for line in gplaces: fields = line.decode("latin1").strip().split("\t") - if len(fields) == 10 and fields[0] != "STUSPS": - fips = "fips%s" % fields[1] - description = "%s, %s" % ( fields[3], fields[0] ) - centroid = gecos( ",".join( fields[8:10] ) ) + f_geoid = fields[ columns.index("GEOID") ].strip() + f_name = fields[ columns.index("NAME") ].strip() + f_usps = fields[ columns.index("USPS") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_name and f_usps and f_intptlat and f_intptlong: + fips = "fips%s" % f_geoid if fips not in places: places[fips] = {} - places[fips]["centroid"] = centroid - places[fips]["description"] = description + places[fips]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) + ) + places[fips]["description"] = "%s, %s" % (f_name, f_usps) count += 1 gplaces.close() print("done (%s lines)." % count) @@ -1562,13 +1580,16 @@ def correlate(): sys.stdout.flush() count = 0 gzcta = zipfile.ZipFile(gzcta_an).open(gzcta_fn, "rU") + columns = gzcta.readline().decode("latin1").strip().split("\t") for line in gzcta: fields = line.decode("latin1").strip().split("\t") - if len(fields) == 7 and fields[0] != "GEOID": - zcta = fields[0] - if zcta not in zctas: zctas[zcta] = {} - zctas[zcta]["centroid"] = gecos( - ",".join( ( fields[6], fields[5] ) ) + f_geoid = fields[ columns.index("GEOID") ].strip() + f_intptlat = fields[ columns.index("INTPTLAT") ].strip() + f_intptlong = fields[ columns.index("INTPTLONG") ].strip() + if f_geoid and f_intptlat and f_intptlong: + if f_geoid not in zctas: zctas[f_geoid] = {} + zctas[f_geoid]["centroid"] = gecos( + "%s,%s" % (f_intptlat, f_intptlong) ) count += 1 gzcta.close() @@ -1890,6 +1911,7 @@ def correlate(): for key, value in sorted( airports[airport].items() ): airports_fd.write( "\n%s = %s" % (key, value) ) count += 1 + airports_fd.write("\n") airports_fd.close() print("done (%s sections)." % count) message = "Writing %s..." % places_fn @@ -1905,6 +1927,7 @@ def correlate(): for key, value in sorted( places[fips].items() ): places_fd.write( "\n%s = %s" % (key, value) ) count += 1 + places_fd.write("\n") places_fd.close() print("done (%s sections)." % count) message = "Writing %s..." % stations_fn @@ -1920,6 +1943,7 @@ def correlate(): for key, value in sorted( stations[station].items() ): stations_fd.write( "\n%s = %s" % (key, value) ) count += 1 + stations_fd.write("\n") stations_fd.close() print("done (%s sections)." % count) message = "Writing %s..." % zctas_fn @@ -1935,6 +1959,7 @@ def correlate(): for key, value in sorted( zctas[zcta].items() ): zctas_fd.write( "\n%s = %s" % (key, value) ) count += 1 + zctas_fd.write("\n") zctas_fd.close() print("done (%s sections)." % count) message = "Writing %s..." % zones_fn @@ -1950,6 +1975,7 @@ def correlate(): for key, value in sorted( zones[zone].items() ): zones_fd.write( "\n%s = %s" % (key, value) ) count += 1 + zones_fd.write("\n") zones_fd.close() print("done (%s sections)." % count) message = "Starting QA check..."