sondehub-infra/lambda/recovery_ingest/__init__.py

131 lines
5.3 KiB
Python
Raw Normal View History

2022-01-26 04:21:51 +00:00
from datetime import datetime
2022-01-26 04:21:18 +00:00
import urllib.request
import json
2022-01-26 04:21:51 +00:00
import os
2022-01-26 04:21:18 +00:00
2022-01-28 10:31:27 +00:00
apiKey = os.environ["radiosondy_apikey"]
2022-01-26 04:21:51 +00:00
params = "?token={}&period=2".format(apiKey)
2022-01-26 04:21:18 +00:00
url = "https://radiosondy.info/api/v1/sonde-logs{}".format(params)
recoveryUrl = "https://api.v2.sondehub.org/recovered"
searchUrl = "https://api.v2.sondehub.org/sondes"
2022-01-26 05:02:26 +00:00
# Main function
def handler(event,context):
response = urllib.request.urlopen(url)
data = json.load(response)
2022-01-26 05:04:37 +00:00
processReports(data)
2022-01-26 04:21:18 +00:00
2022-01-26 04:21:51 +00:00
# Check exisiting SondeHub recovery reports
2022-01-26 04:21:18 +00:00
def checkExisting(serial, recovered):
# Get SondeHub recoveries for serial
recoveryCheckParams = "?serial={}".format(serial)
recoveryCheckUrl = recoveryUrl + recoveryCheckParams
recoveryCheckResponse = urllib.request.urlopen(recoveryCheckUrl)
recoveryCheckData = json.load(recoveryCheckResponse)
# No recovery reports for serial
if len(recoveryCheckData) == 0:
return True
# Not recovered report and we have recovered
if recoveryCheckData[0]["recovered"] == False and recovered == True:
return True
# Valid recovery report already exists
return False
2022-01-26 04:21:51 +00:00
# Attempt to find SondeHub serial for a Radiosony.info serial
2022-01-26 04:21:18 +00:00
def findSonde(recovery, lat, lon):
# Get facts to compare against
launchTime = datetime.strptime(recovery["start_time"], "%Y-%m-%d %H:%M:%S")
sondeType = recovery["radiosonde"]["type"]
sondeFrequency = recovery["radiosonde"]["qrg"]
# Determine how far back to query
nowTime = datetime.utcnow()
searchDifference = nowTime - launchTime
searchSeconds = round(searchDifference.total_seconds()) + 10800 # Search from 3 hours before reported launch
2022-01-26 04:21:18 +00:00
# Geographical SondeHub search
searchParams = "?lat={}&lon={}&distance=2000&last={}".format(lat, lon, searchSeconds)
2022-01-26 04:21:18 +00:00
searchCompletedUrl = searchUrl + searchParams
searchResponse = urllib.request.urlopen(searchCompletedUrl)
searchData = json.load(searchResponse)
serial = None
# Check all returned sondes
for key, value in searchData.items():
receivedTime = datetime.strptime(value["datetime"], "%Y-%m-%dT%H:%M:%S.%fZ")
timeDifference = receivedTime - launchTime
if timeDifference.total_seconds() < 10800: # 3 Hours or less
2022-01-26 04:21:18 +00:00
if value["type"] in sondeType: # Type matches
if abs(float(sondeFrequency) - float(value["frequency"])) < 0.05: # 0.05 MHz or less
serial = key
return serial
2022-01-26 04:21:51 +00:00
# Process each recovery report from Radiosondy.info
2022-01-26 05:04:37 +00:00
def processReports(data):
2022-01-26 05:02:26 +00:00
for recovery in data["results"]:
# Get recovery status
if recovery["log_info"]["status"] == "FOUND":
2022-01-26 05:02:26 +00:00
recovered = True
elif recovery["log_info"]["status"] == "NEED ATTENTION":
recovered = False
elif recovery["log_info"]["status"] == "LOST":
2022-01-26 05:02:26 +00:00
recovered = False
else:
2022-01-26 04:21:18 +00:00
continue
2022-01-26 05:02:26 +00:00
# Get finder if available
if recovery["log_info"]["finder"] is not None:
recovered_by = recovery["log_info"]["finder"]
elif "[BOT]" not in recovery["log_info"]["added_by"]:
recovered_by = recovery["log_info"]["added_by"]
2022-01-26 05:02:26 +00:00
else:
continue
2022-01-26 04:21:18 +00:00
2022-01-26 05:02:26 +00:00
# Import time
recovered_time = datetime.strptime(recovery["log_info"]["log_added"], "%Y-%m-%d %H:%M:%S")
# Get comment and add attribution
description = recovery["log_info"]["comment"]
description += " [via Radiosondy.info]"
description = description.lstrip()
if recovery["log_info"]["found_coordinates"]["latitude"] != "0" and recovery["log_info"]["found_coordinates"]["longitude"] != "0":
lat = float(recovery["log_info"]["found_coordinates"]["latitude"])
lon = float(recovery["log_info"]["found_coordinates"]["longitude"])
else:
continue
# Use the reported serial number for RS41/RS92
if "RS41" in recovery["radiosonde"]["type"] or "RS92" in recovery["radiosonde"]["type"]:
serial = recovery["radiosonde"]["number"]
# Remove D prefix for DFM
elif "DFM" in recovery["radiosonde"]["type"]:
serial = recovery["radiosonde"]["number"][1:]
2022-01-26 05:02:26 +00:00
# Try to find serial in SondeHub database for others
else:
serial = findSonde(recovery, lat, lon)
if serial is None:
print("{}: could not match to SondeHub serial".format(recovery["radiosonde"]["number"]))
2022-01-26 05:02:26 +00:00
continue
# Check if a valid recovery already exists
if checkExisting(serial, recovered) == False:
print("{}: recovery already exists".format(serial))
continue
# Format data for upload
recoveryPutData = {"datetime": recovered_time.isoformat(), "serial": serial, "lat": lat, "lon": lon, "recovered": recovered, "recovered_by": recovered_by, "description": description}
recoveryPutData = str(json.dumps(recoveryPutData)).encode('utf-8')
print("{}: {}".format(serial, recoveryPutData))
# Upload data
recoveryPutRequest = urllib.request.Request(recoveryUrl, data=recoveryPutData, method="PUT")
print("{}: {}".format(serial, urllib.request.urlopen(recoveryPutRequest).read().decode('utf-8')))