diff --git a/modules/icing/pirep_goes.py b/modules/icing/pirep_goes.py index 7d1601f66962ca5cff5d9424e5203735910a0348..9e8a7a4048da7727dc611673b39fc7ee1a793eeb 100644 --- a/modules/icing/pirep_goes.py +++ b/modules/icing/pirep_goes.py @@ -474,8 +474,36 @@ def analyze(ice_dct, no_ice_dct): print(dt_str[2:]) +lon_space_hdeg = np.linspace(-180, 180, 721) +lat_space_hdeg = np.linspace(-90, 90, 361) +# grd_bins = np.full((lat_space.shape[0], lon_space.shape[0]), t_delta) + + +def check_no_overlap(lon, lat, ts, grd_bins, t_delta=600.0): + + grd_x_hi = lon_space.shape[0] - 1 + grd_y_hi = lat_space.shape[0] - 1 + + lon_idx = np.searchsorted(lon_space_hdeg, lon) + lat_idx = np.searchsorted(lat_space_hdeg, lat) + + if lon_idx < 0 or lon_idx > grd_x_hi: + return False + if lat_idx < 0 or lat_idx > grd_y_hi: + return False + + last_ts = grd_bins[lat_idx, lon_idx] + if ts - last_ts > t_delta: + grd_bins[lat_idx, lon_idx] = ts + return True + else: + return False + + # This mostly reduces some categories for a degree of class balancing and removes no intensity reports def process(ice_dct, no_ice_dct, neg_ice_dct): + t_delta = 600 # seconds + new_ice_dct = {} new_no_ice_dct = {} new_neg_ice_dct = {} @@ -526,10 +554,12 @@ def process(ice_dct, no_ice_dct, neg_ice_dct): no_ice_tidx.append(idx) neg_ice_keys = [] + neg_ice_tidx = [] for ts in list(neg_ice_dct.keys()): - rpts = neg_ice_dct[ts] - for tup in rpts: - neg_ice_keys.append(ts) + rpts = neg_ice_dct[ts] + for idx, tup in enumerate(rpts): + neg_ice_keys.append(ts) + neg_ice_tidx.append(idx) print('num ice reports, no ice, neg ice: ', num_ice_reports, len(no_ice_keys), len(neg_ice_keys)) print('------------------------------------------------') @@ -571,15 +601,23 @@ def process(ice_dct, no_ice_dct, neg_ice_dct): ice_keys = ice_keys[sidxs] ice_tidx = ice_tidx[sidxs] + grd_bins = np.full((lat_space_hdeg.shape[0], lon_space_hdeg.shape[0]), -(t_delta+1)) + cnt = 0 for idx, key in enumerate(ice_keys): rpts = ice_dct[key] + tup = rpts[ice_tidx[idx]] + lat, lon = tup[0], tup[1] + if not check_no_overlap(lon, lat, key, grd_bins, t_delta=t_delta): + continue + cnt += 1 n_rpts = new_ice_dct.get(key) if n_rpts is None: n_rpts = [] new_ice_dct[key] = n_rpts n_rpts.append(tup) + print('icing total no overlap: ', cnt) # ----------------------------------------------------- no_ice_keys = np.array(no_ice_keys) @@ -589,35 +627,68 @@ def process(ice_dct, no_ice_dct, neg_ice_dct): ridxs = np.random.permutation(np.arange(no_ice_keys.shape[0])) no_ice_keys = no_ice_keys[ridxs] no_ice_tidx = no_ice_tidx[ridxs] - no_ice_keys = no_ice_keys[::10] - no_ice_tidx = no_ice_tidx[::10] + no_ice_keys = no_ice_keys[::5] + no_ice_tidx = no_ice_tidx[::5] print('no ice reduced: ', no_ice_keys.shape[0]) sidxs = np.argsort(no_ice_keys) no_ice_keys = no_ice_keys[sidxs] no_ice_tidx = no_ice_tidx[sidxs] + grd_bins = np.full((lat_space_hdeg.shape[0], lon_space_hdeg.shape[0]), -(t_delta+1)) + cnt = 0 for idx, key in enumerate(no_ice_keys): rpts = no_ice_dct[key] tup = rpts[no_ice_tidx[idx]] + lat, lon = tup[0], tup[1] + if not check_no_overlap(lon, lat, key, grd_bins, t_delta=t_delta): + continue + cnt += 1 + n_rpts = new_no_ice_dct.get(key) if n_rpts is None: n_rpts = [] new_no_ice_dct[key] = n_rpts n_rpts.append(tup) + print('no icing total no overlap: ', cnt) # ------------------------------------------------- + # Previous for neg icing + # neg_ice_keys = np.array(neg_ice_keys) + # print('neg ice total: ', neg_ice_keys.shape[0]) + # np.random.seed(42) + # np.random.shuffle(neg_ice_keys) + # neg_ice_keys = neg_ice_keys[0:12000] + # uniq_sorted_neg_ice = np.unique(neg_ice_keys) + # print('neg ice reduced: ', uniq_sorted_neg_ice.shape) + # + # for key in uniq_sorted_neg_ice: + # new_neg_ice_dct[key] = neg_ice_dct[key] + + # ----------------------------------------------------- neg_ice_keys = np.array(neg_ice_keys) + neg_ice_tidx = np.array(neg_ice_tidx) print('neg ice total: ', neg_ice_keys.shape[0]) - np.random.seed(42) - np.random.shuffle(neg_ice_keys) - neg_ice_keys = neg_ice_keys[0:12000] - uniq_sorted_neg_ice = np.unique(neg_ice_keys) - print('neg ice reduced: ', uniq_sorted_neg_ice.shape) - for key in uniq_sorted_neg_ice: - new_neg_ice_dct[key] = neg_ice_dct[key] + grd_bins = np.full((lat_space_hdeg.shape[0], lon_space_hdeg.shape[0]), -(t_delta+1)) + cnt = 0 + for idx, key in enumerate(neg_ice_keys): + rpts = neg_ice_dct[key] + tup = rpts[neg_ice_tidx[idx]] + + lat, lon = tup[0], tup[1] + if not check_no_overlap(lon, lat, key, grd_bins, t_delta=t_delta): + continue + cnt += 1 + + n_rpts = new_neg_ice_dct.get(key) + if n_rpts is None: + n_rpts = [] + new_neg_ice_dct[key] = n_rpts + n_rpts.append(tup) + print('neg icing total no overlap: ', cnt) + # ------------------------------------------------- return new_ice_dct, new_no_ice_dct, new_neg_ice_dct