From fe3b8453b292ea7d68ca16a4e11fabf18557a5d2 Mon Sep 17 00:00:00 2001 From: tomrink <rink@ssec.wisc.edu> Date: Tue, 23 Apr 2024 13:56:31 -0500 Subject: [PATCH] snapshot... --- modules/util/hdf5_conversion.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/modules/util/hdf5_conversion.py b/modules/util/hdf5_conversion.py index 3ffef6f9..08dc02e0 100644 --- a/modules/util/hdf5_conversion.py +++ b/modules/util/hdf5_conversion.py @@ -1,6 +1,7 @@ import h5py import numpy as np import pandas as pd +import random def hdf5_to_npz_csv(hdf5_filename, output_file_prefix, chunk_size=10000): @@ -14,6 +15,15 @@ def hdf5_to_npz_csv(hdf5_filename, output_file_prefix, chunk_size=10000): chunk_size (int): Size of chunks to process at once (default is 1000). """ + # # New step: keep only 10 mask values == True + # mask_indices = list(np.nonzero(mask)[0]) + # if len(mask_indices) > 10: + # selected_indices = random.sample(mask_indices, 10) + # new_mask = np.zeros(mask.size).astype(np.bool) + # new_mask[selected_indices] = True + # mask = new_mask + # keep_array.append(data[mask]) + # Step 1: Open HDF5 file with h5py.File(hdf5_filename, "r") as file: fov_mask = np.asarray(file["FOV_mask"]) -- GitLab