From 1ba0a6c266bf9877369922147c48a2abfa6f306c Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Thu, 1 Feb 2024 11:13:53 -0500 Subject: [PATCH 01/27] Initial commit --- src/kbmod/search/kernels.cu | 62 ++++--- src/kbmod/search/psi_phi_array_utils.h | 33 ---- src/kbmod/search/pydocs/psi_phi_array_docs.h | 95 ++++++---- .../{psi_phi_array.cpp => search_data.cpp} | 163 ++++++++++++------ .../{psi_phi_array_ds.h => search_data_ds.h} | 53 +++--- src/kbmod/search/search_data_utils.h | 39 +++++ src/kbmod/search/stack_search.cpp | 11 +- 7 files changed, 287 insertions(+), 169 deletions(-) delete mode 100644 src/kbmod/search/psi_phi_array_utils.h rename src/kbmod/search/{psi_phi_array.cpp => search_data.cpp} (67%) rename src/kbmod/search/{psi_phi_array_ds.h => search_data_ds.h} (68%) create mode 100644 src/kbmod/search/search_data_utils.h diff --git a/src/kbmod/search/kernels.cu b/src/kbmod/search/kernels.cu index 84b6cf249..2accdb171 100644 --- a/src/kbmod/search/kernels.cu +++ b/src/kbmod/search/kernels.cu @@ -19,29 +19,45 @@ #include "common.h" #include "cuda_errors.h" -#include "psi_phi_array_ds.h" +#include "search_data_ds.h" namespace search { -extern "C" void device_allocate_psi_phi_array(PsiPhiArray *data) { - if (!data->cpu_array_allocated()) throw std::runtime_error("CPU data is not allocated."); - if (data->gpu_array_allocated()) throw std::runtime_error("GPU data is already allocated."); +extern "C" void device_allocate_search_data_arrays(SearchData *data) { + if (!data->cpu_array_allocated() || !data->cpu_time_array_allocated()) { + throw std::runtime_error("CPU data is not allocated."); + } + if (data->gpu_array_allocated() || data->gpu_time_array_allocated()) { + throw std::runtime_error("GPU data is already allocated."); + } + // Allocate space for the psi/phi data. 
void *device_array_ptr; checkCudaErrors(cudaMalloc((void **)&device_array_ptr, data->get_total_array_size())); checkCudaErrors(cudaMemcpy(device_array_ptr, data->get_cpu_array_ptr(), data->get_total_array_size(), cudaMemcpyHostToDevice)); data->set_gpu_array_ptr(device_array_ptr); + + // Allocate space for the times data. + float *device_times_ptr; + long unsigned time_bytes = data->get_num_times() * sizeof(float); + checkCudaErrors(cudaMalloc((void **)&device_times_ptr, time_bytes)); + checkCudaErrors(cudaMemcpy(device_times_ptr, data->get_cpu_time_array_ptr(), time_bytes, cudaMemcpyHostToDevice)); + data->set_gpu_time_array_ptr(device_times_ptr); } -extern "C" void device_free_psi_phi_array(PsiPhiArray *data) { +extern "C" void device_free_search_data_arrays(SearchData *data) { if (data->gpu_array_allocated()) { checkCudaErrors(cudaFree(data->get_gpu_array_ptr())); data->set_gpu_array_ptr(nullptr); } + if (data->gpu_time_array_allocated()) { + checkCudaErrors(cudaFree(data->get_gpu_time_array_ptr())); + data->set_gpu_time_array_ptr(nullptr); + } } -__forceinline__ __device__ PsiPhi read_encoded_psi_phi(PsiPhiArrayMeta ¶ms, void *psi_phi_vect, int time, +__forceinline__ __device__ PsiPhi read_encoded_psi_phi(SearchDataMeta ¶ms, void *psi_phi_vect, int time, int row, int col) { // Bounds checking. if ((row < 0) || (col < 0) || (row >= params.height) || (col >= params.width)) { @@ -130,7 +146,7 @@ extern "C" __device__ __host__ void SigmaGFilteredIndicesCU(float *values, int n * * Creates a local copy of psi_phi_meta and params in local memory space. */ -__global__ void searchFilterImages(PsiPhiArrayMeta psi_phi_meta, void *psi_phi_vect, float *image_times, +__global__ void searchFilterImages(SearchDataMeta psi_phi_meta, void *psi_phi_vect, float *image_times, SearchParameters params, int num_trajectories, Trajectory *trajectories, Trajectory *results) { // Get the x and y coordinates within the search space. 
@@ -257,24 +273,25 @@ __global__ void searchFilterImages(PsiPhiArrayMeta psi_phi_meta, void *psi_phi_v } } -extern "C" void deviceSearchFilter(PsiPhiArray &psi_phi_array, float *image_times, SearchParameters params, - int num_trajectories, Trajectory *trj_to_search, int num_results, - Trajectory *best_results) { +extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters params, int num_trajectories, + Trajectory *trj_to_search, int num_results, Trajectory *best_results) { // Allocate Device memory Trajectory *device_tests; - float *device_img_times; Trajectory *device_search_results; // Check the hard coded maximum number of images against the num_images. - int num_images = psi_phi_array.get_num_times(); + int num_images = search_data.get_num_times(); if (num_images > MAX_NUM_IMAGES) { throw std::runtime_error("Number of images exceeds GPU maximum."); } - // Check that the device psi_phi vector has been allocated. - if (psi_phi_array.gpu_array_allocated() == false) { + // Check that the device vectors have already been allocated. + if (search_data.gpu_array_allocated() == false) { throw std::runtime_error("PsiPhi data has not been created."); } + if (search_data.gpu_time_array_allocated() == false) { + throw std::runtime_error("GPU time data has not been created."); + } // Copy trajectories to search if (params.debug) { @@ -285,14 +302,6 @@ extern "C" void deviceSearchFilter(PsiPhiArray &psi_phi_array, float *image_time checkCudaErrors(cudaMemcpy(device_tests, trj_to_search, sizeof(Trajectory) * num_trajectories, cudaMemcpyHostToDevice)); - // Copy the time vector. - if (params.debug) { - printf("Allocating GPU memory for time data using %lu bytes.\n", sizeof(float) * num_images); - } - checkCudaErrors(cudaMalloc((void **)&device_img_times, sizeof(float) * num_images)); - checkCudaErrors( - cudaMemcpy(device_img_times, image_times, sizeof(float) * num_images, cudaMemcpyHostToDevice)); - // Allocate space for the results. 
if (params.debug) { printf("Allocating GPU memory for %i results using %lu bytes.\n", num_results, sizeof(Trajectory) * num_results); @@ -308,17 +317,16 @@ extern "C" void deviceSearchFilter(PsiPhiArray &psi_phi_array, float *image_time dim3 threads(THREAD_DIM_X, THREAD_DIM_Y); // Launch Search - searchFilterImages<<>>(psi_phi_array.get_meta_data(), psi_phi_array.get_gpu_array_ptr(), - device_img_times, params, num_trajectories, device_tests, - device_search_results); + searchFilterImages<<>>(search_data.get_meta_data(), search_data.get_gpu_array_ptr(), + static_cast(search_data.get_gpu_time_array_ptr()), params, + num_trajectories, device_tests, device_search_results); // Read back results checkCudaErrors(cudaMemcpy(best_results, device_search_results, sizeof(Trajectory) * num_results, cudaMemcpyDeviceToHost)); - // Free the on GPU memory. + // Free the on GPU memory for this specific search. checkCudaErrors(cudaFree(device_search_results)); - checkCudaErrors(cudaFree(device_img_times)); checkCudaErrors(cudaFree(device_tests)); } diff --git a/src/kbmod/search/psi_phi_array_utils.h b/src/kbmod/search/psi_phi_array_utils.h deleted file mode 100644 index c363f65d4..000000000 --- a/src/kbmod/search/psi_phi_array_utils.h +++ /dev/null @@ -1,33 +0,0 @@ -/* - * psi_phi_array_utils.h - * - * The utility functions for the psi/phi array. Broken out from the header - * data structure so that it can use packages that won't be imported into the - * CUDA kernel, such as Eigen. - * - * Created on: Dec 8, 2023 - */ - -#ifndef PSI_PHI_ARRAY_UTILS_ -#define PSI_PHI_ARRAY_UTILS_ - -#include -#include -#include -#include - -#include "common.h" -#include "psi_phi_array_ds.h" -#include "raw_image.h" - -namespace search { - -// Compute the min, max, and scale parameter from the a vector of image data. 
-std::array compute_scale_params_from_image_vect(const std::vector& imgs, int num_bytes); - -void fill_psi_phi_array(PsiPhiArray& result_data, int num_bytes, const std::vector& psi_imgs, - const std::vector& phi_imgs, bool debug = false); - -} /* namespace search */ - -#endif /* PSI_PHI_ARRAY_UTILS_ */ diff --git a/src/kbmod/search/pydocs/psi_phi_array_docs.h b/src/kbmod/search/pydocs/psi_phi_array_docs.h index ffb7b009f..4f668e3ea 100644 --- a/src/kbmod/search/pydocs/psi_phi_array_docs.h +++ b/src/kbmod/search/pydocs/psi_phi_array_docs.h @@ -1,5 +1,5 @@ -#ifndef PSI_PHI_ARRAY_DOCS -#define PSI_PHI_ARRAY_DOCS +#ifndef SEARCH_DATA_DOCS +#define SEARCH_DATA_DOCS namespace pydocs { @@ -14,80 +14,88 @@ static const auto DOC_PsiPhi = R"doc( The phi value at a pixel. )doc"; -static const auto DOC_PsiPhiArray = R"doc( +static const auto DOC_SearchData = R"doc( An encoded array of Psi and Phi values along with their meta data. )doc"; -static const auto DOC_PsiPhiArray_get_num_bytes = R"doc( +static const auto DOC_SearchData_get_num_bytes = R"doc( The target number of bytes to use for encoding the data (1 for uint8, 2 for uint16, or 4 for float32). Might differ from actual number of bytes (block_size). )doc"; -static const auto DOC_PsiPhiArray_get_num_times = R"doc( +static const auto DOC_SearchData_get_num_times = R"doc( The number of times. )doc"; -static const auto DOC_PsiPhiArray_get_width = R"doc( +static const auto DOC_SearchData_get_width = R"doc( The image width. )doc"; -static const auto DOC_PsiPhiArray_get_height = R"doc( +static const auto DOC_SearchData_get_height = R"doc( The image height. )doc"; -static const auto DOC_PsiPhiArray_get_pixels_per_image = R"doc( +static const auto DOC_SearchData_get_pixels_per_image = R"doc( The number of pixels per each image. )doc"; -static const auto DOC_PsiPhiArray_get_num_entries = R"doc( +static const auto DOC_SearchData_get_num_entries = R"doc( The number of array entries. 
)doc"; -static const auto DOC_PsiPhiArray_get_total_array_size = R"doc( +static const auto DOC_SearchData_get_total_array_size = R"doc( The size of the array in bytes. )doc"; -static const auto DOC_PsiPhiArray_get_block_size = R"doc( +static const auto DOC_SearchData_get_block_size = R"doc( The size of a single entry in bytes. )doc"; -static const auto DOC_PsiPhiArray_get_psi_min_val = R"doc( +static const auto DOC_SearchData_get_psi_min_val = R"doc( The minimum value of psi used in the scaling computations. )doc"; -static const auto DOC_PsiPhiArray_get_psi_max_val = R"doc( +static const auto DOC_SearchData_get_psi_max_val = R"doc( The maximum value of psi used in the scaling computations. )doc"; -static const auto DOC_PsiPhiArray_get_psi_scale = R"doc( +static const auto DOC_SearchData_get_psi_scale = R"doc( The scaling parameter for psi. )doc"; -static const auto DOC_PsiPhiArray_get_phi_min_val = R"doc( +static const auto DOC_SearchData_get_phi_min_val = R"doc( The minimum value of phi used in the scaling computations. )doc"; -static const auto DOC_PsiPhiArray_get_phi_max_val = R"doc( +static const auto DOC_SearchData_get_phi_max_val = R"doc( The maximum value of phi used in the scaling computations. )doc"; -static const auto DOC_PsiPhiArray_get_phi_scale = R"doc( +static const auto DOC_SearchData_get_phi_scale = R"doc( The scaling parameter for phi. )doc"; -static const auto DOC_PsiPhiArray_get_cpu_array_allocated = R"doc( - A Boolean indicating whether the cpu array exists. +static const auto DOC_SearchData_get_cpu_array_allocated = R"doc( + A Boolean indicating whether the cpu data (psi/phi) array exists. )doc"; -static const auto DOC_PsiPhiArray_get_gpu_array_allocated = R"doc( - A Boolean indicating whether the gpu array exists. +static const auto DOC_SearchData_get_gpu_array_allocated = R"doc( + A Boolean indicating whether the gpu data (psi/phi) array exists. 
)doc"; -static const auto DOC_PsiPhiArray_clear = R"doc( +static const auto DOC_SearchData_get_cpu_time_array_allocated = R"doc( + A Boolean indicating whether the cpu time array exists. + )doc"; + +static const auto DOC_SearchData_get_gpu_time_array_allocated = R"doc( + A Boolean indicating whether the gpu time array exists. + )doc"; + +static const auto DOC_SearchData_clear = R"doc( Clear all data and free the arrays. )doc"; -static const auto DOC_PsiPhiArray_read_psi_phi = R"doc( +static const auto DOC_SearchData_read_psi_phi = R"doc( Read a PsiPhi value from the CPU array. Parameters @@ -105,9 +113,23 @@ static const auto DOC_PsiPhiArray_read_psi_phi = R"doc( The pixel values. )doc"; -static const auto DOC_PsiPhiArray_set_meta_data = R"doc( +static const auto DOC_SearchData_read_time = R"doc( + Read a zeroed time value from the CPU array. + + Parameters + ---------- + time : `int` + The timestep to read. + + Returns + ------- + `float` + The time. + )doc"; + +static const auto DOC_SearchData_set_meta_data = R"doc( Set the meta data for the array. Automatically called by - fill_psi_phi_array(). + fill_search_data(). Parameters ---------- @@ -121,12 +143,12 @@ static const auto DOC_PsiPhiArray_set_meta_data = R"doc( The width of each image in pixels. )doc"; -static const auto DOC_PsiPhiArray_fill_psi_phi_array = R"doc( - Fill the PsiPhiArray from Psi and Phi images. +static const auto DOC_SearchData_fill_search_data = R"doc( + Fill the SearchData from Psi and Phi images. Parameters ---------- - result_data : `PsiPhiArray` + result_data : `SearchData` The location to store the data. num_bytes : `int` The type of encoding to use (1, 2, or 4). @@ -134,8 +156,23 @@ static const auto DOC_PsiPhiArray_fill_psi_phi_array = R"doc( A list of psi images. phi_imgs : `list` A list of phi images. + zeroed_times : `list` + A list of floating point times starting at zero. 
+ )doc"; + +static const auto DOC_SearchData_fill_search_data_from_image_stack = R"doc( + Fill the SearchData an ImageStack. + + Parameters + ---------- + result_data : `SearchData` + The location to store the data. + num_bytes : `int` + The type of encoding to use (1, 2, or 4). + stack : `ImageStack` + The stack of LayeredImages from which to build the psi and phi images. )doc"; } // namespace pydocs -#endif /* PSI_PHI_ARRAY_DOCS */ +#endif /* SEARCH_DATA_DOCS */ diff --git a/src/kbmod/search/psi_phi_array.cpp b/src/kbmod/search/search_data.cpp similarity index 67% rename from src/kbmod/search/psi_phi_array.cpp rename to src/kbmod/search/search_data.cpp index 3f2656680..4331f7792 100644 --- a/src/kbmod/search/psi_phi_array.cpp +++ b/src/kbmod/search/search_data.cpp @@ -1,43 +1,41 @@ -#include "psi_phi_array_ds.h" -#include "psi_phi_array_utils.h" -#include "pydocs/psi_phi_array_docs.h" +#include "search_data_ds.h" +#include "search_data_utils.h" +#include "pydocs/search_data_docs.h" namespace search { // Declaration of CUDA functions that will be linked in. #ifdef HAVE_CUDA -extern "C" void device_allocate_psi_phi_array(PsiPhiArray* data); +extern "C" void device_allocate_search_data_arrays(SearchData* data); -extern "C" void device_free_psi_phi_array(PsiPhiArray* data); +extern "C" void device_free_search_data_arrays(SearchData* data); #endif // ------------------------------------------------------- // --- Implementation of core data structure functions --- // ------------------------------------------------------- -PsiPhiArray::PsiPhiArray() {} +SearchData::SearchData() {} -PsiPhiArray::~PsiPhiArray() { - if (cpu_array_ptr != nullptr) { - free(cpu_array_ptr); - } -#ifdef HAVE_CUDA - if (gpu_array_ptr != nullptr) { - device_free_psi_phi_array(this); - } -#endif +SearchData::~SearchData() { + clear(); } -void PsiPhiArray::clear() { +void SearchData::clear() { // Free all used memory on CPU and GPU. 
if (cpu_array_ptr != nullptr) { free(cpu_array_ptr); cpu_array_ptr = nullptr; } + if (cpu_time_array != nullptr) { + free(cpu_time_array); + cpu_array_ptr = nullptr; + } #ifdef HAVE_CUDA - if (gpu_array_ptr != nullptr) { - device_free_psi_phi_array(this); + if ((gpu_array_ptr != nullptr) || (gpu_time_array != nullptr)) { + device_free_search_data_arrays(this); gpu_array_ptr = nullptr; + gpu_time_array = nullptr; } #endif @@ -58,7 +56,7 @@ void PsiPhiArray::clear() { meta_data.phi_scale = 1.0; } -void PsiPhiArray::set_meta_data(int new_num_bytes, int new_num_times, int new_height, int new_width) { +void SearchData::set_meta_data(int new_num_bytes, int new_num_times, int new_height, int new_width) { // Validity checking of parameters. if (new_num_bytes != -1 && new_num_bytes != 1 && new_num_bytes != 2 && new_num_bytes != 4) { throw std::runtime_error("Invalid setting of num_bytes. Must be (-1 [use default], 1, 2, or 4)."); @@ -90,7 +88,7 @@ void PsiPhiArray::set_meta_data(int new_num_bytes, int new_num_times, int new_he meta_data.total_array_size = meta_data.block_size * meta_data.num_entries; } -void PsiPhiArray::set_psi_scaling(float min_val, float max_val, float scale_val) { +void SearchData::set_psi_scaling(float min_val, float max_val, float scale_val) { if (min_val > max_val) throw std::runtime_error("Min value needs to be < max value"); if (scale_val <= 0) throw std::runtime_error("Scale value must be greater than zero."); meta_data.psi_min_val = min_val; @@ -98,7 +96,7 @@ void PsiPhiArray::set_psi_scaling(float min_val, float max_val, float scale_val) meta_data.psi_scale = scale_val; } -void PsiPhiArray::set_phi_scaling(float min_val, float max_val, float scale_val) { +void SearchData::set_phi_scaling(float min_val, float max_val, float scale_val) { if (min_val > max_val) throw std::runtime_error("Min value needs to be < max value"); if (scale_val <= 0) throw std::runtime_error("Scale value must be greater than zero."); meta_data.phi_min_val = min_val; @@ 
-106,7 +104,7 @@ void PsiPhiArray::set_phi_scaling(float min_val, float max_val, float scale_val) meta_data.phi_scale = scale_val; } -PsiPhi PsiPhiArray::read_psi_phi(int time, int row, int col) { +PsiPhi SearchData::read_psi_phi(int time, int row, int col) { PsiPhi result = {NO_DATA, NO_DATA}; // Array allocation and bounds checking. @@ -140,6 +138,15 @@ PsiPhi PsiPhiArray::read_psi_phi(int time, int row, int col) { return result; } +float SearchData::read_time(int time_index) { + if (cpu_time_array == nullptr) throw std::runtime_error("Read from unallocated times array."); + if ((time_index < 0 )|| (time_index >= meta_data.num_times)) { + throw std::runtime_error("Out of bounds read for time step=%i", time_index); + } + return cpu_time_array[time_index]; +} + + // ------------------------------------------- // --- Implementation of utility functions --- // ------------------------------------------- @@ -171,7 +178,7 @@ std::array compute_scale_params_from_image_vect(const std::vector -void set_encode_cpu_psi_phi_array(PsiPhiArray& data, const std::vector& psi_imgs, +void set_encode_cpu_search_data(SearchData& data, const std::vector& psi_imgs, const std::vector& phi_imgs, bool debug) { if (data.get_cpu_array_ptr() != nullptr) { throw std::runtime_error("CPU PsiPhi already allocated."); @@ -215,7 +222,7 @@ void set_encode_cpu_psi_phi_array(PsiPhiArray& data, const std::vector data.set_cpu_array_ptr((void*)encoded); } -void set_float_cpu_psi_phi_array(PsiPhiArray& data, const std::vector& psi_imgs, +void set_float_cpu_search_data(SearchData& data, const std::vector& psi_imgs, const std::vector& phi_imgs, bool debug) { if (data.get_cpu_array_ptr() != nullptr) { throw std::runtime_error("CPU PsiPhi already allocated."); @@ -241,8 +248,9 @@ void set_float_cpu_psi_phi_array(PsiPhiArray& data, const std::vector& data.set_cpu_array_ptr((void*)encoded); } -void fill_psi_phi_array(PsiPhiArray& result_data, int num_bytes, const std::vector& psi_imgs, - const std::vector& 
phi_imgs, bool debug) { +void fill_search_data(SearchData& result_data, int num_bytes, const std::vector& psi_imgs, + const std::vector& phi_imgs, const std::vector zeroed_times, + bool debug) { if (result_data.get_cpu_array_ptr() != nullptr) { return; } @@ -251,6 +259,7 @@ void fill_psi_phi_array(PsiPhiArray& result_data, int num_bytes, const std::vect int num_times = psi_imgs.size(); if (num_times <= 0) throw std::runtime_error("Trying to fill PsiPhi from empty vectors."); if (num_times != phi_imgs.size()) throw std::runtime_error("Size mismatch between psi and phi."); + if (num_times != zeroed_times.size()) throw std::runtime_error("Size mismatch between psi and zeroed times."); int width = phi_imgs[0].get_width(); int height = phi_imgs[0].get_height(); @@ -275,78 +284,126 @@ void fill_psi_phi_array(PsiPhiArray& result_data, int num_bytes, const std::vect // Do the local encoding. if (result_data.get_num_bytes() == 1) { - set_encode_cpu_psi_phi_array(result_data, psi_imgs, phi_imgs, debug); + set_encode_cpu_search_data(result_data, psi_imgs, phi_imgs, debug); } else { - set_encode_cpu_psi_phi_array(result_data, psi_imgs, phi_imgs, debug); + set_encode_cpu_search_data(result_data, psi_imgs, phi_imgs, debug); } } else { if (debug) { printf("Encoding psi and phi as floats.\n"); } // Just interleave psi and phi images. - set_float_cpu_psi_phi_array(result_data, psi_imgs, phi_imgs, debug); + set_float_cpu_search_data(result_data, psi_imgs, phi_imgs, debug); } + // Copy the time array. 
+ const long unsigned times_bytes = result_data.get_num_times() * sizeof(float); + if (debug) printf("Allocating %lu bytes on the CPU for times.\n"); + + float* times_array = (float*)malloc(data.get_total_array_size()); + if (times_array == nullptr) throw std::runtime_error("Unable to allocate space for CPU times."); + for (int i = 0; i < result_data.get_num_times(); ++i) { + times_array[i] = zeroed_times[i]; + } + data.set_cpu_time_array_ptr((void*)times_array); + #ifdef HAVE_CUDA // Create a copy of the encoded data in GPU memory. if (debug) { printf("Allocating GPU memory for PsiPhi array using %lu bytes.\n", result_data.get_total_array_size()); + printf("Allocating GPU memory for times array using %lu bytes.\n", times_bytes); } - device_allocate_psi_phi_array(&result_data); + + device_allocate_search_data_arrays(&result_data); if (result_data.get_gpu_array_ptr() == nullptr) { throw std::runtime_error("Unable to allocate GPU PsiPhi array."); } + if (result_data.get_gpu_time_array_ptr() == nullptr) { + throw std::runtime_error("Unable to allocate GPU time array."); + } #endif } +void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, bool debug) { + // Compute Phi and Psi from convolved images while leaving masked pixels alone + // Reinsert 0s for NO_DATA? + std::vector psi_images; + std::vector phi_images; + const int num_images = stack.img_count(); + if (debug) { + unsigned long num_bytes = 2 * stack.get_height() * stack.get_width() * num_images * sizeof(float); + printf("Building %i temporary %i by %i images (psi and phi), requiring %lu bytes", + (num_images * 2), stack.get_width(), stack.get_height(), num_bytes); + } + + // Build the psi and phi images first. + for (int i = 0; i < num_images; ++i) { + LayeredImage& img = stack.get_single_image(i); + psi_images.push_back(img.generate_psi_image()); + phi_images.push_back(img.generate_phi_image()); + } + + // Convert these into an array form. 
Needs the full psi and phi computed first so the + // encoding can compute the bounds of each array. + std::vector zeroed_times = stack.build_zeroed_times(); + fill_search_data(psi_phi_data, num_bytes, psi_images, phi_images, zeroed_times, debug); +} + // ------------------------------------------- // --- Python definitions -------------------- // ------------------------------------------- #ifdef Py_PYTHON_H -static void psi_phi_array_binding(py::module& m) { - using ppa = search::PsiPhiArray; +static void search_data_binding(py::module& m) { + using ppa = search::SearchData; py::class_(m, "PsiPhi", pydocs::DOC_PsiPhi) .def(py::init<>()) .def_readwrite("psi", &search::PsiPhi::psi) .def_readwrite("phi", &search::PsiPhi::phi); - py::class_(m, "PsiPhiArray", pydocs::DOC_PsiPhiArray) + py::class_(m, "SearchData", pydocs::DOC_SearchData) .def(py::init<>()) - .def_property_readonly("num_bytes", &ppa::get_num_bytes, pydocs::DOC_PsiPhiArray_get_num_bytes) - .def_property_readonly("num_times", &ppa::get_num_times, pydocs::DOC_PsiPhiArray_get_num_times) - .def_property_readonly("width", &ppa::get_width, pydocs::DOC_PsiPhiArray_get_width) - .def_property_readonly("height", &ppa::get_height, pydocs::DOC_PsiPhiArray_get_height) + .def_property_readonly("num_bytes", &ppa::get_num_bytes, pydocs::DOC_SearchData_get_num_bytes) + .def_property_readonly("num_times", &ppa::get_num_times, pydocs::DOC_SearchData_get_num_times) + .def_property_readonly("width", &ppa::get_width, pydocs::DOC_SearchData_get_width) + .def_property_readonly("height", &ppa::get_height, pydocs::DOC_SearchData_get_height) .def_property_readonly("pixels_per_image", &ppa::get_pixels_per_image, - pydocs::DOC_PsiPhiArray_get_pixels_per_image) + pydocs::DOC_SearchData_get_pixels_per_image) .def_property_readonly("num_entries", &ppa::get_num_entries, - pydocs::DOC_PsiPhiArray_get_num_entries) + pydocs::DOC_SearchData_get_num_entries) .def_property_readonly("total_array_size", &ppa::get_total_array_size, - 
pydocs::DOC_PsiPhiArray_get_total_array_size) - .def_property_readonly("block_size", &ppa::get_block_size, pydocs::DOC_PsiPhiArray_get_block_size) + pydocs::DOC_SearchData_get_total_array_size) + .def_property_readonly("block_size", &ppa::get_block_size, pydocs::DOC_SearchData_get_block_size) .def_property_readonly("psi_min_val", &ppa::get_psi_min_val, - pydocs::DOC_PsiPhiArray_get_psi_min_val) + pydocs::DOC_SearchData_get_psi_min_val) .def_property_readonly("psi_max_val", &ppa::get_psi_max_val, - pydocs::DOC_PsiPhiArray_get_psi_max_val) - .def_property_readonly("psi_scale", &ppa::get_psi_scale, pydocs::DOC_PsiPhiArray_get_psi_scale) + pydocs::DOC_SearchData_get_psi_max_val) + .def_property_readonly("psi_scale", &ppa::get_psi_scale, pydocs::DOC_SearchData_get_psi_scale) .def_property_readonly("phi_min_val", &ppa::get_phi_min_val, - pydocs::DOC_PsiPhiArray_get_phi_min_val) + pydocs::DOC_SearchData_get_phi_min_val) .def_property_readonly("phi_max_val", &ppa::get_phi_max_val, - pydocs::DOC_PsiPhiArray_get_phi_max_val) - .def_property_readonly("phi_scale", &ppa::get_phi_scale, pydocs::DOC_PsiPhiArray_get_phi_scale) + pydocs::DOC_SearchData_get_phi_max_val) + .def_property_readonly("phi_scale", &ppa::get_phi_scale, pydocs::DOC_SearchData_get_phi_scale) .def_property_readonly("cpu_array_allocated", &ppa::cpu_array_allocated, - pydocs::DOC_PsiPhiArray_get_cpu_array_allocated) + pydocs::DOC_SearchData_get_cpu_array_allocated) .def_property_readonly("gpu_array_allocated", &ppa::gpu_array_allocated, - pydocs::DOC_PsiPhiArray_get_gpu_array_allocated) - .def("set_meta_data", &ppa::set_meta_data, pydocs::DOC_PsiPhiArray_set_meta_data) - .def("clear", &ppa::clear, pydocs::DOC_PsiPhiArray_clear) - .def("read_psi_phi", &ppa::read_psi_phi, pydocs::DOC_PsiPhiArray_read_psi_phi); + pydocs::DOC_SearchData_get_gpu_array_allocated) + .def_property_readonly("cpu_time_array_allocated", &ppa::cpu_time_array_allocated, + pydocs::DOC_SearchData_get_cpu_time_array_allocated) + 
.def_property_readonly("gpu_time_array_allocated", &ppa::gpu_time_array_allocated, + pydocs::DOC_SearchData_get_gpu_time_array_allocated) + .def("set_meta_data", &ppa::set_meta_data, pydocs::DOC_SearchData_set_meta_data) + .def("clear", &ppa::clear, pydocs::DOC_SearchData_clear) + .def("read_psi_phi", &ppa::read_psi_phi, pydocs::DOC_SearchData_read_psi_phi); + .def("read_time", &ppa::read_time, pydocs::DOC_SearchData_read_time); m.def("compute_scale_params_from_image_vect", &search::compute_scale_params_from_image_vect); m.def("decode_uint_scalar", &search::decode_uint_scalar); m.def("encode_uint_scalar", &search::encode_uint_scalar); - m.def("fill_psi_phi_array", &search::fill_psi_phi_array, pydocs::DOC_PsiPhiArray_fill_psi_phi_array); + m.def("fill_search_data", &search::fill_search_data, pydocs::DOC_SearchData_fill_search_data); + m.def("fill_search_data_from_image_stack", &search::fill_search_data_from_image_stack, + pydocs::DOC_SearchData_fill_search_data_from_image_stack); } #endif diff --git a/src/kbmod/search/psi_phi_array_ds.h b/src/kbmod/search/search_data_ds.h similarity index 68% rename from src/kbmod/search/psi_phi_array_ds.h rename to src/kbmod/search/search_data_ds.h index 719ec8687..900c3cf51 100644 --- a/src/kbmod/search/psi_phi_array_ds.h +++ b/src/kbmod/search/search_data_ds.h @@ -1,22 +1,23 @@ /* - * psi_phi_array_ds.h + * search_data_ds.h * - * The data structure for the interleaved psi/phi array. The the data + * The data structure for the raw data needed for the search algorith, + * including the psi/phi values and the zeroed times. The the data * structure and core functions are included in the header (and separated out * from the rest of the utility functions) to allow the CUDA files to import * only what they need. * * The data structure allocates memory on both the CPU and GPU for the - * interleaved psi/phi array and maintains ownership of the pointers - * until clear() is called or the PsiPhiArray's destructor is called. 
This allows - * the object to be passed repeatedly to the on-device search without reallocating - * and copying the memory on the GPU. + * arraysand maintains ownership of the pointers until clear() is called + * the object's destructor is called. This allows the object to be passed + * repeatedly to the on-device search without reallocating and copying the + * memory on the GPU. * * Created on: Dec 5, 2023 */ -#ifndef PSI_PHI_ARRAY_DS_ -#define PSI_PHI_ARRAY_DS_ +#ifndef SEARCH_DATA_DS_ +#define SEARCH_DATA_DS_ #include #include @@ -42,8 +43,8 @@ inline float decode_uint_scalar(float value, float min_val, float scale) { return (value == 0.0) ? NO_DATA : (value - 1.0) * scale + min_val; } -// The struct of meta data for the PsiPhiArray. -struct PsiPhiArrayMeta { +// The struct of meta data for the SearchData. +struct SearchDataMeta { int num_times = 0; int width = 0; int height = 0; @@ -64,17 +65,17 @@ struct PsiPhiArrayMeta { float phi_scale = 1.0; }; -/* PsiPhiArray is a class to hold the psi and phi arrays for the CPU and GPU as well as +/* SearchData is a class to hold the psi and phi arrays for the CPU and GPU as well as the meta data and functions to do encoding and decoding on CPU. 
*/ -class PsiPhiArray { +class SearchData { public: - explicit PsiPhiArray(); - virtual ~PsiPhiArray(); + explicit SearchData(); + virtual ~SearchData(); void clear(); - inline PsiPhiArrayMeta& get_meta_data() { return meta_data; } + inline SearchDataMeta& get_meta_data() { return meta_data; } // --- Getter functions (for Python interface) ---------------- inline int get_num_bytes() { return meta_data.num_bytes; } @@ -95,9 +96,12 @@ class PsiPhiArray { inline bool cpu_array_allocated() { return cpu_array_ptr != nullptr; } inline bool gpu_array_allocated() { return gpu_array_ptr != nullptr; } + inline bool cpu_time_array_allocated() { return cpu_time_array != nullptr; } + inline bool gpu_time_array_allocated() { return gpu_time_array != nullptr; } - // Primary getter function for interaction (read the data). - PsiPhi read_psi_phi(int time, int row, int col); + // Primary getter functions for interaction (read the data). + PsiPhi read_psi_phi(int time_index, int row, int col); + float read_time_value(int time_index); // Setters for the utility functions to allocate the data. void set_meta_data(int new_num_bytes, int new_num_times, int new_height, int new_width); @@ -110,14 +114,21 @@ class PsiPhiArray { inline void set_cpu_array_ptr(void* new_ptr) { cpu_array_ptr = new_ptr; } inline void set_gpu_array_ptr(void* new_ptr) { gpu_array_ptr = new_ptr; } + inline float* get_cpu_time_array_ptr() { return cpu_time_array; } + inline float* get_gpu_time_array_ptr() { return gpu_time_array; } + inline void set_cpu_time_array_ptr(float* new_ptr) { cpu_time_array = new_ptr; } + inline void set_gpu_time_array_ptr(float* new_ptr) { gpu_time_array = new_ptr; } + private: - PsiPhiArrayMeta meta_data; + SearchDataMeta meta_data; - // Pointers the array (CPU space). 
- void* cpu_array_ptr = nullptr; + // Pointers to the arrays + void* cpu_array_ptr = nullptr; void* gpu_array_ptr = nullptr; + float* cpu_time_array = nullptr; + float* gpu_time_array = nullptr; }; } /* namespace search */ -#endif /* PSI_PHI_ARRAY_DS_ */ +#endif /* SEARCH_DATA_DS_ */ diff --git a/src/kbmod/search/search_data_utils.h b/src/kbmod/search/search_data_utils.h new file mode 100644 index 000000000..50538e990 --- /dev/null +++ b/src/kbmod/search/search_data_utils.h @@ -0,0 +1,39 @@ +/* + * search_data_utils.h + * + * The utility functions for the psi/phi array. Broken out from the header + * data structure so that it can use packages that won't be imported into the + * CUDA kernel, such as Eigen. + * + * Created on: Dec 8, 2023 + */ + +#ifndef SEARCH_DATA_UTILS_ +#define SEARCH_DATA_UTILS_ + +#include +#include +#include +#include + +#include "common.h" +#include "image_stack.h" +#include "layered_image.h" +#include "search_data_ds.h" +#include "raw_image.h" + +namespace search { + +// Compute the min, max, and scale parameter from the a vector of image data. 
+std::array compute_scale_params_from_image_vect(const std::vector& imgs, int num_bytes); + +void fill_search_data(SearchData& result_data, int num_bytes, const std::vector& psi_imgs, + const std::vector& phi_imgs, const std::vector zeroed_times, + bool debug = false); + +void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, + bool debug = false); + +} /* namespace search */ + +#endif /* SEARCH_DATA_UTILS_ */ diff --git a/src/kbmod/search/stack_search.cpp b/src/kbmod/search/stack_search.cpp index ba31ef247..60ff1611c 100644 --- a/src/kbmod/search/stack_search.cpp +++ b/src/kbmod/search/stack_search.cpp @@ -2,9 +2,8 @@ namespace search { #ifdef HAVE_CUDA -extern "C" void deviceSearchFilter(PsiPhiArray& psi_phi_data, float* image_times, SearchParameters params, - int num_trajectories, Trajectory* trj_to_search, int num_results, - Trajectory* best_results); +extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters params, int num_trajectories, + Trajectory *trj_to_search, int num_results, Trajectory *best_results); #endif StackSearch::StackSearch(ImageStack& imstack) : stack(imstack) { @@ -76,8 +75,8 @@ void StackSearch::search(int ang_steps, int vel_steps, float min_ang, float max_ DebugTimer psi_phi_timer = DebugTimer("Creating psi/phi buffers", debug_info); prepare_psi_phi(); - PsiPhiArray psi_phi_data; - fill_psi_phi_array(psi_phi_data, params.encode_num_bytes, psi_images, phi_images, debug_info); + SearchData psi_phi_data; + fill_search_data(psi_phi_data, params.encode_num_bytes, psi_images, phi_images, debug_info); psi_phi_timer.stop(); // Allocate a vector for the results. @@ -98,7 +97,7 @@ void StackSearch::search(int ang_steps, int vel_steps, float min_ang, float max_ // Do the actual search on the GPU. 
DebugTimer search_timer = DebugTimer("Running search", debug_info); #ifdef HAVE_CUDA - deviceSearchFilter(psi_phi_data, image_times.data(), params, search_list.size(), search_list.data(), + deviceSearchFilter(psi_phi_data, params, search_list.size(), search_list.data(), max_results, results.data()); #else throw std::runtime_error("Non-GPU search is not implemented."); From 881a058f466acd19982b1b5f60bd4e94da87d44a Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Thu, 1 Feb 2024 11:14:43 -0500 Subject: [PATCH 02/27] File rename --- .../search/pydocs/{psi_phi_array_docs.h => search_data_docs.h} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename src/kbmod/search/pydocs/{psi_phi_array_docs.h => search_data_docs.h} (100%) diff --git a/src/kbmod/search/pydocs/psi_phi_array_docs.h b/src/kbmod/search/pydocs/search_data_docs.h similarity index 100% rename from src/kbmod/search/pydocs/psi_phi_array_docs.h rename to src/kbmod/search/pydocs/search_data_docs.h From ce99d654d67b6afc66c3237340979918122f4e33 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Thu, 1 Feb 2024 11:29:48 -0500 Subject: [PATCH 03/27] Add tests --- src/kbmod/search/search_data_utils.h | 2 +- ...t_psi_phi_array.py => test_search_data.py} | 77 +++++++++++++++++-- 2 files changed, 70 insertions(+), 9 deletions(-) rename tests/{test_psi_phi_array.py => test_search_data.py} (72%) diff --git a/src/kbmod/search/search_data_utils.h b/src/kbmod/search/search_data_utils.h index 50538e990..4d300af66 100644 --- a/src/kbmod/search/search_data_utils.h +++ b/src/kbmod/search/search_data_utils.h @@ -32,7 +32,7 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< bool debug = false); void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, - bool debug = false); + bool debug = false); } /* namespace search */ diff --git 
a/tests/test_psi_phi_array.py b/tests/test_search_data.py similarity index 72% rename from tests/test_psi_phi_array.py rename to tests/test_search_data.py index 8260fffaf..6e3e234e2 100644 --- a/tests/test_psi_phi_array.py +++ b/tests/test_search_data.py @@ -3,18 +3,23 @@ import numpy as np from kbmod.search import ( + HAS_GPU, KB_NO_DATA, + PSF, + ImageStack, + LayeredImage, PsiPhi, - PsiPhiArray, + SearchData, RawImage, compute_scale_params_from_image_vect, decode_uint_scalar, encode_uint_scalar, - fill_psi_phi_array, + fill_search_data, + fill_search_data_from_image_stack, ) -class test_psi_phi_array(unittest.TestCase): +class test_search_data(unittest.TestCase): def setUp(self): self.num_times = 2 self.width = 4 @@ -31,8 +36,10 @@ def setUp(self): self.phi_1 = RawImage(np.full((self.height, self.width), 0.1, dtype=np.single), obs_time=1.0) self.phi_2 = RawImage(np.full((self.height, self.width), 0.2, dtype=np.single), obs_time=2.0) + self.zeroed_times = [0.0, 1.0] + def test_set_meta_data(self): - arr = PsiPhiArray() + arr = SearchData() self.assertEqual(arr.num_times, 0) self.assertEqual(arr.num_bytes, 4) self.assertEqual(arr.width, 0) @@ -121,10 +128,10 @@ def test_compute_scale_params_from_image_vect(self): self.assertAlmostEqual(result_uint16[1], max_val, delta=1e-5) self.assertAlmostEqual(result_uint16[2], max_val / 65535.0, delta=1e-5) - def test_fill_psi_phi_array(self): + def test_fill_search_data(self): for num_bytes in [2, 4]: - arr = PsiPhiArray() - fill_psi_phi_array(arr, num_bytes, [self.psi_1, self.psi_2], [self.phi_1, self.phi_2], False) + arr = SearchData() + fill_search_data(arr, num_bytes, [self.psi_1, self.psi_2], [self.phi_1, self.phi_2], self.zeroed_times, False) # Check the meta data. 
self.assertEqual(arr.num_times, self.num_times) @@ -139,9 +146,16 @@ def test_fill_psi_phi_array(self): self.assertEqual(arr.block_size, num_bytes) self.assertEqual(arr.total_array_size, arr.num_entries * arr.block_size) - # Check that we can correctly read the values from the CPU. + # Check that we allocate the arrays self.assertTrue(arr.cpu_array_allocated) + self.assertTrue(arr.cpu_time_array_allocated) + if (HAS_GPU): + self.assertTrue(arr.gpu_array_allocated) + self.assertTrue(arr.gpu_time_array_allocated) + + # Check that we can correctly read the values from the CPU. for time in range(self.num_times): + self.assertAlmostEqual(arr.read_time(time), self.zeroed_times[time]) offset = time * self.width * self.height for row in range(self.height): for col in range(self.width): @@ -152,6 +166,53 @@ def test_fill_psi_phi_array(self): # Check that the arrays are set to NULL after we clear it (memory should be freed too). arr.clear() self.assertFalse(arr.cpu_array_allocated) + self.assertFalse(arr.cpu_time_array_allocated) + if (HAS_GPU): + self.assertFalse(arr.gpu_array_allocated) + self.assertFalse(arr.gpu_time_array_allocated) + + def test_fill_search_data_from_image_stack(self): + # Build a fake image stack. + num_images = 5 + width = 21 + height = 15 + images = [None] * num_images + p = PSF(1.0) + for i in range(num_images): + self.images[i] = kb.LayeredImage( + width, + height, + 2.0, # noise_level + 4.0, # variance + 2.0 * i + 1.0, # time + p, + ) + im_stack = ImageStack(images) + + # Create the SearchData from the ImageStack. + arr = SearchData() + fill_search_data_from_image_stack(arr, im_stack, 4, False) + + # Check the meta data. 
+ self.assertEqual(arr.num_times, num_images) + self.assertEqual(arr.num_bytes, 4) + self.assertEqual(arr.width, width) + self.assertEqual(arr.height, height) + self.assertEqual(arr.pixels_per_image, width * height) + self.assertEqual(arr.num_entries, 2 * arr.pixels_per_image * num_times) + self.assertEqual(arr.block_size, 4) + self.assertEqual(arr.total_array_size, arr.num_entries * arr.block_size) + + # Check that we allocated the arrays. + self.assertTrue(arr.cpu_array_allocated) + self.assertTrue(arr.cpu_time_array_allocated) + if (HAS_GPU): + self.assertTrue(arr.gpu_array_allocated) + self.assertTrue(arr.gpu_time_array_allocated) + + # Since we filled the images with random data, we only test the times. + for time in range(self.num_times): + self.assertAlmostEqual(arr.read_time(time), 2.0 * time) if __name__ == "__main__": From 0b2b94124926e4776757561a1cc77d99fc8870a8 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Thu, 1 Feb 2024 12:13:19 -0500 Subject: [PATCH 04/27] Bug fixes and linting --- src/kbmod/search/bindings.cpp | 4 +-- src/kbmod/search/kernels.cu | 12 ++++---- src/kbmod/search/search_data.cpp | 41 ++++++++++++++-------------- src/kbmod/search/search_data_ds.h | 9 +++--- src/kbmod/search/search_data_utils.h | 4 +-- src/kbmod/search/stack_search.cpp | 10 +++---- src/kbmod/search/stack_search.h | 4 +-- tests/test_search_data.py | 24 ++++++++-------- 8 files changed, 56 insertions(+), 52 deletions(-) diff --git a/src/kbmod/search/bindings.cpp b/src/kbmod/search/bindings.cpp index 4175c9639..a76eb0645 100644 --- a/src/kbmod/search/bindings.cpp +++ b/src/kbmod/search/bindings.cpp @@ -16,7 +16,7 @@ namespace py = pybind11; #include "stack_search.cpp" #include "stamp_creator.cpp" #include "kernel_testing_helpers.cpp" -#include "psi_phi_array.cpp" +#include "search_data.cpp" PYBIND11_MODULE(search, m) { m.attr("KB_NO_DATA") = pybind11::float_(search::NO_DATA); @@ -40,7 +40,7 @@ PYBIND11_MODULE(search, m) 
{ search::pixel_pos_bindings(m); search::image_moments_bindings(m); search::stamp_parameters_bindings(m); - search::psi_phi_array_binding(m); + search::search_data_binding(m); // Functions from raw_image.cpp m.def("create_median_image", &search::create_median_image); m.def("create_summed_image", &search::create_summed_image); diff --git a/src/kbmod/search/kernels.cu b/src/kbmod/search/kernels.cu index 2accdb171..c5036a0ac 100644 --- a/src/kbmod/search/kernels.cu +++ b/src/kbmod/search/kernels.cu @@ -42,7 +42,8 @@ extern "C" void device_allocate_search_data_arrays(SearchData *data) { float *device_times_ptr; long unsigned time_bytes = data->get_num_times() * sizeof(float); checkCudaErrors(cudaMalloc((void **)&device_times_ptr, time_bytes)); - checkCudaErrors(cudaMemcpy(device_times_ptr, data->get_cpu_time_array_ptr(), time_bytes, cudaMemcpyHostToDevice)); + checkCudaErrors( + cudaMemcpy(device_times_ptr, data->get_cpu_time_array_ptr(), time_bytes, cudaMemcpyHostToDevice)); data->set_gpu_time_array_ptr(device_times_ptr); } @@ -296,7 +297,7 @@ extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters par // Copy trajectories to search if (params.debug) { printf("Allocating GPU memory for testing grid with %i elements using %lu bytes.\n", num_trajectories, - sizeof(Trajectory) * num_trajectories); + sizeof(Trajectory) * num_trajectories); } checkCudaErrors(cudaMalloc((void **)&device_tests, sizeof(Trajectory) * num_trajectories)); checkCudaErrors(cudaMemcpy(device_tests, trj_to_search, sizeof(Trajectory) * num_trajectories, @@ -304,7 +305,8 @@ extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters par // Allocate space for the results. 
if (params.debug) { - printf("Allocating GPU memory for %i results using %lu bytes.\n", num_results, sizeof(Trajectory) * num_results); + printf("Allocating GPU memory for %i results using %lu bytes.\n", num_results, + sizeof(Trajectory) * num_results); } checkCudaErrors(cudaMalloc((void **)&device_search_results, sizeof(Trajectory) * num_results)); @@ -318,8 +320,8 @@ extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters par // Launch Search searchFilterImages<<>>(search_data.get_meta_data(), search_data.get_gpu_array_ptr(), - static_cast(search_data.get_gpu_time_array_ptr()), params, - num_trajectories, device_tests, device_search_results); + static_cast(search_data.get_gpu_time_array_ptr()), + params, num_trajectories, device_tests, device_search_results); // Read back results checkCudaErrors(cudaMemcpy(best_results, device_search_results, sizeof(Trajectory) * num_results, diff --git a/src/kbmod/search/search_data.cpp b/src/kbmod/search/search_data.cpp index 4331f7792..ae2e1c425 100644 --- a/src/kbmod/search/search_data.cpp +++ b/src/kbmod/search/search_data.cpp @@ -17,9 +17,7 @@ extern "C" void device_free_search_data_arrays(SearchData* data); SearchData::SearchData() {} -SearchData::~SearchData() { - clear(); -} +SearchData::~SearchData() { clear(); } void SearchData::clear() { // Free all used memory on CPU and GPU. 
@@ -29,7 +27,7 @@ void SearchData::clear() { } if (cpu_time_array != nullptr) { free(cpu_time_array); - cpu_array_ptr = nullptr; + cpu_time_array = nullptr; } #ifdef HAVE_CUDA if ((gpu_array_ptr != nullptr) || (gpu_time_array != nullptr)) { @@ -140,13 +138,12 @@ PsiPhi SearchData::read_psi_phi(int time, int row, int col) { float SearchData::read_time(int time_index) { if (cpu_time_array == nullptr) throw std::runtime_error("Read from unallocated times array."); - if ((time_index < 0 )|| (time_index >= meta_data.num_times)) { - throw std::runtime_error("Out of bounds read for time step=%i", time_index); + if ((time_index < 0) || (time_index >= meta_data.num_times)) { + throw std::runtime_error("Out of bounds read for time step."); } return cpu_time_array[time_index]; } - // ------------------------------------------- // --- Implementation of utility functions --- // ------------------------------------------- @@ -179,7 +176,7 @@ std::array compute_scale_params_from_image_vect(const std::vector void set_encode_cpu_search_data(SearchData& data, const std::vector& psi_imgs, - const std::vector& phi_imgs, bool debug) { + const std::vector& phi_imgs, bool debug) { if (data.get_cpu_array_ptr() != nullptr) { throw std::runtime_error("CPU PsiPhi already allocated."); } @@ -223,7 +220,7 @@ void set_encode_cpu_search_data(SearchData& data, const std::vector& p } void set_float_cpu_search_data(SearchData& data, const std::vector& psi_imgs, - const std::vector& phi_imgs, bool debug) { + const std::vector& phi_imgs, bool debug) { if (data.get_cpu_array_ptr() != nullptr) { throw std::runtime_error("CPU PsiPhi already allocated."); } @@ -249,8 +246,8 @@ void set_float_cpu_search_data(SearchData& data, const std::vector& ps } void fill_search_data(SearchData& result_data, int num_bytes, const std::vector& psi_imgs, - const std::vector& phi_imgs, const std::vector zeroed_times, - bool debug) { + const std::vector& phi_imgs, const std::vector zeroed_times, + bool debug) { if 
(result_data.get_cpu_array_ptr() != nullptr) { return; } @@ -259,7 +256,8 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< int num_times = psi_imgs.size(); if (num_times <= 0) throw std::runtime_error("Trying to fill PsiPhi from empty vectors."); if (num_times != phi_imgs.size()) throw std::runtime_error("Size mismatch between psi and phi."); - if (num_times != zeroed_times.size()) throw std::runtime_error("Size mismatch between psi and zeroed times."); + if (num_times != zeroed_times.size()) + throw std::runtime_error("Size mismatch between psi and zeroed times."); int width = phi_imgs[0].get_width(); int height = phi_imgs[0].get_height(); @@ -298,14 +296,14 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< // Copy the time array. const long unsigned times_bytes = result_data.get_num_times() * sizeof(float); - if (debug) printf("Allocating %lu bytes on the CPU for times.\n"); + if (debug) printf("Allocating %lu bytes on the CPU for times.\n", times_bytes); - float* times_array = (float*)malloc(data.get_total_array_size()); + float* times_array = (float*)malloc(times_bytes); if (times_array == nullptr) throw std::runtime_error("Unable to allocate space for CPU times."); for (int i = 0; i < result_data.get_num_times(); ++i) { times_array[i] = zeroed_times[i]; } - data.set_cpu_time_array_ptr((void*)times_array); + result_data.set_cpu_time_array_ptr(times_array); #ifdef HAVE_CUDA // Create a copy of the encoded data in GPU memory. 
@@ -314,7 +312,7 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< result_data.get_total_array_size()); printf("Allocating GPU memory for times array using %lu bytes.\n", times_bytes); } - + device_allocate_search_data_arrays(&result_data); if (result_data.get_gpu_array_ptr() == nullptr) { throw std::runtime_error("Unable to allocate GPU PsiPhi array."); @@ -325,7 +323,8 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< #endif } -void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, bool debug) { +void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, + bool debug) { // Compute Phi and Psi from convolved images while leaving masked pixels alone // Reinsert 0s for NO_DATA? std::vector psi_images; @@ -333,8 +332,8 @@ void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stac const int num_images = stack.img_count(); if (debug) { unsigned long num_bytes = 2 * stack.get_height() * stack.get_width() * num_images * sizeof(float); - printf("Building %i temporary %i by %i images (psi and phi), requiring %lu bytes", - (num_images * 2), stack.get_width(), stack.get_height(), num_bytes); + printf("Building %i temporary %i by %i images (psi and phi), requiring %lu bytes", (num_images * 2), + stack.get_width(), stack.get_height(), num_bytes); } // Build the psi and phi images first. @@ -347,7 +346,7 @@ void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stac // Convert these into an array form. Needs the full psi and phi computed first so the // encoding can compute the bounds of each array. 
std::vector zeroed_times = stack.build_zeroed_times(); - fill_search_data(psi_phi_data, num_bytes, psi_images, phi_images, zeroed_times, debug); + fill_search_data(result_data, num_bytes, psi_images, phi_images, zeroed_times, debug); } // ------------------------------------------- @@ -396,7 +395,7 @@ static void search_data_binding(py::module& m) { pydocs::DOC_SearchData_get_gpu_time_array_allocated) .def("set_meta_data", &ppa::set_meta_data, pydocs::DOC_SearchData_set_meta_data) .def("clear", &ppa::clear, pydocs::DOC_SearchData_clear) - .def("read_psi_phi", &ppa::read_psi_phi, pydocs::DOC_SearchData_read_psi_phi); + .def("read_psi_phi", &ppa::read_psi_phi, pydocs::DOC_SearchData_read_psi_phi) .def("read_time", &ppa::read_time, pydocs::DOC_SearchData_read_time); m.def("compute_scale_params_from_image_vect", &search::compute_scale_params_from_image_vect); m.def("decode_uint_scalar", &search::decode_uint_scalar); diff --git a/src/kbmod/search/search_data_ds.h b/src/kbmod/search/search_data_ds.h index 900c3cf51..7a64842ce 100644 --- a/src/kbmod/search/search_data_ds.h +++ b/src/kbmod/search/search_data_ds.h @@ -8,10 +8,11 @@ * only what they need. * * The data structure allocates memory on both the CPU and GPU for the - * arraysand maintains ownership of the pointers until clear() is called + * arrays and maintains ownership of the pointers until clear() is called * the object's destructor is called. This allows the object to be passed * repeatedly to the on-device search without reallocating and copying the - * memory on the GPU. + * memory on the GPU. All arrays are stored as pointers (instead of vectors) + * for compatibility with CUDA. * * Created on: Dec 5, 2023 */ @@ -101,7 +102,7 @@ class SearchData { // Primary getter functions for interaction (read the data). PsiPhi read_psi_phi(int time_index, int row, int col); - float read_time_value(int time_index); + float read_time(int time_index); // Setters for the utility functions to allocate the data. 
void set_meta_data(int new_num_bytes, int new_num_times, int new_height, int new_width); @@ -123,7 +124,7 @@ class SearchData { SearchDataMeta meta_data; // Pointers to the arrays - void* cpu_array_ptr = nullptr; + void* cpu_array_ptr = nullptr; void* gpu_array_ptr = nullptr; float* cpu_time_array = nullptr; float* gpu_time_array = nullptr; diff --git a/src/kbmod/search/search_data_utils.h b/src/kbmod/search/search_data_utils.h index 4d300af66..683895ce4 100644 --- a/src/kbmod/search/search_data_utils.h +++ b/src/kbmod/search/search_data_utils.h @@ -28,8 +28,8 @@ namespace search { std::array compute_scale_params_from_image_vect(const std::vector& imgs, int num_bytes); void fill_search_data(SearchData& result_data, int num_bytes, const std::vector& psi_imgs, - const std::vector& phi_imgs, const std::vector zeroed_times, - bool debug = false); + const std::vector& phi_imgs, const std::vector zeroed_times, + bool debug = false); void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, bool debug = false); diff --git a/src/kbmod/search/stack_search.cpp b/src/kbmod/search/stack_search.cpp index 60ff1611c..64c6741b7 100644 --- a/src/kbmod/search/stack_search.cpp +++ b/src/kbmod/search/stack_search.cpp @@ -2,8 +2,8 @@ namespace search { #ifdef HAVE_CUDA -extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters params, int num_trajectories, - Trajectory *trj_to_search, int num_results, Trajectory *best_results); +extern "C" void deviceSearchFilter(SearchData& search_data, SearchParameters params, int num_trajectories, + Trajectory* trj_to_search, int num_results, Trajectory* best_results); #endif StackSearch::StackSearch(ImageStack& imstack) : stack(imstack) { @@ -76,7 +76,7 @@ void StackSearch::search(int ang_steps, int vel_steps, float min_ang, float max_ DebugTimer psi_phi_timer = DebugTimer("Creating psi/phi buffers", debug_info); prepare_psi_phi(); SearchData psi_phi_data; - fill_search_data(psi_phi_data, 
params.encode_num_bytes, psi_images, phi_images, debug_info); + fill_search_data(psi_phi_data, params.encode_num_bytes, psi_images, phi_images, image_times, debug_info); psi_phi_timer.stop(); // Allocate a vector for the results. @@ -97,8 +97,8 @@ void StackSearch::search(int ang_steps, int vel_steps, float min_ang, float max_ // Do the actual search on the GPU. DebugTimer search_timer = DebugTimer("Running search", debug_info); #ifdef HAVE_CUDA - deviceSearchFilter(psi_phi_data, params, search_list.size(), search_list.data(), - max_results, results.data()); + deviceSearchFilter(psi_phi_data, params, search_list.size(), search_list.data(), max_results, + results.data()); #else throw std::runtime_error("Non-GPU search is not implemented."); #endif diff --git a/src/kbmod/search/stack_search.h b/src/kbmod/search/stack_search.h index 597f78850..5b5af451e 100644 --- a/src/kbmod/search/stack_search.h +++ b/src/kbmod/search/stack_search.h @@ -16,8 +16,8 @@ #include "geom.h" #include "image_stack.h" #include "psf.h" -#include "psi_phi_array_ds.h" -#include "psi_phi_array_utils.h" +#include "search_data_ds.h" +#include "search_data_utils.h" #include "pydocs/stack_search_docs.h" #include "stamp_creator.h" diff --git a/tests/test_search_data.py b/tests/test_search_data.py index 6e3e234e2..80b847365 100644 --- a/tests/test_search_data.py +++ b/tests/test_search_data.py @@ -131,7 +131,9 @@ def test_compute_scale_params_from_image_vect(self): def test_fill_search_data(self): for num_bytes in [2, 4]: arr = SearchData() - fill_search_data(arr, num_bytes, [self.psi_1, self.psi_2], [self.phi_1, self.phi_2], self.zeroed_times, False) + fill_search_data( + arr, num_bytes, [self.psi_1, self.psi_2], [self.phi_1, self.phi_2], self.zeroed_times, False + ) # Check the meta data. 
self.assertEqual(arr.num_times, self.num_times) @@ -149,7 +151,7 @@ def test_fill_search_data(self): # Check that we allocate the arrays self.assertTrue(arr.cpu_array_allocated) self.assertTrue(arr.cpu_time_array_allocated) - if (HAS_GPU): + if HAS_GPU: self.assertTrue(arr.gpu_array_allocated) self.assertTrue(arr.gpu_time_array_allocated) @@ -167,19 +169,19 @@ def test_fill_search_data(self): arr.clear() self.assertFalse(arr.cpu_array_allocated) self.assertFalse(arr.cpu_time_array_allocated) - if (HAS_GPU): + if HAS_GPU: self.assertFalse(arr.gpu_array_allocated) self.assertFalse(arr.gpu_time_array_allocated) def test_fill_search_data_from_image_stack(self): # Build a fake image stack. - num_images = 5 + num_times = 5 width = 21 height = 15 - images = [None] * num_images + images = [None] * num_times p = PSF(1.0) - for i in range(num_images): - self.images[i] = kb.LayeredImage( + for i in range(num_times): + images[i] = LayeredImage( width, height, 2.0, # noise_level @@ -192,9 +194,9 @@ def test_fill_search_data_from_image_stack(self): # Create the SearchData from the ImageStack. arr = SearchData() fill_search_data_from_image_stack(arr, im_stack, 4, False) - + # Check the meta data. - self.assertEqual(arr.num_times, num_images) + self.assertEqual(arr.num_times, num_times) self.assertEqual(arr.num_bytes, 4) self.assertEqual(arr.width, width) self.assertEqual(arr.height, height) @@ -206,12 +208,12 @@ def test_fill_search_data_from_image_stack(self): # Check that we allocated the arrays. self.assertTrue(arr.cpu_array_allocated) self.assertTrue(arr.cpu_time_array_allocated) - if (HAS_GPU): + if HAS_GPU: self.assertTrue(arr.gpu_array_allocated) self.assertTrue(arr.gpu_time_array_allocated) # Since we filled the images with random data, we only test the times. 
- for time in range(self.num_times): + for time in range(num_times): self.assertAlmostEqual(arr.read_time(time), 2.0 * time) From a2bcbc0b0a24eab9aa01a51b84c9652d9699f3ae Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Thu, 1 Feb 2024 16:37:30 -0500 Subject: [PATCH 05/27] Break out core evaluation into its own function --- src/kbmod/search/kernels.cu | 243 ++++++++++++------------------------ 1 file changed, 80 insertions(+), 163 deletions(-) diff --git a/src/kbmod/search/kernels.cu b/src/kbmod/search/kernels.cu index 84b6cf249..4a798155b 100644 --- a/src/kbmod/search/kernels.cu +++ b/src/kbmod/search/kernels.cu @@ -41,7 +41,7 @@ extern "C" void device_free_psi_phi_array(PsiPhiArray *data) { } } -__forceinline__ __device__ PsiPhi read_encoded_psi_phi(PsiPhiArrayMeta &params, void *psi_phi_vect, int time, +__host__ __device__ PsiPhi read_encoded_psi_phi(PsiPhiArrayMeta &params, void *psi_phi_vect, int time, int row, int col) { // Bounds checking. if ((row < 0) || (col < 0) || (row >= params.height) || (col >= params.width)) { @@ -122,6 +122,81 @@ extern "C" __device__ __host__ void SigmaGFilteredIndicesCU(float *values, int n *max_keep_idx = end - 1; } +/* + * Evaluate the likelihood score (as computed from the psi and phi values) for a single + * given candidate trajectory. Modifies the trajectory in place to update the number of + * observations, likelihood, and flux. + */ +extern "C" __device__ __host__ void evaluateTrajectory(PsiPhiArrayMeta psi_phi_meta, void *psi_phi_vect, float *image_times, + SearchParameters params, Trajectory *candidate) { + // Data structures used for filtering. We fill in only what we need. + float psi_array[MAX_NUM_IMAGES]; + float phi_array[MAX_NUM_IMAGES]; + float psi_sum = 0.0; + float phi_sum = 0.0; + + // Reset the statistics for the candidate. 
+ candidate->obs_count = 0; + candidate->lh = -1.0; + candidate->flux = -1.0; + + // Loop over each image and sample the appropriate pixel + int num_seen = 0; + for (int i = 0; i < psi_phi_meta.num_times; ++i) { + // Predict the trajectory's position. + float curr_time = image_times[i]; + int current_x = candidate->x + int(candidate->vx * curr_time + 0.5); + int current_y = candidate->y + int(candidate->vy * curr_time + 0.5); + + // Get the Psi and Phi pixel values. + PsiPhi pixel_vals = read_encoded_psi_phi(psi_phi_meta, psi_phi_vect, i, current_y, current_x); + if (pixel_vals.psi != NO_DATA && pixel_vals.phi != NO_DATA) { + psi_sum += pixel_vals.psi; + phi_sum += pixel_vals.phi; + psi_array[num_seen] = pixel_vals.psi; + phi_array[num_seen] = pixel_vals.phi; + num_seen += 1; + } + } + candidate->obs_count = num_seen; + candidate->lh = psi_sum / sqrt(phi_sum); + candidate->flux = psi_sum / phi_sum; + + // If we do not have enough observations or a good enough LH score, + // do not bother with any of the following steps. + if ((candidate->obs_count < params.min_observations) || + (params.do_sigmag_filter && candidate->lh < params.min_lh)) + return; + + // If we are doing on GPU filtering, run the sigma_g filter and recompute the likelihoods. + if (params.do_sigmag_filter) { + // Fill in a likelihood and index array for sorting. + float lc_array[MAX_NUM_IMAGES]; + int idx_array[MAX_NUM_IMAGES]; + for (int i = 0; i < num_seen; ++i) { + lc_array[i] = (phi_array[i] != 0) ? (psi_array[i] / phi_array[i]) : 0; + idx_array[i] = i; + } + + int min_keep_idx = 0; + int max_keep_idx = num_seen - 1; + SigmaGFilteredIndicesCU(lc_array, num_seen, params.sgl_L, params.sgl_H, params.sigmag_coeff, 2.0, + idx_array, &min_keep_idx, &max_keep_idx); + + // Compute the likelihood and flux of the track based on the filtered + // observations (ones in [min_keep_idx, max_keep_idx]). 
+ float new_psi_sum = 0.0; + float new_phi_sum = 0.0; + for (int i = min_keep_idx; i <= max_keep_idx; i++) { + int idx = idx_array[i]; + new_psi_sum += psi_array[idx]; + new_phi_sum += phi_array[idx]; + } + candidate->lh = new_psi_sum / sqrt(new_phi_sum); + candidate->flux = new_psi_sum / new_phi_sum; + } +} + /* * Searches through images (represented as a flat array of floats) looking for most likely * trajectories in the given list. Outputs a results image of best trajectories. Returns a @@ -148,12 +223,6 @@ __global__ void searchFilterImages(PsiPhiArrayMeta psi_phi_meta, void *psi_phi_v const int x = x_i + params.x_start_min; const int y = y_i + params.y_start_min; - // Data structures used for filtering. - float lc_array[MAX_NUM_IMAGES]; - float psi_array[MAX_NUM_IMAGES]; - float phi_array[MAX_NUM_IMAGES]; - int idx_array[MAX_NUM_IMAGES]; - // Create an initial set of best results with likelihood -1.0. // We also set (x, y) because they are used in the later python // functions. @@ -174,67 +243,15 @@ __global__ void searchFilterImages(PsiPhiArrayMeta psi_phi_meta, void *psi_phi_v curr_trj.vy = trajectories[t].vy; curr_trj.obs_count = 0; - float psi_sum = 0.0; - float phi_sum = 0.0; - - // Loop over each image and sample the appropriate pixel - for (int i = 0; i < psi_phi_meta.num_times; ++i) { - lc_array[i] = 0; - psi_array[i] = 0; - phi_array[i] = 0; - idx_array[i] = i; - } - - // Loop over each image and sample the appropriate pixel - int num_seen = 0; - for (int i = 0; i < psi_phi_meta.num_times; ++i) { - // Predict the trajectory's position. - float curr_time = image_times[i]; - int current_x = x + int(curr_trj.vx * curr_time + 0.5); - int current_y = y + int(curr_trj.vy * curr_time + 0.5); - - // Get the Psi and Phi pixel values. 
- PsiPhi pixel_vals = read_encoded_psi_phi(psi_phi_meta, psi_phi_vect, i, current_y, current_x); - if (pixel_vals.psi != NO_DATA && pixel_vals.phi != NO_DATA) { - curr_trj.obs_count++; - psi_sum += pixel_vals.psi; - phi_sum += pixel_vals.phi; - psi_array[num_seen] = pixel_vals.psi; - phi_array[num_seen] = pixel_vals.phi; - if (pixel_vals.phi != 0.0) lc_array[num_seen] = pixel_vals.psi / pixel_vals.phi; - num_seen += 1; - } - } - curr_trj.lh = psi_sum / sqrt(phi_sum); - curr_trj.flux = psi_sum / phi_sum; + // Evaluate the trajectory. + evaluateTrajectory(psi_phi_meta, psi_phi_vect, image_times, params, &curr_trj); // If we do not have enough observations or a good enough LH score, - // do not bother with any of the following steps. + // do not bother inserting it into the sorted list of results. if ((curr_trj.obs_count < params.min_observations) || (params.do_sigmag_filter && curr_trj.lh < params.min_lh)) continue; - // If we are doing on GPU filtering, run the sigma_g filter - // and recompute the likelihoods. - if (params.do_sigmag_filter) { - int min_keep_idx = 0; - int max_keep_idx = num_seen - 1; - SigmaGFilteredIndicesCU(lc_array, num_seen, params.sgl_L, params.sgl_H, params.sigmag_coeff, 2.0, - idx_array, &min_keep_idx, &max_keep_idx); - - // Compute the likelihood and flux of the track based on the filtered - // observations (ones in [min_keep_idx, max_keep_idx]). - float new_psi_sum = 0.0; - float new_phi_sum = 0.0; - for (int i = min_keep_idx; i <= max_keep_idx; i++) { - int idx = idx_array[i]; - new_psi_sum += psi_array[idx]; - new_phi_sum += phi_array[idx]; - } - curr_trj.lh = new_psi_sum / sqrt(new_phi_sum); - curr_trj.flux = new_psi_sum / new_phi_sum; - } - // Insert the new trajectory into the sorted list of results. // Only sort the values with valid likelihoods. 
Trajectory temp; @@ -311,6 +328,7 @@ extern "C" void deviceSearchFilter(PsiPhiArray &psi_phi_array, float *image_time searchFilterImages<<>>(psi_phi_array.get_meta_data(), psi_phi_array.get_gpu_array_ptr(), device_img_times, params, num_trajectories, device_tests, device_search_results); + cudaDeviceSynchronize(); // Read back results checkCudaErrors(cudaMemcpy(best_results, device_search_results, sizeof(Trajectory) * num_results, @@ -502,107 +520,6 @@ void deviceGetCoadds(const unsigned int num_images, const unsigned int width, co checkCudaErrors(cudaFree(device_res)); } -/* - void deviceGetCoadds(ImageStack &stack, PerImageData image_data, int num_trajectories, - Trajectory *trajectories, StampParameters params, - std::vector> &use_index_vect, float *results) { - // Allocate Device memory - Trajectory *device_trjs; - int *device_use_index = nullptr; - float *device_times; - float *device_img; - float *device_res; - - // Compute the dimensions for the data. - const unsigned int num_images = stack.img_count(); - const unsigned int width = stack.get_width(); - const unsigned int height = stack.get_height(); - const unsigned int num_image_pixels = num_images * width * height; - const unsigned int stamp_width = 2 * params.radius + 1; - const unsigned int stamp_ppi = (2 * params.radius + 1) * (2 * params.radius + 1); - const unsigned int num_stamp_pixels = num_trajectories * stamp_ppi; - - // Allocate and copy the trajectories. - checkCudaErrors(cudaMalloc((void **)&device_trjs, sizeof(Trajectory) * num_trajectories)); - checkCudaErrors(cudaMemcpy(device_trjs, trajectories, sizeof(Trajectory) * num_trajectories, - cudaMemcpyHostToDevice)); - - // Check if we need to create a vector of per-trajectory, per-image use. - // Convert the vector of booleans into an integer array so we do a cudaMemcpy. 
- if (use_index_vect.size() == num_trajectories) { - checkCudaErrors(cudaMalloc((void **)&device_use_index, sizeof(int) * num_images * num_trajectories)); - - int *start_ptr = device_use_index; - std::vector int_vect(num_images, 0); - for (unsigned i = 0; i < num_trajectories; ++i) { - assert(use_index_vect[i].size() == num_images); - for (unsigned t = 0; t < num_images; ++t) { - int_vect[t] = use_index_vect[i][t] ? 1 : 0; - } - - checkCudaErrors( - cudaMemcpy(start_ptr, int_vect.data(), sizeof(int) * num_images, cudaMemcpyHostToDevice)); - start_ptr += num_images; - } - } - - // Allocate and copy the times. - checkCudaErrors(cudaMalloc((void **)&device_times, sizeof(float) * num_images)); - checkCudaErrors(cudaMemcpy(device_times, image_data.image_times, sizeof(float) * num_images, - cudaMemcpyHostToDevice)); - - // Allocate and copy the images. - checkCudaErrors(cudaMalloc((void **)&device_img, sizeof(float) * num_image_pixels)); - float *next_ptr = device_img; - for (unsigned t = 0; t < num_images; ++t) { - // Used to be a vector of floats, now is an eigen::vector of floats or something - // but that's ok because all we use it for is the .data() -> float* - // I think this can also just directly go to .data because of RowMajor layout - auto& data_ref = stack.get_single_image(t).get_science().get_image(); - - assert(data_ref.size() == width * height); - checkCudaErrors(cudaMemcpy(next_ptr, data_ref.data(), sizeof(float) * width * height, - cudaMemcpyHostToDevice)); - next_ptr += width * height; - } - - // Allocate space for the results. - checkCudaErrors(cudaMalloc((void **)&device_res, sizeof(float) * num_stamp_pixels)); - - // Wrap the per-image data into a struct. This struct will be copied by value - // during the function call, so we don't need to allocate memory for the - // struct itself. We just set the pointers to the on device vectors. 
- PerImageData device_image_data; - device_image_data.num_images = num_images; - device_image_data.image_times = device_times; - device_image_data.psi_params = nullptr; - device_image_data.phi_params = nullptr; - - dim3 blocks(num_trajectories, 1, 1); - dim3 threads(1, stamp_width, stamp_width); - - // Create the stamps. - deviceGetCoaddStamp<<>>(num_images, width, height, device_img, device_image_data, - num_trajectories, device_trjs, params, device_use_index, - device_res); - cudaDeviceSynchronize(); - - // Free up the unneeded memory (everything except for the on-device results). - checkCudaErrors(cudaFree(device_img)); - if (device_use_index != nullptr) checkCudaErrors(cudaFree(device_use_index)); - checkCudaErrors(cudaFree(device_times)); - checkCudaErrors(cudaFree(device_trjs)); - cudaDeviceSynchronize(); - - // Read back results - checkCudaErrors( - cudaMemcpy(results, device_res, sizeof(float) * num_stamp_pixels, cudaMemcpyDeviceToHost)); - cudaDeviceSynchronize(); - - // Free the rest of the on GPU memory. 
- checkCudaErrors(cudaFree(device_res)); - } -*/ } /* namespace search */ #endif /* KERNELS_CU_ */ From 0839114ec797a8869f94cbd5e5821a9b1e3d9eb2 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 07:58:44 -0500 Subject: [PATCH 06/27] Fix bad merge --- src/kbmod/search/kernels.cu | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/kbmod/search/kernels.cu b/src/kbmod/search/kernels.cu index a70e41bcc..21bf19a9c 100644 --- a/src/kbmod/search/kernels.cu +++ b/src/kbmod/search/kernels.cu @@ -337,8 +337,8 @@ extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters par // Launch Search searchFilterImages<<>>(search_data.get_meta_data(), search_data.get_gpu_array_ptr(), - device_img_times, params, num_trajectories, device_tests, - device_search_results); + static_cast(search_data.get_gpu_time_array_ptr()), + params, num_trajectories, device_tests, device_search_results); cudaDeviceSynchronize(); // Read back results From ca87995c15e4438b64c947ed8d6b51a6e50f1bf9 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 10:11:29 -0500 Subject: [PATCH 07/27] Remove unused functions --- src/kbmod/search/common.h | 22 ---------------------- src/kbmod/search/stack_search.cpp | 24 ++++-------------------- src/kbmod/search/stack_search.h | 4 ---- 3 files changed, 4 insertions(+), 46 deletions(-) diff --git a/src/kbmod/search/common.h b/src/kbmod/search/common.h index 394497930..b1e47eb66 100644 --- a/src/kbmod/search/common.h +++ b/src/kbmod/search/common.h @@ -26,18 +26,6 @@ constexpr float NO_DATA = -9999.0; enum StampType { STAMP_SUM = 0, STAMP_MEAN, STAMP_MEDIAN }; -// The position (in pixels) of a trajectory. 
-struct PixelPos { - float x; - float y; - - const std::string to_string() const { return "x: " + std::to_string(x) + " y: " + std::to_string(y); } - - const std::string to_yaml() const { - return "{x: " + std::to_string(x) + ", y: " + std::to_string(y) + "}"; - } -}; - /* * Data structure to represent an objects trajectory * through a stack of images @@ -59,7 +47,6 @@ struct Trajectory { // Get pixel positions from a zero-shifted time. float get_x_pos(float time) const { return x + time * vx; } float get_y_pos(float time) const { return y + time * vy; } - PixelPos get_pos(float time) const { return {x + time * vx, y + time * vy}; } // I can't believe string::format is not a thing until C++ 20 const std::string to_string() const { @@ -162,15 +149,6 @@ static void trajectory_bindings(py::module &m) { })); } -static void pixel_pos_bindings(py::module &m) { - py::class_(m, "PixelPos", pydocs::DOC_PixelPos) - .def(py::init<>()) - .def_readwrite("x", &PixelPos::x) - .def_readwrite("y", &PixelPos::y) - .def("__repr__", [](const PixelPos &p) { return "PixelPos(" + p.to_string() + ")"; }) - .def("__str__", &PixelPos::to_string); -} - static void image_moments_bindings(py::module &m) { py::class_(m, "ImageMoments", pydocs::DOC_ImageMoments) .def(py::init<>()) diff --git a/src/kbmod/search/stack_search.cpp b/src/kbmod/search/stack_search.cpp index ba31ef247..4c8777c84 100644 --- a/src/kbmod/search/stack_search.cpp +++ b/src/kbmod/search/stack_search.cpp @@ -159,21 +159,6 @@ void StackSearch::create_search_list(int angle_steps, int velocity_steps, float timer.stop(); } -Point StackSearch::get_trajectory_position(const Trajectory& t, int i) const { - float time = stack.get_zeroed_time(i); - return {t.x + time * t.vx, t.y + time * t.vy}; -} - -std::vector StackSearch::get_trajectory_positions(Trajectory& t) const { - std::vector results; - int num_times = stack.img_count(); - for (int i = 0; i < num_times; ++i) { - Point pos = get_trajectory_position(t, i); - 
results.push_back(pos); - } - return results; -} - std::vector StackSearch::create_curves(Trajectory t, const std::vector& imgs) { /*Create a lightcurve from an image along a trajectory * @@ -188,12 +173,13 @@ std::vector StackSearch::create_curves(Trajectory t, const std::vector lightcurve; lightcurve.reserve(img_size); - std::vector times = stack.build_zeroed_times(); for (int i = 0; i < img_size; ++i) { /* Do not use get_pixel_interp(), because results from create_curves must * be able to recover the same likelihoods as the ones reported by the - * gpu search.*/ - Point p({t.x + times[i] * t.vx + 0.5f, t.y + times[i] * t.vy + 0.5f}); + * gpu search. Shift by 0.5 pixels to center as done on GPU. */ + float time = stack.get_zeroed_time(i); + Point p{t.get_x_pos(time) + 0.5f, t.get_y_pos(time) + 0.5f}; + float pix_val = imgs[i].get_pixel(p.to_index()); if (pix_val == NO_DATA) pix_val = 0.0; lightcurve.push_back(pix_val); @@ -282,8 +268,6 @@ static void stack_search_bindings(py::module& m) { .def("get_imagestack", &ks::get_imagestack, py::return_value_policy::reference_internal, pydocs::DOC_StackSearch_get_imagestack) // For testings - .def("get_trajectory_position", &ks::get_trajectory_position, - pydocs::DOC_StackSearch_get_trajectory_position) .def("get_psi_curves", (std::vector(ks::*)(tj&)) & ks::get_psi_curves, pydocs::DOC_StackSearch_get_psi_curves) .def("get_phi_curves", (std::vector(ks::*)(tj&)) & ks::get_phi_curves, diff --git a/src/kbmod/search/stack_search.h b/src/kbmod/search/stack_search.h index 597f78850..fbb9568a1 100644 --- a/src/kbmod/search/stack_search.h +++ b/src/kbmod/search/stack_search.h @@ -50,10 +50,6 @@ class StackSearch { // Gets the vector of result trajectories. std::vector get_results(int start, int end); - // Get the predicted (pixel) positions for a given trajectory. 
- Point get_trajectory_position(const Trajectory& t, int i) const; - std::vector get_trajectory_positions(Trajectory& t) const; - // Filters the results based on various parameters. void filter_results(int min_observations); void filter_results_lh(float min_lh); From ddb56d7d4e3d7db2526be238eeaedd71c8b18ae4 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 10:27:57 -0500 Subject: [PATCH 08/27] small fixes --- src/kbmod/search/bindings.cpp | 1 - src/kbmod/search/common.h | 1 - 2 files changed, 2 deletions(-) diff --git a/src/kbmod/search/bindings.cpp b/src/kbmod/search/bindings.cpp index 4175c9639..225bf477b 100644 --- a/src/kbmod/search/bindings.cpp +++ b/src/kbmod/search/bindings.cpp @@ -37,7 +37,6 @@ PYBIND11_MODULE(search, m) { search::stack_search_bindings(m); search::stamp_creator_bindings(m); search::trajectory_bindings(m); - search::pixel_pos_bindings(m); search::image_moments_bindings(m); search::stamp_parameters_bindings(m); search::psi_phi_array_binding(m); diff --git a/src/kbmod/search/common.h b/src/kbmod/search/common.h index b1e47eb66..b7c89663e 100644 --- a/src/kbmod/search/common.h +++ b/src/kbmod/search/common.h @@ -133,7 +133,6 @@ static void trajectory_bindings(py::module &m) { .def_readwrite("obs_count", &tj::obs_count) .def("get_x_pos", &tj::get_x_pos, pydocs::DOC_Trajectory_get_x_pos) .def("get_y_pos", &tj::get_y_pos, pydocs::DOC_Trajectory_get_y_pos) - .def("get_pos", &tj::get_pos, pydocs::DOC_Trajectory_get_pos) .def("__repr__", [](const tj &t) { return "Trajectory(" + t.to_string() + ")"; }) .def("__str__", &tj::to_string) .def(py::pickle( From ea0dee6a5e12600dc5df9649431f8d3d163b17bc Mon Sep 17 00:00:00 2001 From: DinoBektesevic Date: Fri, 2 Feb 2024 12:14:00 -0800 Subject: [PATCH 09/27] Skip regression test when no GPU exists. 
--- tests/test_regression_test.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/test_regression_test.py b/tests/test_regression_test.py index fe8a08e0e..56c099a6e 100644 --- a/tests/test_regression_test.py +++ b/tests/test_regression_test.py @@ -511,6 +511,7 @@ def run_full_test(): # The unit test runner class test_regression_test(unittest.TestCase): + @unittest.skipIf(not HAS_GPU, "Skipping test (no GPU detected)") def test_run_test(self): self.assertTrue(run_full_test()) From e4a4a089a85e85ac1ab0f715caf9e6267f3855e5 Mon Sep 17 00:00:00 2001 From: DinoBektesevic Date: Fri, 2 Feb 2024 12:38:20 -0800 Subject: [PATCH 10/27] Fix trajectory position predictions in results. --- src/kbmod/trajectory_utils.py | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/src/kbmod/trajectory_utils.py b/src/kbmod/trajectory_utils.py index e05fde489..0459e1376 100644 --- a/src/kbmod/trajectory_utils.py +++ b/src/kbmod/trajectory_utils.py @@ -67,16 +67,23 @@ def trajectory_predict_skypos(trj, wcs, times): times : `list` or `numpy.ndarray` The times at which to predict the positions. + .. note:: + The motion is approximated as linear and will be approximately correct + only for small temporal range and spatial region. In essence, the new + coordinates are calculated as: + :math: x_new = x_old + v * (t_new - t_old) + Returns ------- result : `astropy.coordinates.SkyCoord` A SkyCoord with the transformed locations. """ - np_times = np.array(times) + dt = np.array(times) + dt -= dt[0] # Predict locations in pixel space. 
- x_vals = trj.x + trj.vx * np_times - y_vals = trj.y + trj.vy * np_times + x_vals = trj.x + trj.vx * dt + y_vals = trj.y + trj.vy * dt result = wcs.pixel_to_world(x_vals, y_vals) return result From 86a080fbc56c5411009bfde5492a34231c5e14ae Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 15:56:08 -0500 Subject: [PATCH 11/27] Initial cleanups --- src/kbmod/search/pydocs/raw_image_docs.h | 1 - src/kbmod/search/pydocs/stack_search_docs.h | 79 ++++++++++++++------- src/kbmod/search/stack_search.cpp | 6 -- src/kbmod/search/stack_search.h | 2 - tests/test_search.py | 50 ------------- 5 files changed, 54 insertions(+), 84 deletions(-) diff --git a/src/kbmod/search/pydocs/raw_image_docs.h b/src/kbmod/search/pydocs/raw_image_docs.h index 7fd2e6c88..09ad76190 100644 --- a/src/kbmod/search/pydocs/raw_image_docs.h +++ b/src/kbmod/search/pydocs/raw_image_docs.h @@ -195,7 +195,6 @@ static const auto DOC_RawImage_center_is_local_max = R"doc( Whether or not the stamp passes the check. )doc"; - static const auto DOC_RawImage_create_stamp = R"doc( Create an image stamp around a given region. diff --git a/src/kbmod/search/pydocs/stack_search_docs.h b/src/kbmod/search/pydocs/stack_search_docs.h index 865ff6103..f52e2aece 100644 --- a/src/kbmod/search/pydocs/stack_search_docs.h +++ b/src/kbmod/search/pydocs/stack_search_docs.h @@ -15,23 +15,48 @@ static const auto DOC_StackSearch_enable_gpu_sigmag_filter = R"doc( )doc"; static const auto DOC_StackSearch_enable_gpu_encoding = R"doc( - todo - )doc"; + Set the encoding level for the data copied to the GPU. + 1 = uint8 + 2 = uint16 + 4 or -1 = float -static const auto DOC_StackSearch_enable_corr = R"doc( - todo + Parameters + ---------- + encode_num_bytes : `int` + The number of bytes to use for encoding the data. )doc"; static const auto DOC_StackSearch_set_start_bounds_x = R"doc( - todo + Set the starting and ending bounds in the x direction for a grid search. 
+ The grid search will test all pixels [x_min, x_max). + + Parameters + ---------- + x_min : `int` + The inclusive lower bound of the search. + x_max : `int` + The exclusive upper bound of the search. )doc"; static const auto DOC_StackSearch_set_start_bounds_y = R"doc( - todo + Set the starting and ending bounds in the y direction for a grid search. + The grid search will test all pixels [y_min, y_max). + + Parameters + ---------- + y_min : `int` + The inclusive lower bound of the search. + y_max : `int` + The exclusive upper bound of the search. )doc"; static const auto DOC_StackSearch_set_debug = R"doc( - todo + Set whether to display debug output. + + Parameters + ---------- + d : `bool` + Set to ``True`` to turn on debug output and ``False`` to turn it off. )doc"; static const auto DOC_StackSearch_filter_min_obs = R"doc( @@ -55,35 +80,39 @@ static const auto DOC_StackSearch_get_image_npixels = R"doc( ")doc"; static const auto DOC_StackSearch_get_imagestack = R"doc( - todo + Return the `kb.ImageStack` containing the data to search. )doc"; -static const auto DOC_StackSearch_get_trajectory_position = R"doc( - todo - )doc"; +static const auto DOC_StackSearch_get_psi_curves = R"doc( + Return the time series of psi values for a given trajectory in pixel space. -static const auto DOC_StackSearch_get_trajectory_positions = R"doc( - todo - )doc"; + Parameters + ---------- + trj : `kb.Trajectory` + The input trajectory. -static const auto DOC_StackSearch_get_psi_curves = R"doc( - todo + Returns + ------- + result : `list` of `float` + The psi values at each time step with NO_DATA replaced by 0.0. )doc"; static const auto DOC_StackSearch_get_phi_curves = R"doc( - todo - )doc"; + Return the time series of phi values for a given trajectory in pixel space. -static const auto DOC_StackSearch_prepare_psi_phi = R"doc( - todo - )doc"; + Parameters + ---------- + trj : `kb.Trajectory` + The input trajectory. 
-static const auto DOC_StackSearch_get_psi_images = R"doc( - todo + Returns + ------- + result : `list` of `float` + The phi values at each time step with NO_DATA replaced by 0.0. )doc"; -static const auto DOC_StackSearch_get_phi_images = R"doc( - todo +static const auto DOC_StackSearch_prepare_psi_phi = R"doc( + Compute the cached psi and phi data. )doc"; static const auto DOC_StackSearch_get_results = R"doc( diff --git a/src/kbmod/search/stack_search.cpp b/src/kbmod/search/stack_search.cpp index 4c8777c84..eb7829304 100644 --- a/src/kbmod/search/stack_search.cpp +++ b/src/kbmod/search/stack_search.cpp @@ -209,10 +209,6 @@ std::vector StackSearch::get_phi_curves(Trajectory& t) { return create_curves(t, phi_images); } -std::vector& StackSearch::get_psi_images() { return psi_images; } - -std::vector& StackSearch::get_phi_images() { return phi_images; } - void StackSearch::sort_results() { __gnu_parallel::sort(results.begin(), results.end(), [](Trajectory a, Trajectory b) { return b.lh < a.lh; }); @@ -273,8 +269,6 @@ static void stack_search_bindings(py::module& m) { .def("get_phi_curves", (std::vector(ks::*)(tj&)) & ks::get_phi_curves, pydocs::DOC_StackSearch_get_phi_curves) .def("prepare_psi_phi", &ks::prepare_psi_phi, pydocs::DOC_StackSearch_prepare_psi_phi) - .def("get_psi_images", &ks::get_psi_images, pydocs::DOC_StackSearch_get_psi_images) - .def("get_phi_images", &ks::get_phi_images, pydocs::DOC_StackSearch_get_phi_images) .def("get_results", &ks::get_results, pydocs::DOC_StackSearch_get_results) .def("set_results", &ks::set_results, pydocs::DOC_StackSearch_set_results); } diff --git a/src/kbmod/search/stack_search.h b/src/kbmod/search/stack_search.h index fbb9568a1..48f3386d9 100644 --- a/src/kbmod/search/stack_search.h +++ b/src/kbmod/search/stack_search.h @@ -55,8 +55,6 @@ class StackSearch { void filter_results_lh(float min_lh); // Getters for the Psi and Phi data. 
- std::vector& get_psi_images(); - std::vector& get_phi_images(); std::vector get_psi_curves(Trajectory& t); std::vector get_phi_curves(Trajectory& t); diff --git a/tests/test_search.py b/tests/test_search.py index 7d27423cc..33c06cc82 100644 --- a/tests/test_search.py +++ b/tests/test_search.py @@ -87,56 +87,6 @@ def setUp(self): self.params.m02_limit = 35.5 self.params.m20_limit = 35.5 - def test_psiphi(self): - p = PSF(0.00001) - - # Image1 has a single object. - height = 19 - width = 5 - image1 = LayeredImage(width, height, 2.0, 4.0, 1.0, p) - add_fake_object(image1, 3.5, 2.5, 400.0, p) - - # Image2 has a single object and a masked pixel. - image2 = LayeredImage(width, height, 2.0, 4.0, 2.0, p) - add_fake_object(image2, 4.5, 2.5, 400.0, p) - - mask = image2.get_mask() - mask.set_pixel(9, 4, 1) - image2.apply_mask(1) - - # Create a stack from the two objects. - stack = ImageStack([image1, image2]) - search = StackSearch(stack) - - # Generate psi and phi. - search.prepare_psi_phi() - psi = search.get_psi_images() - phi = search.get_phi_images() - - # Test phi and psi for image1. - sci = image1.get_science() - var = image1.get_variance() - for x in range(width): - for y in range(height): - self.assertAlmostEqual( - psi[0].get_pixel(y, x), sci.get_pixel(y, x) / var.get_pixel(y, x), delta=1e-6 - ) - self.assertAlmostEqual(phi[0].get_pixel(y, x), 1.0 / var.get_pixel(y, x), delta=1e-6) - - # Test phi and psi for image2. 
- sci = image2.get_science() - var = image2.get_variance() - for x in range(width): - for y in range(height): - if x == 4 and y == 9: - self.assertFalse(psi[1].pixel_has_data(y, x)) - self.assertFalse(phi[1].pixel_has_data(y, x)) - else: - self.assertAlmostEqual( - psi[1].get_pixel(y, x), sci.get_pixel(y, x) / var.get_pixel(y, x), delta=1e-6 - ) - self.assertAlmostEqual(phi[1].get_pixel(y, x), 1.0 / var.get_pixel(y, x), delta=1e-6) - @unittest.skipIf(not HAS_GPU, "Skipping test (no GPU detected)") def test_results(self): self.search.search( From 43e82a83d5e811b3f7978ba6b24c5863bd6af0ad Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 16:20:57 -0500 Subject: [PATCH 12/27] Revert the name change --- src/kbmod/search/bindings.cpp | 4 +- src/kbmod/search/kernels.cu | 31 ++++----- src/kbmod/search/layered_image.cpp | 8 +-- .../{search_data.cpp => psi_phi_array.cpp} | 0 .../{search_data_ds.h => psi_phi_array_ds.h} | 24 +++---- ...rch_data_utils.h => psi_phi_array_utils.h} | 20 +++--- src/kbmod/search/pydocs/search_data_docs.h | 66 +++++++++---------- src/kbmod/search/stack_search.cpp | 7 +- src/kbmod/search/stack_search.h | 4 +- ...t_search_data.py => test_psi_phi_array.py} | 10 +-- 10 files changed, 88 insertions(+), 86 deletions(-) rename src/kbmod/search/{search_data.cpp => psi_phi_array.cpp} (100%) rename src/kbmod/search/{search_data_ds.h => psi_phi_array_ds.h} (91%) rename src/kbmod/search/{search_data_utils.h => psi_phi_array_utils.h} (52%) rename tests/{test_search_data.py => test_psi_phi_array.py} (98%) diff --git a/src/kbmod/search/bindings.cpp b/src/kbmod/search/bindings.cpp index c39343c2a..225bf477b 100644 --- a/src/kbmod/search/bindings.cpp +++ b/src/kbmod/search/bindings.cpp @@ -16,7 +16,7 @@ namespace py = pybind11; #include "stack_search.cpp" #include "stamp_creator.cpp" #include "kernel_testing_helpers.cpp" -#include "search_data.cpp" +#include "psi_phi_array.cpp" 
PYBIND11_MODULE(search, m) { m.attr("KB_NO_DATA") = pybind11::float_(search::NO_DATA); @@ -39,7 +39,7 @@ PYBIND11_MODULE(search, m) { search::trajectory_bindings(m); search::image_moments_bindings(m); search::stamp_parameters_bindings(m); - search::search_data_binding(m); + search::psi_phi_array_binding(m); // Functions from raw_image.cpp m.def("create_median_image", &search::create_median_image); m.def("create_summed_image", &search::create_summed_image); diff --git a/src/kbmod/search/kernels.cu b/src/kbmod/search/kernels.cu index 21bf19a9c..c400c4380 100644 --- a/src/kbmod/search/kernels.cu +++ b/src/kbmod/search/kernels.cu @@ -19,11 +19,11 @@ #include "common.h" #include "cuda_errors.h" -#include "search_data_ds.h" +#include "psi_phi_array_ds.h" namespace search { -extern "C" void device_allocate_search_data_arrays(SearchData *data) { +extern "C" void device_allocate_psi_phi_array_arrays(PsiPhiArray *data) { if (!data->cpu_array_allocated() || !data->cpu_time_array_allocated()) { throw std::runtime_error("CPU data is not allocated."); } @@ -47,7 +47,7 @@ extern "C" void device_allocate_search_data_arrays(SearchData *data) { data->set_gpu_time_array_ptr(device_times_ptr); } -extern "C" void device_free_search_data_arrays(SearchData *data) { +extern "C" void device_free_psi_phi_array_arrays(PsiPhiArray *data) { if (data->gpu_array_allocated()) { checkCudaErrors(cudaFree(data->get_gpu_array_ptr())); data->set_gpu_array_ptr(nullptr); @@ -58,8 +58,8 @@ extern "C" void device_free_search_data_arrays(SearchData *data) { } } -__host__ __device__ PsiPhi read_encoded_psi_phi(SearchDataMeta ¶ms, void *psi_phi_vect, int time, - int row, int col) { +__host__ __device__ PsiPhi read_encoded_psi_phi(PsiPhiArrayMeta ¶ms, void *psi_phi_vect, int time, + int row, int col) { // Bounds checking. 
if ((row < 0) || (col < 0) || (row >= params.height) || (col >= params.width)) { return {NO_DATA, NO_DATA}; @@ -141,11 +141,12 @@ extern "C" __device__ __host__ void SigmaGFilteredIndicesCU(float *values, int n /* * Evaluate the likelihood score (as computed with from the psi and phi values) for a single - * given candidate trajectory. Modifies the trajectory in place to update the number of + * given candidate trajectory. Modifies the trajectory in place to update the number of * observations, likelihood, and flux. */ -extern "C" __device__ __host__ void evaluateTrajectory(SearchDataMeta psi_phi_meta, void *psi_phi_vect, float *image_times, - SearchParameters params, Trajectory *candidate) { +extern "C" __device__ __host__ void evaluateTrajectory(PsiPhiArrayMeta psi_phi_meta, void *psi_phi_vect, + float *image_times, SearchParameters params, + Trajectory *candidate) { // Data structures used for filtering. We fill in only what we need. float psi_array[MAX_NUM_IMAGES]; float phi_array[MAX_NUM_IMAGES]; @@ -222,7 +223,7 @@ extern "C" __device__ __host__ void evaluateTrajectory(SearchDataMeta psi_phi_me * * Creates a local copy of psi_phi_meta and params in local memory space. */ -__global__ void searchFilterImages(SearchDataMeta psi_phi_meta, void *psi_phi_vect, float *image_times, +__global__ void searchFilterImages(PsiPhiArrayMeta psi_phi_meta, void *psi_phi_vect, float *image_times, SearchParameters params, int num_trajectories, Trajectory *trajectories, Trajectory *results) { // Get the x and y coordinates within the search space. 
@@ -291,23 +292,23 @@ __global__ void searchFilterImages(SearchDataMeta psi_phi_meta, void *psi_phi_ve } } -extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters params, int num_trajectories, +extern "C" void deviceSearchFilter(PsiPhiArray &psi_phi_array, SearchParameters params, int num_trajectories, Trajectory *trj_to_search, int num_results, Trajectory *best_results) { // Allocate Device memory Trajectory *device_tests; Trajectory *device_search_results; // Check the hard coded maximum number of images against the num_images. - int num_images = search_data.get_num_times(); + int num_images = psi_phi_array.get_num_times(); if (num_images > MAX_NUM_IMAGES) { throw std::runtime_error("Number of images exceeds GPU maximum."); } // Check that the device vectors have already been allocated. - if (search_data.gpu_array_allocated() == false) { + if (psi_phi_array.gpu_array_allocated() == false) { throw std::runtime_error("PsiPhi data has not been created."); } - if (search_data.gpu_time_array_allocated() == false) { + if (psi_phi_array.gpu_time_array_allocated() == false) { throw std::runtime_error("GPU time data has not been created."); } @@ -336,8 +337,8 @@ extern "C" void deviceSearchFilter(SearchData &search_data, SearchParameters par dim3 threads(THREAD_DIM_X, THREAD_DIM_Y); // Launch Search - searchFilterImages<<>>(search_data.get_meta_data(), search_data.get_gpu_array_ptr(), - static_cast(search_data.get_gpu_time_array_ptr()), + searchFilterImages<<>>(psi_phi_array.get_meta_data(), psi_phi_array.get_gpu_array_ptr(), + static_cast(psi_phi_array.get_gpu_time_array_ptr()), params, num_trajectories, device_tests, device_search_results); cudaDeviceSynchronize(); diff --git a/src/kbmod/search/layered_image.cpp b/src/kbmod/search/layered_image.cpp index 903ec82ad..ba7efbb06 100644 --- a/src/kbmod/search/layered_image.cpp +++ b/src/kbmod/search/layered_image.cpp @@ -40,12 +40,12 @@ LayeredImage::LayeredImage(const RawImage& sci, const RawImage& 
var, const RawIm variance = var; } -LayeredImage::LayeredImage(unsigned w, unsigned h, float noise_stdev, float pixel_variance, - double time, const PSF& psf) +LayeredImage::LayeredImage(unsigned w, unsigned h, float noise_stdev, float pixel_variance, double time, + const PSF& psf) : LayeredImage(w, h, noise_stdev, pixel_variance, time, psf, -1) {} -LayeredImage::LayeredImage(unsigned w, unsigned h, float noise_stdev, float pixel_variance, - double time, const PSF& psf, int seed) +LayeredImage::LayeredImage(unsigned w, unsigned h, float noise_stdev, float pixel_variance, double time, + const PSF& psf, int seed) : psf(psf), width(w), height(h) { std::random_device r; std::default_random_engine generator(r()); diff --git a/src/kbmod/search/search_data.cpp b/src/kbmod/search/psi_phi_array.cpp similarity index 100% rename from src/kbmod/search/search_data.cpp rename to src/kbmod/search/psi_phi_array.cpp diff --git a/src/kbmod/search/search_data_ds.h b/src/kbmod/search/psi_phi_array_ds.h similarity index 91% rename from src/kbmod/search/search_data_ds.h rename to src/kbmod/search/psi_phi_array_ds.h index 7a64842ce..477b17041 100644 --- a/src/kbmod/search/search_data_ds.h +++ b/src/kbmod/search/psi_phi_array_ds.h @@ -1,5 +1,5 @@ /* - * search_data_ds.h + * psi_phi_array_ds.h * * The data structure for the raw data needed for the search algorith, * including the psi/phi values and the zeroed times. The the data @@ -17,8 +17,8 @@ * Created on: Dec 5, 2023 */ -#ifndef SEARCH_DATA_DS_ -#define SEARCH_DATA_DS_ +#ifndef PSI_PHI_ARRAY_DS_ +#define PSI_PHI_ARRAY_DS_ #include #include @@ -44,8 +44,8 @@ inline float decode_uint_scalar(float value, float min_val, float scale) { return (value == 0.0) ? NO_DATA : (value - 1.0) * scale + min_val; } -// The struct of meta data for the SearchData. -struct SearchDataMeta { +// The struct of meta data for the PsiPhiArray. 
+struct PsiPhiArrayMeta { int num_times = 0; int width = 0; int height = 0; @@ -66,17 +66,17 @@ struct SearchDataMeta { float phi_scale = 1.0; }; -/* SearchData is a class to hold the psi and phi arrays for the CPU and GPU as well as +/* PsiPhiArray is a class to hold the psi and phi arrays for the CPU and GPU as well as the meta data and functions to do encoding and decoding on CPU. */ -class SearchData { +class PsiPhiArray { public: - explicit SearchData(); - virtual ~SearchData(); + explicit PsiPhiArray(); + virtual ~PsiPhiArray(); void clear(); - inline SearchDataMeta& get_meta_data() { return meta_data; } + inline PsiPhiArrayMeta& get_meta_data() { return meta_data; } // --- Getter functions (for Python interface) ---------------- inline int get_num_bytes() { return meta_data.num_bytes; } @@ -121,7 +121,7 @@ class SearchData { inline void set_gpu_time_array_ptr(float* new_ptr) { gpu_time_array = new_ptr; } private: - SearchDataMeta meta_data; + PsiPhiArrayMeta meta_data; // Pointers to the arrays void* cpu_array_ptr = nullptr; @@ -132,4 +132,4 @@ class SearchData { } /* namespace search */ -#endif /* SEARCH_DATA_DS_ */ +#endif /* PSI_PHI_ARRAY_DS_ */ diff --git a/src/kbmod/search/search_data_utils.h b/src/kbmod/search/psi_phi_array_utils.h similarity index 52% rename from src/kbmod/search/search_data_utils.h rename to src/kbmod/search/psi_phi_array_utils.h index 683895ce4..3573df268 100644 --- a/src/kbmod/search/search_data_utils.h +++ b/src/kbmod/search/psi_phi_array_utils.h @@ -1,5 +1,5 @@ /* - * search_data_utils.h + * psi_phi_array_utils.h * * The utility functions for the psi/phi array. 
Broken out from the header * data structure so that it can use packages that won't be imported into the @@ -8,8 +8,8 @@ * Created on: Dec 8, 2023 */ -#ifndef SEARCH_DATA_UTILS_ -#define SEARCH_DATA_UTILS_ +#ifndef PSI_PHI_ARRAY_UTILS_ +#define PSI_PHI_ARRAY_UTILS_ #include #include @@ -19,7 +19,7 @@ #include "common.h" #include "image_stack.h" #include "layered_image.h" -#include "search_data_ds.h" +#include "psi_phi_array_ds.h" #include "raw_image.h" namespace search { @@ -27,13 +27,13 @@ namespace search { // Compute the min, max, and scale parameter from the a vector of image data. std::array compute_scale_params_from_image_vect(const std::vector& imgs, int num_bytes); -void fill_search_data(SearchData& result_data, int num_bytes, const std::vector& psi_imgs, - const std::vector& phi_imgs, const std::vector zeroed_times, - bool debug = false); +void fill_psi_phi_array(PsiPhiArray& result_data, int num_bytes, const std::vector& psi_imgs, + const std::vector& phi_imgs, const std::vector zeroed_times, + bool debug = false); -void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, - bool debug = false); +void fill_psi_phi_array_from_image_stack(PsiPhiArray& result_data, ImageStack& stack, int num_bytes, + bool debug = false); } /* namespace search */ -#endif /* SEARCH_DATA_UTILS_ */ +#endif /* PSI_PHI_ARRAY_UTILS_ */ diff --git a/src/kbmod/search/pydocs/search_data_docs.h b/src/kbmod/search/pydocs/search_data_docs.h index 4f668e3ea..05abe3053 100644 --- a/src/kbmod/search/pydocs/search_data_docs.h +++ b/src/kbmod/search/pydocs/search_data_docs.h @@ -1,5 +1,5 @@ -#ifndef SEARCH_DATA_DOCS -#define SEARCH_DATA_DOCS +#ifndef PSI_PHI_ARRAY_DOCS +#define PSI_PHI_ARRAY_DOCS namespace pydocs { @@ -14,88 +14,88 @@ static const auto DOC_PsiPhi = R"doc( The phi value at a pixel. 
)doc"; -static const auto DOC_SearchData = R"doc( +static const auto DOC_PsiPhiArray = R"doc( An encoded array of Psi and Phi values along with their meta data. )doc"; -static const auto DOC_SearchData_get_num_bytes = R"doc( +static const auto DOC_PsiPhiArray_get_num_bytes = R"doc( The target number of bytes to use for encoding the data (1 for uint8, 2 for uint16, or 4 for float32). Might differ from actual number of bytes (block_size). )doc"; -static const auto DOC_SearchData_get_num_times = R"doc( +static const auto DOC_PsiPhiArray_get_num_times = R"doc( The number of times. )doc"; -static const auto DOC_SearchData_get_width = R"doc( +static const auto DOC_PsiPhiArray_get_width = R"doc( The image width. )doc"; -static const auto DOC_SearchData_get_height = R"doc( +static const auto DOC_PsiPhiArray_get_height = R"doc( The image height. )doc"; -static const auto DOC_SearchData_get_pixels_per_image = R"doc( +static const auto DOC_PsiPhiArray_get_pixels_per_image = R"doc( The number of pixels per each image. )doc"; -static const auto DOC_SearchData_get_num_entries = R"doc( +static const auto DOC_PsiPhiArray_get_num_entries = R"doc( The number of array entries. )doc"; -static const auto DOC_SearchData_get_total_array_size = R"doc( +static const auto DOC_PsiPhiArray_get_total_array_size = R"doc( The size of the array in bytes. )doc"; -static const auto DOC_SearchData_get_block_size = R"doc( +static const auto DOC_PsiPhiArray_get_block_size = R"doc( The size of a single entry in bytes. )doc"; -static const auto DOC_SearchData_get_psi_min_val = R"doc( +static const auto DOC_PsiPhiArray_get_psi_min_val = R"doc( The minimum value of psi used in the scaling computations. )doc"; -static const auto DOC_SearchData_get_psi_max_val = R"doc( +static const auto DOC_PsiPhiArray_get_psi_max_val = R"doc( The maximum value of psi used in the scaling computations. 
)doc"; -static const auto DOC_SearchData_get_psi_scale = R"doc( +static const auto DOC_PsiPhiArray_get_psi_scale = R"doc( The scaling parameter for psi. )doc"; -static const auto DOC_SearchData_get_phi_min_val = R"doc( +static const auto DOC_PsiPhiArray_get_phi_min_val = R"doc( The minimum value of phi used in the scaling computations. )doc"; -static const auto DOC_SearchData_get_phi_max_val = R"doc( +static const auto DOC_PsiPhiArray_get_phi_max_val = R"doc( The maximum value of phi used in the scaling computations. )doc"; -static const auto DOC_SearchData_get_phi_scale = R"doc( +static const auto DOC_PsiPhiArray_get_phi_scale = R"doc( The scaling parameter for phi. )doc"; -static const auto DOC_SearchData_get_cpu_array_allocated = R"doc( +static const auto DOC_PsiPhiArray_get_cpu_array_allocated = R"doc( A Boolean indicating whether the cpu data (psi/phi) array exists. )doc"; -static const auto DOC_SearchData_get_gpu_array_allocated = R"doc( +static const auto DOC_PsiPhiArray_get_gpu_array_allocated = R"doc( A Boolean indicating whether the gpu data (psi/phi) array exists. )doc"; -static const auto DOC_SearchData_get_cpu_time_array_allocated = R"doc( +static const auto DOC_PsiPhiArray_get_cpu_time_array_allocated = R"doc( A Boolean indicating whether the cpu time array exists. )doc"; -static const auto DOC_SearchData_get_gpu_time_array_allocated = R"doc( +static const auto DOC_PsiPhiArray_get_gpu_time_array_allocated = R"doc( A Boolean indicating whether the gpu time array exists. )doc"; -static const auto DOC_SearchData_clear = R"doc( +static const auto DOC_PsiPhiArray_clear = R"doc( Clear all data and free the arrays. )doc"; -static const auto DOC_SearchData_read_psi_phi = R"doc( +static const auto DOC_PsiPhiArray_read_psi_phi = R"doc( Read a PsiPhi value from the CPU array. Parameters @@ -113,7 +113,7 @@ static const auto DOC_SearchData_read_psi_phi = R"doc( The pixel values. 
)doc"; -static const auto DOC_SearchData_read_time = R"doc( +static const auto DOC_PsiPhiArray_read_time = R"doc( Read a zeroed time value from the CPU array. Parameters @@ -127,9 +127,9 @@ static const auto DOC_SearchData_read_time = R"doc( The time. )doc"; -static const auto DOC_SearchData_set_meta_data = R"doc( +static const auto DOC_PsiPhiArray_set_meta_data = R"doc( Set the meta data for the array. Automatically called by - fill_search_data(). + fill_psi_phi_array(). Parameters ---------- @@ -143,12 +143,12 @@ static const auto DOC_SearchData_set_meta_data = R"doc( The width of each image in pixels. )doc"; -static const auto DOC_SearchData_fill_search_data = R"doc( - Fill the SearchData from Psi and Phi images. +static const auto DOC_PsiPhiArray_fill_psi_phi_array = R"doc( + Fill the PsiPhiArray from Psi and Phi images. Parameters ---------- - result_data : `SearchData` + result_data : `PsiPhiArray` The location to store the data. num_bytes : `int` The type of encoding to use (1, 2, or 4). @@ -160,12 +160,12 @@ static const auto DOC_SearchData_fill_search_data = R"doc( A list of floating point times starting at zero. )doc"; -static const auto DOC_SearchData_fill_search_data_from_image_stack = R"doc( - Fill the SearchData an ImageStack. +static const auto DOC_PsiPhiArray_fill_psi_phi_array_from_image_stack = R"doc( + Fill the PsiPhiArray an ImageStack. Parameters ---------- - result_data : `SearchData` + result_data : `PsiPhiArray` The location to store the data. num_bytes : `int` The type of encoding to use (1, 2, or 4). 
@@ -175,4 +175,4 @@ static const auto DOC_SearchData_fill_search_data_from_image_stack = R"doc( } // namespace pydocs -#endif /* SEARCH_DATA_DOCS */ +#endif /* PSI_PHI_ARRAY_DOCS */ diff --git a/src/kbmod/search/stack_search.cpp b/src/kbmod/search/stack_search.cpp index 401177d62..c945b4507 100644 --- a/src/kbmod/search/stack_search.cpp +++ b/src/kbmod/search/stack_search.cpp @@ -2,7 +2,7 @@ namespace search { #ifdef HAVE_CUDA -extern "C" void deviceSearchFilter(SearchData& search_data, SearchParameters params, int num_trajectories, +extern "C" void deviceSearchFilter(PsiPhiArray& psi_phi_array, SearchParameters params, int num_trajectories, Trajectory* trj_to_search, int num_results, Trajectory* best_results); #endif @@ -75,8 +75,9 @@ void StackSearch::search(int ang_steps, int vel_steps, float min_ang, float max_ DebugTimer psi_phi_timer = DebugTimer("Creating psi/phi buffers", debug_info); prepare_psi_phi(); - SearchData psi_phi_data; - fill_search_data(psi_phi_data, params.encode_num_bytes, psi_images, phi_images, image_times, debug_info); + PsiPhiArray psi_phi_data; + fill_psi_phi_array(psi_phi_data, params.encode_num_bytes, psi_images, phi_images, image_times, + debug_info); psi_phi_timer.stop(); // Allocate a vector for the results. 
diff --git a/src/kbmod/search/stack_search.h b/src/kbmod/search/stack_search.h index ca7ebdd9f..fbb9568a1 100644 --- a/src/kbmod/search/stack_search.h +++ b/src/kbmod/search/stack_search.h @@ -16,8 +16,8 @@ #include "geom.h" #include "image_stack.h" #include "psf.h" -#include "search_data_ds.h" -#include "search_data_utils.h" +#include "psi_phi_array_ds.h" +#include "psi_phi_array_utils.h" #include "pydocs/stack_search_docs.h" #include "stamp_creator.h" diff --git a/tests/test_search_data.py b/tests/test_psi_phi_array.py similarity index 98% rename from tests/test_search_data.py rename to tests/test_psi_phi_array.py index 80b847365..0e805dd7c 100644 --- a/tests/test_search_data.py +++ b/tests/test_psi_phi_array.py @@ -9,7 +9,7 @@ ImageStack, LayeredImage, PsiPhi, - SearchData, + PsiPhiArray, RawImage, compute_scale_params_from_image_vect, decode_uint_scalar, @@ -39,7 +39,7 @@ def setUp(self): self.zeroed_times = [0.0, 1.0] def test_set_meta_data(self): - arr = SearchData() + arr = PsiPhiArray() self.assertEqual(arr.num_times, 0) self.assertEqual(arr.num_bytes, 4) self.assertEqual(arr.width, 0) @@ -130,7 +130,7 @@ def test_compute_scale_params_from_image_vect(self): def test_fill_search_data(self): for num_bytes in [2, 4]: - arr = SearchData() + arr = PsiPhiArray() fill_search_data( arr, num_bytes, [self.psi_1, self.psi_2], [self.phi_1, self.phi_2], self.zeroed_times, False ) @@ -191,8 +191,8 @@ def test_fill_search_data_from_image_stack(self): ) im_stack = ImageStack(images) - # Create the SearchData from the ImageStack. - arr = SearchData() + # Create the PsiPhiArray from the ImageStack. + arr = PsiPhiArray() fill_search_data_from_image_stack(arr, im_stack, 4, False) # Check the meta data. 
From a0605b6db638729a78904fb841b1cf52a1f5ca28 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 16:23:41 -0500 Subject: [PATCH 13/27] Update psi_phi_array.cpp --- src/kbmod/search/psi_phi_array.cpp | 112 ++++++++++++++--------------- 1 file changed, 56 insertions(+), 56 deletions(-) diff --git a/src/kbmod/search/psi_phi_array.cpp b/src/kbmod/search/psi_phi_array.cpp index ae2e1c425..329d7493e 100644 --- a/src/kbmod/search/psi_phi_array.cpp +++ b/src/kbmod/search/psi_phi_array.cpp @@ -1,25 +1,25 @@ -#include "search_data_ds.h" -#include "search_data_utils.h" -#include "pydocs/search_data_docs.h" +#include "psi_phi_array_ds.h" +#include "psi_phi_array_utils.h" +#include "pydocs/psi_phi_array_docs.h" namespace search { // Declaration of CUDA functions that will be linked in. #ifdef HAVE_CUDA -extern "C" void device_allocate_search_data_arrays(SearchData* data); +extern "C" void device_allocate_psi_phi_array_arrays(PsiPhiArray* data); -extern "C" void device_free_search_data_arrays(SearchData* data); +extern "C" void device_free_psi_phi_array_arrays(PsiPhiArray* data); #endif // ------------------------------------------------------- // --- Implementation of core data structure functions --- // ------------------------------------------------------- -SearchData::SearchData() {} +PsiPhiArray::PsiPhiArray() {} -SearchData::~SearchData() { clear(); } +PsiPhiArray::~PsiPhiArray() { clear(); } -void SearchData::clear() { +void PsiPhiArray::clear() { // Free all used memory on CPU and GPU. 
if (cpu_array_ptr != nullptr) { free(cpu_array_ptr); @@ -31,7 +31,7 @@ void SearchData::clear() { } #ifdef HAVE_CUDA if ((gpu_array_ptr != nullptr) || (gpu_time_array != nullptr)) { - device_free_search_data_arrays(this); + device_free_psi_phi_array_arrays(this); gpu_array_ptr = nullptr; gpu_time_array = nullptr; } @@ -54,7 +54,7 @@ void SearchData::clear() { meta_data.phi_scale = 1.0; } -void SearchData::set_meta_data(int new_num_bytes, int new_num_times, int new_height, int new_width) { +void PsiPhiArray::set_meta_data(int new_num_bytes, int new_num_times, int new_height, int new_width) { // Validity checking of parameters. if (new_num_bytes != -1 && new_num_bytes != 1 && new_num_bytes != 2 && new_num_bytes != 4) { throw std::runtime_error("Invalid setting of num_bytes. Must be (-1 [use default], 1, 2, or 4)."); @@ -86,7 +86,7 @@ void SearchData::set_meta_data(int new_num_bytes, int new_num_times, int new_hei meta_data.total_array_size = meta_data.block_size * meta_data.num_entries; } -void SearchData::set_psi_scaling(float min_val, float max_val, float scale_val) { +void PsiPhiArray::set_psi_scaling(float min_val, float max_val, float scale_val) { if (min_val > max_val) throw std::runtime_error("Min value needs to be < max value"); if (scale_val <= 0) throw std::runtime_error("Scale value must be greater than zero."); meta_data.psi_min_val = min_val; @@ -94,7 +94,7 @@ void SearchData::set_psi_scaling(float min_val, float max_val, float scale_val) meta_data.psi_scale = scale_val; } -void SearchData::set_phi_scaling(float min_val, float max_val, float scale_val) { +void PsiPhiArray::set_phi_scaling(float min_val, float max_val, float scale_val) { if (min_val > max_val) throw std::runtime_error("Min value needs to be < max value"); if (scale_val <= 0) throw std::runtime_error("Scale value must be greater than zero."); meta_data.phi_min_val = min_val; @@ -102,7 +102,7 @@ void SearchData::set_phi_scaling(float min_val, float max_val, float scale_val) 
meta_data.phi_scale = scale_val; } -PsiPhi SearchData::read_psi_phi(int time, int row, int col) { +PsiPhi PsiPhiArray::read_psi_phi(int time, int row, int col) { PsiPhi result = {NO_DATA, NO_DATA}; // Array allocation and bounds checking. @@ -136,7 +136,7 @@ PsiPhi SearchData::read_psi_phi(int time, int row, int col) { return result; } -float SearchData::read_time(int time_index) { +float PsiPhiArray::read_time(int time_index) { if (cpu_time_array == nullptr) throw std::runtime_error("Read from unallocated times array."); if ((time_index < 0) || (time_index >= meta_data.num_times)) { throw std::runtime_error("Out of bounds read for time step."); @@ -175,8 +175,8 @@ std::array compute_scale_params_from_image_vect(const std::vector -void set_encode_cpu_search_data(SearchData& data, const std::vector& psi_imgs, - const std::vector& phi_imgs, bool debug) { +void set_encode_cpu_psi_phi_array(PsiPhiArray& data, const std::vector& psi_imgs, + const std::vector& phi_imgs, bool debug) { if (data.get_cpu_array_ptr() != nullptr) { throw std::runtime_error("CPU PsiPhi already allocated."); } @@ -219,8 +219,8 @@ void set_encode_cpu_search_data(SearchData& data, const std::vector& p data.set_cpu_array_ptr((void*)encoded); } -void set_float_cpu_search_data(SearchData& data, const std::vector& psi_imgs, - const std::vector& phi_imgs, bool debug) { +void set_float_cpu_psi_phi_array(PsiPhiArray& data, const std::vector& psi_imgs, + const std::vector& phi_imgs, bool debug) { if (data.get_cpu_array_ptr() != nullptr) { throw std::runtime_error("CPU PsiPhi already allocated."); } @@ -245,9 +245,9 @@ void set_float_cpu_search_data(SearchData& data, const std::vector& ps data.set_cpu_array_ptr((void*)encoded); } -void fill_search_data(SearchData& result_data, int num_bytes, const std::vector& psi_imgs, - const std::vector& phi_imgs, const std::vector zeroed_times, - bool debug) { +void fill_psi_phi_array(PsiPhiArray& result_data, int num_bytes, const std::vector& psi_imgs, + const 
std::vector& phi_imgs, const std::vector zeroed_times, + bool debug) { if (result_data.get_cpu_array_ptr() != nullptr) { return; } @@ -282,16 +282,16 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< // Do the local encoding. if (result_data.get_num_bytes() == 1) { - set_encode_cpu_search_data(result_data, psi_imgs, phi_imgs, debug); + set_encode_cpu_psi_phi_array(result_data, psi_imgs, phi_imgs, debug); } else { - set_encode_cpu_search_data(result_data, psi_imgs, phi_imgs, debug); + set_encode_cpu_psi_phi_array(result_data, psi_imgs, phi_imgs, debug); } } else { if (debug) { printf("Encoding psi and phi as floats.\n"); } // Just interleave psi and phi images. - set_float_cpu_search_data(result_data, psi_imgs, phi_imgs, debug); + set_float_cpu_psi_phi_array(result_data, psi_imgs, phi_imgs, debug); } // Copy the time array. @@ -313,7 +313,7 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< printf("Allocating GPU memory for times array using %lu bytes.\n", times_bytes); } - device_allocate_search_data_arrays(&result_data); + device_allocate_psi_phi_array_arrays(&result_data); if (result_data.get_gpu_array_ptr() == nullptr) { throw std::runtime_error("Unable to allocate GPU PsiPhi array."); } @@ -323,8 +323,8 @@ void fill_search_data(SearchData& result_data, int num_bytes, const std::vector< #endif } -void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stack, int num_bytes, - bool debug) { +void fill_psi_phi_array_from_image_stack(PsiPhiArray& result_data, ImageStack& stack, int num_bytes, + bool debug) { // Compute Phi and Psi from convolved images while leaving masked pixels alone // Reinsert 0s for NO_DATA? std::vector psi_images; @@ -346,7 +346,7 @@ void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stac // Convert these into an array form. Needs the full psi and phi computed first so the // encoding can compute the bounds of each array. 
std::vector zeroed_times = stack.build_zeroed_times(); - fill_search_data(result_data, num_bytes, psi_images, phi_images, zeroed_times, debug); + fill_psi_phi_array(result_data, num_bytes, psi_images, phi_images, zeroed_times, debug); } // ------------------------------------------- @@ -354,55 +354,55 @@ void fill_search_data_from_image_stack(SearchData& result_data, ImageStack& stac // ------------------------------------------- #ifdef Py_PYTHON_H -static void search_data_binding(py::module& m) { - using ppa = search::SearchData; +static void psi_phi_array_binding(py::module& m) { + using ppa = search::PsiPhiArray; py::class_(m, "PsiPhi", pydocs::DOC_PsiPhi) .def(py::init<>()) .def_readwrite("psi", &search::PsiPhi::psi) .def_readwrite("phi", &search::PsiPhi::phi); - py::class_(m, "SearchData", pydocs::DOC_SearchData) + py::class_(m, "PsiPhiArray", pydocs::DOC_PsiPhiArray) .def(py::init<>()) - .def_property_readonly("num_bytes", &ppa::get_num_bytes, pydocs::DOC_SearchData_get_num_bytes) - .def_property_readonly("num_times", &ppa::get_num_times, pydocs::DOC_SearchData_get_num_times) - .def_property_readonly("width", &ppa::get_width, pydocs::DOC_SearchData_get_width) - .def_property_readonly("height", &ppa::get_height, pydocs::DOC_SearchData_get_height) + .def_property_readonly("num_bytes", &ppa::get_num_bytes, pydocs::DOC_PsiPhiArray_get_num_bytes) + .def_property_readonly("num_times", &ppa::get_num_times, pydocs::DOC_PsiPhiArray_get_num_times) + .def_property_readonly("width", &ppa::get_width, pydocs::DOC_PsiPhiArray_get_width) + .def_property_readonly("height", &ppa::get_height, pydocs::DOC_PsiPhiArray_get_height) .def_property_readonly("pixels_per_image", &ppa::get_pixels_per_image, - pydocs::DOC_SearchData_get_pixels_per_image) + pydocs::DOC_PsiPhiArray_get_pixels_per_image) .def_property_readonly("num_entries", &ppa::get_num_entries, - pydocs::DOC_SearchData_get_num_entries) + pydocs::DOC_PsiPhiArray_get_num_entries) .def_property_readonly("total_array_size", 
&ppa::get_total_array_size, - pydocs::DOC_SearchData_get_total_array_size) - .def_property_readonly("block_size", &ppa::get_block_size, pydocs::DOC_SearchData_get_block_size) + pydocs::DOC_PsiPhiArray_get_total_array_size) + .def_property_readonly("block_size", &ppa::get_block_size, pydocs::DOC_PsiPhiArray_get_block_size) .def_property_readonly("psi_min_val", &ppa::get_psi_min_val, - pydocs::DOC_SearchData_get_psi_min_val) + pydocs::DOC_PsiPhiArray_get_psi_min_val) .def_property_readonly("psi_max_val", &ppa::get_psi_max_val, - pydocs::DOC_SearchData_get_psi_max_val) - .def_property_readonly("psi_scale", &ppa::get_psi_scale, pydocs::DOC_SearchData_get_psi_scale) + pydocs::DOC_PsiPhiArray_get_psi_max_val) + .def_property_readonly("psi_scale", &ppa::get_psi_scale, pydocs::DOC_PsiPhiArray_get_psi_scale) .def_property_readonly("phi_min_val", &ppa::get_phi_min_val, - pydocs::DOC_SearchData_get_phi_min_val) + pydocs::DOC_PsiPhiArray_get_phi_min_val) .def_property_readonly("phi_max_val", &ppa::get_phi_max_val, - pydocs::DOC_SearchData_get_phi_max_val) - .def_property_readonly("phi_scale", &ppa::get_phi_scale, pydocs::DOC_SearchData_get_phi_scale) + pydocs::DOC_PsiPhiArray_get_phi_max_val) + .def_property_readonly("phi_scale", &ppa::get_phi_scale, pydocs::DOC_PsiPhiArray_get_phi_scale) .def_property_readonly("cpu_array_allocated", &ppa::cpu_array_allocated, - pydocs::DOC_SearchData_get_cpu_array_allocated) + pydocs::DOC_PsiPhiArray_get_cpu_array_allocated) .def_property_readonly("gpu_array_allocated", &ppa::gpu_array_allocated, - pydocs::DOC_SearchData_get_gpu_array_allocated) + pydocs::DOC_PsiPhiArray_get_gpu_array_allocated) .def_property_readonly("cpu_time_array_allocated", &ppa::cpu_time_array_allocated, - pydocs::DOC_SearchData_get_cpu_time_array_allocated) + pydocs::DOC_PsiPhiArray_get_cpu_time_array_allocated) .def_property_readonly("gpu_time_array_allocated", &ppa::gpu_time_array_allocated, - pydocs::DOC_SearchData_get_gpu_time_array_allocated) - 
.def("set_meta_data", &ppa::set_meta_data, pydocs::DOC_SearchData_set_meta_data) - .def("clear", &ppa::clear, pydocs::DOC_SearchData_clear) - .def("read_psi_phi", &ppa::read_psi_phi, pydocs::DOC_SearchData_read_psi_phi) - .def("read_time", &ppa::read_time, pydocs::DOC_SearchData_read_time); + pydocs::DOC_PsiPhiArray_get_gpu_time_array_allocated) + .def("set_meta_data", &ppa::set_meta_data, pydocs::DOC_PsiPhiArray_set_meta_data) + .def("clear", &ppa::clear, pydocs::DOC_PsiPhiArray_clear) + .def("read_psi_phi", &ppa::read_psi_phi, pydocs::DOC_PsiPhiArray_read_psi_phi) + .def("read_time", &ppa::read_time, pydocs::DOC_PsiPhiArray_read_time); m.def("compute_scale_params_from_image_vect", &search::compute_scale_params_from_image_vect); m.def("decode_uint_scalar", &search::decode_uint_scalar); m.def("encode_uint_scalar", &search::encode_uint_scalar); - m.def("fill_search_data", &search::fill_search_data, pydocs::DOC_SearchData_fill_search_data); - m.def("fill_search_data_from_image_stack", &search::fill_search_data_from_image_stack, - pydocs::DOC_SearchData_fill_search_data_from_image_stack); + m.def("fill_psi_phi_array", &search::fill_psi_phi_array, pydocs::DOC_PsiPhiArray_fill_psi_phi_array); + m.def("fill_psi_phi_array_from_image_stack", &search::fill_psi_phi_array_from_image_stack, + pydocs::DOC_PsiPhiArray_fill_psi_phi_array_from_image_stack); } #endif From 089778242689439f88c59155c98082f91837c192 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 16:24:43 -0500 Subject: [PATCH 14/27] Rename file --- .../search/pydocs/{search_data_docs.h => psi_phi_array_docs.h} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename src/kbmod/search/pydocs/{search_data_docs.h => psi_phi_array_docs.h} (100%) diff --git a/src/kbmod/search/pydocs/search_data_docs.h b/src/kbmod/search/pydocs/psi_phi_array_docs.h similarity index 100% rename from src/kbmod/search/pydocs/search_data_docs.h rename to 
src/kbmod/search/pydocs/psi_phi_array_docs.h From f0062d9adc89b85e20c6204cf16d0527ebc7e402 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 16:27:14 -0500 Subject: [PATCH 15/27] Fix names from bad replace --- src/kbmod/search/kernels.cu | 4 ++-- src/kbmod/search/psi_phi_array.cpp | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/src/kbmod/search/kernels.cu b/src/kbmod/search/kernels.cu index c400c4380..50c497754 100644 --- a/src/kbmod/search/kernels.cu +++ b/src/kbmod/search/kernels.cu @@ -23,7 +23,7 @@ namespace search { -extern "C" void device_allocate_psi_phi_array_arrays(PsiPhiArray *data) { +extern "C" void device_allocate_psi_phi_arrays(PsiPhiArray *data) { if (!data->cpu_array_allocated() || !data->cpu_time_array_allocated()) { throw std::runtime_error("CPU data is not allocated."); } @@ -47,7 +47,7 @@ extern "C" void device_allocate_psi_phi_array_arrays(PsiPhiArray *data) { data->set_gpu_time_array_ptr(device_times_ptr); } -extern "C" void device_free_psi_phi_array_arrays(PsiPhiArray *data) { +extern "C" void device_free_psi_phi_arrays(PsiPhiArray *data) { if (data->gpu_array_allocated()) { checkCudaErrors(cudaFree(data->get_gpu_array_ptr())); data->set_gpu_array_ptr(nullptr); diff --git a/src/kbmod/search/psi_phi_array.cpp b/src/kbmod/search/psi_phi_array.cpp index 329d7493e..a7bad84e3 100644 --- a/src/kbmod/search/psi_phi_array.cpp +++ b/src/kbmod/search/psi_phi_array.cpp @@ -6,9 +6,9 @@ namespace search { // Declaration of CUDA functions that will be linked in. 
#ifdef HAVE_CUDA -extern "C" void device_allocate_psi_phi_array_arrays(PsiPhiArray* data); +extern "C" void device_allocate_psi_phi_arrays(PsiPhiArray* data); -extern "C" void device_free_psi_phi_array_arrays(PsiPhiArray* data); +extern "C" void device_free_psi_phi_arrays(PsiPhiArray* data); #endif // ------------------------------------------------------- From 5d1d76cd4dce4cffec362f040b6e367987d33cb0 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 16:28:37 -0500 Subject: [PATCH 16/27] Update test_psi_phi_array.py --- tests/test_psi_phi_array.py | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/tests/test_psi_phi_array.py b/tests/test_psi_phi_array.py index 0e805dd7c..c261e4edb 100644 --- a/tests/test_psi_phi_array.py +++ b/tests/test_psi_phi_array.py @@ -14,12 +14,12 @@ compute_scale_params_from_image_vect, decode_uint_scalar, encode_uint_scalar, - fill_search_data, - fill_search_data_from_image_stack, + fill_psi_phi_array, + fill_psi_phi_array_from_image_stack, ) -class test_search_data(unittest.TestCase): +class test_psi_phi_array(unittest.TestCase): def setUp(self): self.num_times = 2 self.width = 4 @@ -128,10 +128,10 @@ def test_compute_scale_params_from_image_vect(self): self.assertAlmostEqual(result_uint16[1], max_val, delta=1e-5) self.assertAlmostEqual(result_uint16[2], max_val / 65535.0, delta=1e-5) - def test_fill_search_data(self): + def test_fill_psi_phi_array(self): for num_bytes in [2, 4]: arr = PsiPhiArray() - fill_search_data( + fill_psi_phi_array( arr, num_bytes, [self.psi_1, self.psi_2], [self.phi_1, self.phi_2], self.zeroed_times, False ) @@ -173,7 +173,7 @@ def test_fill_search_data(self): self.assertFalse(arr.gpu_array_allocated) self.assertFalse(arr.gpu_time_array_allocated) - def test_fill_search_data_from_image_stack(self): + def test_fill_psi_phi_array_from_image_stack(self): # Build a fake image stack. 
num_times = 5 width = 21 @@ -193,7 +193,7 @@ def test_fill_search_data_from_image_stack(self): # Create the PsiPhiArray from the ImageStack. arr = PsiPhiArray() - fill_search_data_from_image_stack(arr, im_stack, 4, False) + fill_psi_phi_array_from_image_stack(arr, im_stack, 4, False) # Check the meta data. self.assertEqual(arr.num_times, num_times) From 17105527ffb9462af17c2b4c76b9e6d48f884b2b Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 16:31:04 -0500 Subject: [PATCH 17/27] Update psi_phi_array.cpp --- src/kbmod/search/psi_phi_array.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/kbmod/search/psi_phi_array.cpp b/src/kbmod/search/psi_phi_array.cpp index a7bad84e3..e0640e9da 100644 --- a/src/kbmod/search/psi_phi_array.cpp +++ b/src/kbmod/search/psi_phi_array.cpp @@ -31,7 +31,7 @@ void PsiPhiArray::clear() { } #ifdef HAVE_CUDA if ((gpu_array_ptr != nullptr) || (gpu_time_array != nullptr)) { - device_free_psi_phi_array_arrays(this); + device_free_psi_phi_arrays(this); gpu_array_ptr = nullptr; gpu_time_array = nullptr; } @@ -313,7 +313,7 @@ void fill_psi_phi_array(PsiPhiArray& result_data, int num_bytes, const std::vect printf("Allocating GPU memory for times array using %lu bytes.\n", times_bytes); } - device_allocate_psi_phi_array_arrays(&result_data); + device_allocate_psi_phi_arrays(&result_data); if (result_data.get_gpu_array_ptr() == nullptr) { throw std::runtime_error("Unable to allocate GPU PsiPhi array."); } From 0119b7c347715e769bc9051dc5f7a96cb484fc85 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Fri, 2 Feb 2024 16:56:30 -0500 Subject: [PATCH 18/27] Fix precision error --- src/kbmod/search/image_stack.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/kbmod/search/image_stack.cpp b/src/kbmod/search/image_stack.cpp index cf4244a19..0ba33319c 100644 --- 
a/src/kbmod/search/image_stack.cpp +++ b/src/kbmod/search/image_stack.cpp @@ -47,7 +47,7 @@ float ImageStack::get_zeroed_time(int index) const { std::vector ImageStack::build_zeroed_times() const { std::vector zeroed_times = std::vector(); if (images.size() > 0) { - float t0 = images[0].get_obstime(); + double t0 = images[0].get_obstime(); for (auto& i : images) { zeroed_times.push_back(i.get_obstime() - t0); } From 328e021bd13845e9990b73d91d4fc99c0ecf4f27 Mon Sep 17 00:00:00 2001 From: DinoBektesevic Date: Sun, 4 Feb 2024 00:48:38 -0800 Subject: [PATCH 19/27] Python<3.9 does not support OR operator for dictionaries, skip test. --- tests/test_std_config.py | 14 +++++++++++++- 1 file changed, 13 insertions(+), 1 deletion(-) diff --git a/tests/test_std_config.py b/tests/test_std_config.py index 5df4e946a..0110e657c 100644 --- a/tests/test_std_config.py +++ b/tests/test_std_config.py @@ -1,3 +1,5 @@ +import sys + import unittest from kbmod import StandardizerConfig @@ -27,7 +29,6 @@ def test_config(self): conf["a"] = 10 self.assertEqual(conf["a"], 10) - self.assertEqual(conf2 | conf, expected) self.assertEqual(list(iter(conf)), ["a", "b", "c"]) # Test .update method @@ -45,3 +46,14 @@ def test_config(self): with self.assertRaises(TypeError): conf2.update([1, 2, 3]) + + @unittest.skipIf(sys.version_info < (3, 9), "py<3.9 does not support or for dicts.") + def test_or(self): + expected = {"a": 1, "b": 2, "c": 3} + conf = StandardizerConfig(expected) + conf2 = StandardizerConfig(a=1, b=2, c=3) + self.assertEqual(conf2 | conf, expected) + + +if __name__ == "__main__": + unittest.main() From b349e5dd34d2af4d79213e6792a1c7fa5c9fd99a Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Tue, 6 Feb 2024 12:02:41 -0500 Subject: [PATCH 20/27] Clean up StackSearch --- src/kbmod/search/pydocs/stack_search_docs.h | 4 --- src/kbmod/search/stack_search.cpp | 27 ++++++--------------- src/kbmod/search/stack_search.h | 9 ++----- 3 files 
changed, 10 insertions(+), 30 deletions(-) diff --git a/src/kbmod/search/pydocs/stack_search_docs.h b/src/kbmod/search/pydocs/stack_search_docs.h index f52e2aece..8e2c5bd00 100644 --- a/src/kbmod/search/pydocs/stack_search_docs.h +++ b/src/kbmod/search/pydocs/stack_search_docs.h @@ -59,10 +59,6 @@ static const auto DOC_StackSearch_set_debug = R"doc( Set to ``True`` to turn on debug output and ``False`` to turn it off. )doc"; -static const auto DOC_StackSearch_filter_min_obs = R"doc( - todo - )doc"; - static const auto DOC_StackSearch_get_num_images = R"doc( "Returns the number of images to process. ")doc"; diff --git a/src/kbmod/search/stack_search.cpp b/src/kbmod/search/stack_search.cpp index cf06968a6..b75030ae2 100644 --- a/src/kbmod/search/stack_search.cpp +++ b/src/kbmod/search/stack_search.cpp @@ -68,7 +68,8 @@ void StackSearch::set_start_bounds_y(int y_min, int y_max) { void StackSearch::search(int ang_steps, int vel_steps, float min_ang, float max_ang, float min_vel, float mavx, int min_observations) { DebugTimer core_timer = DebugTimer("Running core search", debug_info); - create_search_list(ang_steps, vel_steps, min_ang, max_ang, min_vel, mavx); + std::vector search_list = + create_grid_search_list(ang_steps, vel_steps, min_ang, max_ang, min_vel, mavx); // Create a data stucture for the per-image data. 
std::vector image_times = stack.build_zeroed_times(); @@ -132,8 +133,9 @@ void StackSearch::prepare_psi_phi() { } } -void StackSearch::create_search_list(int angle_steps, int velocity_steps, float min_ang, float max_ang, - float min_vel, float mavx) { +std::vector StackSearch::create_grid_search_list(int angle_steps, int velocity_steps, + float min_ang, float max_ang, float min_vel, + float mavx) { DebugTimer timer = DebugTimer("Creating search candidate list", debug_info); std::vector angles(angle_steps); @@ -149,7 +151,7 @@ void StackSearch::create_search_list(int angle_steps, int velocity_steps, float } int trajCount = angle_steps * velocity_steps; - search_list = std::vector(trajCount); + std::vector search_list = std::vector(trajCount); for (int a = 0; a < angle_steps; ++a) { for (int v = 0; v < velocity_steps; ++v) { search_list[a * velocity_steps + v].vx = cos(angles[a]) * velocities[v]; @@ -157,6 +159,8 @@ void StackSearch::create_search_list(int angle_steps, int velocity_steps, float } } timer.stop(); + + return search_list; } std::vector StackSearch::create_curves(Trajectory t, const std::vector& imgs) { @@ -214,20 +218,6 @@ void StackSearch::sort_results() { [](Trajectory a, Trajectory b) { return b.lh < a.lh; }); } -void StackSearch::filter_results(int min_observations) { - results.erase(std::remove_if(results.begin(), results.end(), - std::bind([](Trajectory t, int cutoff) { return t.obs_count < cutoff; }, - std::placeholders::_1, min_observations)), - results.end()); -} - -void StackSearch::filter_results_lh(float min_lh) { - results.erase(std::remove_if(results.begin(), results.end(), - std::bind([](Trajectory t, float cutoff) { return t.lh < cutoff; }, - std::placeholders::_1, min_lh)), - results.end()); -} - std::vector StackSearch::get_results(int start, int count) { if (start + count >= results.size()) { count = results.size() - start; @@ -256,7 +246,6 @@ static void stack_search_bindings(py::module& m) { .def("set_start_bounds_x", 
&ks::set_start_bounds_x, pydocs::DOC_StackSearch_set_start_bounds_x) .def("set_start_bounds_y", &ks::set_start_bounds_y, pydocs::DOC_StackSearch_set_start_bounds_y) .def("set_debug", &ks::set_debug, pydocs::DOC_StackSearch_set_debug) - .def("filter_min_obs", &ks::filter_results, pydocs::DOC_StackSearch_filter_min_obs) .def("get_num_images", &ks::num_images, pydocs::DOC_StackSearch_get_num_images) .def("get_image_width", &ks::get_image_width, pydocs::DOC_StackSearch_get_image_width) .def("get_image_height", &ks::get_image_height, pydocs::DOC_StackSearch_get_image_height) diff --git a/src/kbmod/search/stack_search.h b/src/kbmod/search/stack_search.h index 48f3386d9..72d971dd4 100644 --- a/src/kbmod/search/stack_search.h +++ b/src/kbmod/search/stack_search.h @@ -50,10 +50,6 @@ class StackSearch { // Gets the vector of result trajectories. std::vector get_results(int start, int end); - // Filters the results based on various parameters. - void filter_results(int min_observations); - void filter_results_lh(float min_lh); - // Getters for the Psi and Phi data. std::vector get_psi_curves(Trajectory& t); std::vector get_phi_curves(Trajectory& t); @@ -71,13 +67,12 @@ class StackSearch { std::vector create_curves(Trajectory t, const std::vector& imgs); // Creates list of trajectories to search. 
- void create_search_list(int angle_steps, int velocity_steps, float min_ang, float max_ang, float min_vel, - float max_vel); + std::vector create_grid_search_list(int angle_steps, int velocity_steps, float min_ang, + float max_ang, float min_vel, float mavx); bool psi_phi_generated; bool debug_info; ImageStack stack; - std::vector search_list; std::vector psi_images; std::vector phi_images; std::vector results; From 4ed4643318e572713492f823309c6679019985c8 Mon Sep 17 00:00:00 2001 From: Colin Orion Chandler Date: Tue, 6 Feb 2024 20:29:21 -0800 Subject: [PATCH 21/27] New Notebooks and updated Region Search Notebook (#455) * Plot correction, clarifying text disable gridlines for the sky plotting * Create Region Searching Workbook.ipynb This contains the essence of Region Search for now. * Creating a structure for scratch notebooks Brainstorming, demos, and testing to share. * Update RegionSearchTesting.ipynb black --target-version py38 --line-length 110 is what works, but only if black was installed with [jupyter] * Update Region Searching Workbook.ipynb Consolidation into a single Pandas dataframe, Notebook cleanup, master function in preparation for a demo, TODO items added/updated, and a Next Steps added to the end. 
--- .../Region Searching Workbook.ipynb | 2938 +++++++++++++++++ .../coc/RegionSearchTesting.ipynb | 973 ++++++ notebooks/region_search/sky_patches.ipynb | 7 +- 3 files changed, 3915 insertions(+), 3 deletions(-) create mode 100644 notebooks/region_search/Region Searching Workbook.ipynb create mode 100644 notebooks/region_search/coc/RegionSearchTesting.ipynb diff --git a/notebooks/region_search/Region Searching Workbook.ipynb b/notebooks/region_search/Region Searching Workbook.ipynb new file mode 100644 index 000000000..5d7e6da65 --- /dev/null +++ b/notebooks/region_search/Region Searching Workbook.ipynb @@ -0,0 +1,2938 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "d94d8d2b", + "metadata": {}, + "source": [ + "# Butler Interface for User\n", + "\n", + "The point of this notebook is to do step-by-step exploration of the DEEP dataset that was first run through KBMOD for the first set of papers. That work was led by Hayden Smotherman, hence the reference to that name.\n", + "\n", + "The \"Steven\" name that appears is Steven Stetzler, who inherited the responsibilities of properly re/processing the entire DEEP dataset through data acquired through 2023.\n", + "\n", + "### Basic Idea\n", + "Here we are connecting to an existing Butler/repository with the intent of carrying out queries to find data suitable for KBMOD to use.\n", + "\n", + "#### FAQ\n", + "\n", + "Q: Who wrote this, and when?\\\n", + "A: Colin Orion Chandler (coc123@uw.edu), late January 2024.\n", + "\n", + "Q: What are the basic requirements to run this?\\\n", + "A: (a) Epyc access, (b) with the appropriate (LSST w_2022_06) weekly build active, (c) permissions to access the repo_path mentioned below, and (d) an acceptable Kernel in the Jupyter-Hub of Epyc (user or global).\n", + "\n", + "Q: Why don't we just query the DB (e.g., PostGres, SQLite) to get what we need?\\\n", + "A: Because (a) the underlying schema can (and has/does) change, and (b) the underlying DB does not contain views, 
meaning that we would have to recreate the very complex relational mapping ourselves. Moreover, aside from (b) being very challenging, the relationship mapping recreation would fail due to the reasons mentioned in (a)." + ] + }, + { + "cell_type": "markdown", + "id": "9ea4ebd7", + "metadata": {}, + "source": [ + "### Initial Setup" + ] + }, + { + "cell_type": "code", + "execution_count": 339, + "id": "d0189084", + "metadata": {}, + "outputs": [], + "source": [ + "# Import packages needed to run the notebook\n", + "import lsst\n", + "import lsst.daf.butler as dafButler\n", + "import os\n", + "import time\n", + "from matplotlib import pyplot as plt\n", + "import progressbar\n", + "from concurrent.futures import ProcessPoolExecutor, as_completed\n", + "from astropy.time import Time # for converting Butler visitInfo.date (TAI) to UTC strings\n", + "from astropy import units as u\n", + "import pandas as pd\n", + "import pickle\n", + "from dateutil import parser" + ] + }, + { + "cell_type": "code", + "execution_count": 476, + "id": "ceeec168", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "96 CPUs were reported as available by the multiprocessing module.\n" + ] + } + ], + "source": [ + "# We will use some kind of multiprocessing in a few places. Let's see what the system thinks we have available.\n", + "# NOTE: we could set limits on executors later using this value, if desired. 
2/6/2024 COC\n", + "\n", + "import multiprocessing\n", + "\n", + "available_cpus = multiprocessing.cpu_count()\n", + "print(f\"{available_cpus} CPUs were reported as available by the multiprocessing module.\")" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "693492d4", + "metadata": {}, + "outputs": [], + "source": [ + "# this code will run in different environments, so we need somewhere (not the working directory) to save output\n", + "basedir = f'{os.environ[\"HOME\"]}/kbmod_tmp'\n", + "os.makedirs(basedir, exist_ok=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "b13eb927", + "metadata": {}, + "outputs": [], + "source": [ + "# set up the Butler\n", + "# NOTE: the repo path contains configs that point us to the underlying registry (DB)\n", + "# NOTE: do NOT assume there is write protection! (i.e., don't make changes)\n", + "repo_path = f\"/epyc/users/smotherh/DEEP/PointingGroups/butler-repo\"\n", + "butler = dafButler.Butler(repo_path)" + ] + }, + { + "cell_type": "markdown", + "id": "85cc47d8", + "metadata": {}, + "source": [ + "#### Collections\n", + "1. Explore the available collections\n", + "2. Construct a list of the collections containing the data we care about.\n", + "\n", + "Different collections hold different datasets.\n", + "\n", + "For the Hayden DEEP repo, the collections we are concerned with are organized by pointing groups (discrete regions on the sky).\n", + "\n", + "We want to figure out what those are, how they are named, and what else is available.\n", + "\n", + "We will also dump a full list of collection names to disk. 
\\\n", + "NOTE: as of 2/1/2024, there are 1,292 named collections in the repo.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 465, + "id": "e6a546f0", + "metadata": {}, + "outputs": [], + "source": [ + "def get_collection_names(butler, basedir, verbose=False, export=True):\n", + " \"\"\"\n", + " Making this a function 2/6/2024 COC.\n", + " \"\"\"\n", + " all_collection_names = []\n", + "\n", + " for c in sorted(butler.registry.queryCollections(\"*\")):\n", + " all_collection_names.append(c)\n", + "\n", + " if export == True:\n", + " outfile = f\"{basedir}/all_collection_names.lst\"\n", + " with open(outfile, \"w\") as f:\n", + " for c in all_collection_names:\n", + " print(c, file=f)\n", + "\n", + " if verbose:\n", + " message = f\"Found {len(all_collection_names)} collections in the Butler.\"\n", + " if export == True:\n", + " message += f' Wrote to \"{outfile}\".'\n", + " print(message)\n", + " return all_collection_names" + ] + }, + { + "cell_type": "code", + "execution_count": 466, + "id": "3006e4fd", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Found 1292 collections in the Butler. Wrote to \"/astro/users/coc123/kbmod_tmp/all_collection_names.lst\".\n" + ] + } + ], + "source": [ + "all_collection_names = get_collection_names(butler=butler, basedir=basedir, verbose=True, export=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 468, + "id": "b409c810", + "metadata": {}, + "outputs": [], + "source": [ + "# We looked through the collections already.\n", + "# We will string manipulate to get to what we need.\n", + "# Previously, we used a list file on disk. 
(This could be a better option for some users.)\n", + "\n", + "\n", + "def get_desired_collections(all_collections_list, desired_collection_list=None):\n", + " \"\"\"\n", + " Produce a list of collections that will be used for querying the Butler.\n", + "\n", + " If desired_collection_list is None, then a hard-wired \"default\" approach\n", + " (for Hayden/DEEP) is carried out, requiring:\n", + " 1. \"Pointing\" must be in the collection name.\n", + " 2. \"/imdiff_r\" must be in the collection name.\n", + " 3. \"/2021\" may not be in the collection name.\n", + "\n", + " Otherwise, desired_collection_list can be either\n", + " 1. a Python list of desired collection names, or\n", + " 2. a filename (ending in .lst) that specifies the desired collections.\n", + " Either way, the collection names are verified against the (required) all_collections_list.\n", + "\n", + " Made this into a function 2/6/2024 COC.\n", + "\n", + " NOTE/TODO: untested are the supplied list and list file approaches.\n", + " \"\"\"\n", + "\n", + " desired_collections = []\n", + "\n", + " if desired_collection_list == None:\n", + " for collection_name in all_collection_names:\n", + " if (\n", + " \"Pointing\" in collection_name\n", + " and \"/imdiff_r\" in collection_name\n", + " and \"/2021\" not in collection_name\n", + " ):\n", + " desired_collections.append(collection_name)\n", + " else:\n", + " if type(desired_collection_list) == type(\"\"):\n", + " with open(desired_collection_list, \"r\") as f:\n", + " for line in f:\n", + " desired_collections.append(line.strip())\n", + " else:\n", + " for entry in desired_collection_list:\n", + " desired_collections.append(entry)\n", + " #\n", + " # Validate entries\n", + " for entry in desired_collections:\n", + " if entry not in all_collections_list:\n", + " raise KeyError(f'\"{entry}\" is not in the master list of collections supplied.')\n", + " #\n", + " return desired_collections" + ] + }, + { + "cell_type": "code", + "execution_count": 473, + "id": 
"dc9a4efc", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['PointingGroup006/imdiff_r',\n", + " 'PointingGroup008/imdiff_r',\n", + " 'PointingGroup009/imdiff_r',\n", + " 'PointingGroup016/imdiff_r',\n", + " 'PointingGroup018/imdiff_r',\n", + " 'PointingGroup019/imdiff_r',\n", + " 'PointingGroup021/imdiff_r',\n", + " 'PointingGroup023/imdiff_r']" + ] + }, + "execution_count": 473, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "desired_collections = get_desired_collections(all_collections_list=all_collection_names)\n", + "desired_collections" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "4537e06a", + "metadata": {}, + "outputs": [], + "source": [ + "# ASIDE: there is a set of collections with dates in their names\n", + "# (e.g., PointingGroup006/imdiff_r/20211110T184421Z).\n", + "# Those (only?) have the following datasetTypes, (so we use the name without the date for all the datasetTypes):\n", + "# Across all collections, we see the following numbers by datasetType:\n", + "# 47383 deepDiff_diaSrc\n", + "# 8 deepDiff_diaSrc_schema\n", + "# 47383 deepDiff_differenceExp\n", + "# 29445 deepDiff_warpedExp\n", + "# 8 imageDifference_config\n", + "# 17942 imageDifference_log\n", + "# 47383 imageDifference_metadata\n", + "# 8 packages\n", + "\n", + "# which is too little? 
we will snag the parent Collections (stripping dates)" + ] + }, + { + "cell_type": "markdown", + "id": "2fcdae7b", + "metadata": {}, + "source": [ + "#### datasetTypes\n", + "\n", + "Here we explore another dimension of the Butler: datasetType.\n", + "\n", + "tldr; we just care about one currently: deepDiff_differenceExp" + ] + }, + { + "cell_type": "code", + "execution_count": 169, + "id": "47c8c37c", + "metadata": {}, + "outputs": [], + "source": [ + "# TIMING NOTE: about 2 minutes here\n", + "#\n", + "# Maybe a KBMOD user must know which datasetType(s) they need?\n", + "# Here we show how to explore them to figure that out.\n", + "#\n", + "# NOTE: we tested two approaches,\n", + "# (a) iterating over desired_collections, and\n", + "# (b) supply desired_collections.\n", + "# The output was the same, but the iterating method took 268s, and the supplied method took 97s.\n", + "# There *was* a point where we thought we were seeing different results depending on the approach,\n", + "# but this has been sorted out. (COC suspects a testing break in a loop somewhere.)\n", + "# COC NTS: [TODO] function, [TODO] caching\n", + "\n", + "\n", + "def getDatasetTypeStats(butler, overwrite=False):\n", + " \"\"\"\n", + " Get information on all datasetTypes found in a Butler.\n", + " TODO implement caching if desired. 
If not, get rid of overwrite option.\n", + " 2/1/2024 COC\n", + " \"\"\"\n", + " datasetTypes = {}\n", + "\n", + " import glob\n", + "\n", + " cache_file = f\"{basedir}/dataset_types.csv\"\n", + " cache_exists = False\n", + " if len(glob.glob(cache_file)) > 0:\n", + " cache_exists = True\n", + "\n", + " if overwrite == False and cache_exists == True:\n", + " print(f\"Recycling {cache_file} as overwrite was False...\")\n", + " with open(cache_file, \"r\") as f:\n", + " for line in f:\n", + " print(line)\n", + " line = line.strip().split(\",\")\n", + " datasetTypes[line[0]] = int(line[1])\n", + " print(f\"Read {len(datasetTypes)} datasetTypes from disk.\")\n", + " return datasetTypes\n", + "\n", + " q = sorted(butler.registry.queryDatasetTypes())\n", + "\n", + " with progressbar.ProgressBar(max_value=len(q)) as bar:\n", + " for j, dt in enumerate(q):\n", + " n = 0\n", + " for i, ref in enumerate(\n", + " butler.registry.queryDatasets(datasetType=dt, collections=desired_collections)\n", + " ):\n", + " n += 1\n", + " if n > 0:\n", + " if dt.name not in datasetTypes:\n", + " datasetTypes[dt.name] = 0\n", + " datasetTypes[dt.name] += n\n", + " bar.update(j)\n", + "\n", + " if cache_exists == False or overwrite == True:\n", + " print(f\"Saving {len(datasetTypes)} datasetTypes to {cache_file} now...\")\n", + " with open(cache_file, \"w\") as f:\n", + " for key in datasetTypes:\n", + " print(f\"{key},{datasetTypes[key]}\", file=f)\n", + " else:\n", + " print(f\"Saw {len(datasetTypes)} datasetTypes.\")\n", + " return datasetTypes" + ] + }, + { + "cell_type": "code", + "execution_count": 170, + "id": "b741015f", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "100% (129 of 129) |######################| Elapsed Time: 0:02:28 Time: 0:02:28\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Saving 46 datasetTypes to /astro/users/coc123/kbmod_tmp/dataset_types.csv now...\n", + "CPU times: user 1min 57s, 
sys: 2.96 s, total: 2min\n", + "Wall time: 2min 28s\n" + ] + } + ], + "source": [ + "%%time\n", + "# TIMING NOTE: this takes roughly 2.5 minutes without cache (2/6/2024 COC)\n", + "datasetTypes = getDatasetTypeStats(butler=butler, overwrite=False)" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "6406f04c", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Across all collections, we see the following numbers by datasetType: \n", + "8 assembleCoadd_config\n", + "268 assembleCoadd_log\n", + "700 assembleCoadd_metadata\n", + "122856 cal_ref_cat\n", + "47403 calexp\n", + "47403 calexpBackground\n", + "8 calibrate_config\n", + "17961 calibrate_log\n", + "47403 calibrate_metadata\n", + "8 characterizeImage_config\n", + "18290 characterizeImage_log\n", + "47423 characterizeImage_metadata\n", + "693 deepCoadd\n", + "167085 deepCoadd_directWarp\n", + "693 deepCoadd_inputMap\n", + "167085 deepCoadd_psfMatchedWarp\n", + "47383 deepDiff_diaSrc\n", + "8 deepDiff_diaSrc_schema\n", + "47383 deepDiff_differenceExp\n", + "29445 deepDiff_warpedExp\n", + "524283 gaia_DR1_v1\n", + "47423 icExp\n", + "47423 icExpBackground\n", + "47423 icSrc\n", + "8 icSrc_schema\n", + "8 imageDifference_config\n", + "17942 imageDifference_log\n", + "47383 imageDifference_metadata\n", + "8 isr_config\n", + "18290 isr_log\n", + "48422 isr_metadata\n", + "8 makeWarp_config\n", + "64924 makeWarp_log\n", + "167085 makeWarp_metadata\n", + "48422 overscanRaw\n", + "8 overscan_config\n", + "18290 overscan_log\n", + "48422 overscan_metadata\n", + "32 packages\n", + "48422 postISRCCD\n", + "130924 ps1_pv3_3pi_20170110\n", + "48422 raw\n", + "1 skyMap\n", + "47403 src\n", + "47403 srcMatch\n", + "8 src_schema\n" + ] + } + ], + "source": [ + "# The number of records for each datasetType.\n", + "# This may be especially useful for users who do not yet know which datasetType(s) they need.\n", + "\n", + "print(f\"Across all collections, we see the 
following numbers by datasetType: \")\n", + "for dt in datasetTypes:\n", + " print(f\"{datasetTypes[dt]!s:10} {dt.name}\")" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "53a03c75", + "metadata": {}, + "outputs": [], + "source": [ + "# This is the datasetType that we care about.\n", + "# NOTE: we should allow this to be a list in case a user needs multiple.\n", + "desired_datasetTypes = [\"deepDiff_differenceExp\"]" + ] + }, + { + "cell_type": "markdown", + "id": "3c351fc7", + "metadata": {}, + "source": [ + "### Visit Detector Region (VDR) Querying\n", + "\n", + "Here we will query the Butler and extract all of the \"visit_detector_region\" information.\\\n", + "At this stage we are gathering:\n", + "1. dataIds for all future queries\n", + "2. lsst.sphgeom.region objects" + ] + }, + { + "cell_type": "code", + "execution_count": 608, + "id": "c47e5588", + "metadata": {}, + "outputs": [], + "source": [ + "def get_vdr_data(butler, desired_collections, desired_datasetTypes):\n", + " \"\"\"\n", + "\n", + " Made as function 2/6/2024 COC.\n", + " \"\"\"\n", + " # VDR === Visit Detector Region\n", + " # VDRs hold what we need in terms of region hashes and unique dataIds.\n", + " # NOTE: this typically takes < 5s to run 2/1/2024 COC\n", + " # NOTE: tried iterating over desired_collections vs supplying desired_collections; same output 2/1/2024 COC\n", + "\n", + " vdr_dict = {\"data_id\": [], \"region\": [], \"detector\": []}\n", + " # vdr_ids = []\n", + " # vdr_regions = []\n", + " # vdr_detectors = []\n", + "\n", + " for dt in desired_datasetTypes:\n", + " datasetRefs = butler.registry.queryDimensionRecords(\n", + " \"visit_detector_region\", datasets=dt, collections=desired_collections\n", + " )\n", + " for ref in datasetRefs:\n", + " vdr_dict[\"data_id\"].append(ref.dataId)\n", + " vdr_dict[\"region\"].append(\n", + " ref.region\n", + " ) # keeping as objects for now; should .encode() for caching/export\n", + " 
vdr_dict[\"detector\"].append(ref.detector) # 2/2/2024 COC\n", + " # BUT if we decided to export this or cache this, we should write the encode() version to disk\n", + " #\n", + " example_vdr_ref = ref # this leaves a VDR Python object we can play with\n", + " # other data available:\n", + " # id = ref.id# id -- e.g., 1592350 (for DEEP dataset, I think UUIDs for newer Butlers)\n", + " # visit = ref.dataId.full['visit'] # e.g., 946725\n", + " # vdr_filters.append(ref.dataId.full['band']) # e.g., VR\n", + " # vdr_detectors.append(ref.dataId.full['detector']) # e.g., 1\n", + " df = pd.DataFrame.from_dict(vdr_dict)\n", + " return df, example_vdr_ref" + ] + }, + { + "cell_type": "code", + "execution_count": 611, + "id": "eb222e02", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 1.82 s, sys: 83.2 ms, total: 1.91 s\n", + "Wall time: 2.4 s\n" + ] + } + ], + "source": [ + "%%time\n", + "# TIMING NOTE: requires about 2 seconds 2/6/2024 COC\n", + "df, example_vdr_ref = get_vdr_data(\n", + " butler=butler, desired_collections=desired_collections, desired_datasetTypes=desired_datasetTypes\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 612, + "id": "6e9462e1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
data_idregiondetector
0(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9847372525065534...1
1(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9847381014554984...1
2(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9847383417970056...1
3(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9847382159041213...1
4(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9847381374341414...1
............
47378(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.987608537646486,...62
47379(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9876085083003562...62
47380(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9876085761885252...62
47381(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9876085761885252...62
47382(instrument, detector, visit)ConvexPolygon([UnitVector3d(0.9876086828694174...62
\n", + "

47383 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " data_id \n", + "0 (instrument, detector, visit) \\\n", + "1 (instrument, detector, visit) \n", + "2 (instrument, detector, visit) \n", + "3 (instrument, detector, visit) \n", + "4 (instrument, detector, visit) \n", + "... ... \n", + "47378 (instrument, detector, visit) \n", + "47379 (instrument, detector, visit) \n", + "47380 (instrument, detector, visit) \n", + "47381 (instrument, detector, visit) \n", + "47382 (instrument, detector, visit) \n", + "\n", + " region detector \n", + "0 ConvexPolygon([UnitVector3d(0.9847372525065534... 1 \n", + "1 ConvexPolygon([UnitVector3d(0.9847381014554984... 1 \n", + "2 ConvexPolygon([UnitVector3d(0.9847383417970056... 1 \n", + "3 ConvexPolygon([UnitVector3d(0.9847382159041213... 1 \n", + "4 ConvexPolygon([UnitVector3d(0.9847381374341414... 1 \n", + "... ... ... \n", + "47378 ConvexPolygon([UnitVector3d(0.987608537646486,... 62 \n", + "47379 ConvexPolygon([UnitVector3d(0.9876085083003562... 62 \n", + "47380 ConvexPolygon([UnitVector3d(0.9876085761885252... 62 \n", + "47381 ConvexPolygon([UnitVector3d(0.9876085761885252... 62 \n", + "47382 ConvexPolygon([UnitVector3d(0.9876086828694174... 62 \n", + "\n", + "[47383 rows x 3 columns]" + ] + }, + "execution_count": 612, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df" + ] + }, + { + "cell_type": "code", + "execution_count": 610, + "id": "e04e2f35", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "We found 47383 regions spanning the 8 desired collections.\n" + ] + } + ], + "source": [ + "print(f\"We found {len(df['data_id'])} regions spanning the {len(desired_collections)} desired collections.\")" + ] + }, + { + "cell_type": "code", + "execution_count": 559, + "id": "08d5b443", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
visit_detector_region:\n",
+       "  instrument: 'DECam'\n",
+       "  detector: 62\n",
+       "  visit: 946176\n",
+       "  region: ConvexPolygon([UnitVector3d(0.9876086828694174, -0.13336028508776862, -0.08272922024438323), UnitVector3d(0.9873378171284917, -0.13332652431396907, -0.08595389916869185), UnitVector3d(0.9881047366097594, -0.12752395595185462, -0.08594573955553172), UnitVector3d(0.9883760335240734, -0.12755303452468866, -0.0827226676235914)])
"
+      ],
+      "text/plain": [
+       "visit_detector_region.RecordClass(instrument='DECam', detector=62, visit=946176, region=ConvexPolygon([UnitVector3d(0.9876086828694174, -0.13336028508776862, -0.08272922024438323), UnitVector3d(0.9873378171284917, -0.13332652431396907, -0.08595389916869185), UnitVector3d(0.9881047366097594, -0.12752395595185462, -0.08594573955553172), UnitVector3d(0.9883760335240734, -0.12755303452468866, -0.0827226676235914)]))"
+      ]
+     },
+     "execution_count": 559,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# For demonstration purposes, example_vdr_ref holds the last \"ref\" seen while iterating in get_vdr_data()\n",
+    "example_vdr_ref"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 560,
+   "id": "e28031c2",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "{instrument: 'DECam', detector: 62, visit: 946176}"
+      ]
+     },
+     "execution_count": 560,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# This is the unique dataId we would need to retrieve this specific image later\n",
+    "example_vdr_ref.dataId"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 561,
+   "id": "761f3610",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "example_vdr_ref.instrument = DECam,     example_vdr_ref.detector = 62,     example_vdr_ref.visit = 946176\n"
+     ]
+    }
+   ],
+   "source": [
+    "# The unique dataId is made up of the following attributes:\n",
+    "print(\n",
+    "    f\"example_vdr_ref.instrument = {example_vdr_ref.instrument}, \\\n",
+    "    example_vdr_ref.detector = {example_vdr_ref.detector}, \\\n",
+    "    example_vdr_ref.visit = {example_vdr_ref.visit}\"\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 562,
+   "id": "5d6b2106",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "b'p\\xddnE\\x86}\\x9a\\xef?\\x0f\\xc3\\x84\\'\\xf3\\x11\\xc1\\xbf\\x80\\x8a_\\xff\\xbd-\\xb5\\xbf\\x04xUzE\\x98\\xef?\\x94\\x15\\xcf\\xf2\\xd7\\x10\\xc1\\xbf\\x9d\\xa9\\xe4!\\x13\\x01\\xb6\\xbf\\x1d_\\x18\\xd3\\x8d\\x9e\\xef?\\x80\\x87\"z\\xb4R\\xc0\\xbff\\x1d\\x9f<\\x8a\\x00\\xb6\\xbf\\xe4Z\\x84\\xc6\\xc6\\xa0\\xef?\\x1f\\x01\\xe5g\\xa8S\\xc0\\xbf\\xba\\xc9\\x14\\x10P-\\xb5\\xbf'"
+      ]
+     },
+     "execution_count": 562,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# This is the region hash we would use for \"region matching\" later\n",
+    "example_vdr_ref.region.encode()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 563,
+   "id": "aa653a8b",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "False"
+      ]
+     },
+     "execution_count": 563,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# We check to see if we can crawl to other data from the dataId (False means no).\n",
+    "example_vdr_ref.dataId.hasRecords()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3f49186c",
+   "metadata": {},
+   "source": [
+    "# Dataframe Assembly\n",
+    "\n",
+    "This used to contain more, but after I moved everything to a dictionary, then a DF, this became less important.\n",
+    "TODO: determine where this section should go, or remove it."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 587,
+   "id": "acda18f4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 323 ms, sys: 68 ms, total: 391 ms\n",
+      "Wall time: 582 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "\n",
+    "# Save the dataframe to a pickle file for easier resuming of the notebook\n",
+    "# Size was < 20 Mb 2/5/2024 COC\n",
+    "# COC Note: this was not that useful, maybe TODO remove\n",
+    "df_filename = f\"{basedir}/region_search_df.pickle\"\n",
+    "df.to_pickle(df_filename)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "bb076b4b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# load the pickle\n",
+    "# df = pd.read_pickle(df_filename)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "5bdaaf00",
+   "metadata": {},
+   "source": [
+    "### Instrument handling\n",
+    "Some Butler queries require the instrument to be specified.\\\n",
+    "For now, we are just supplying the one we care about (KLUDGE).\\\n",
+    "It's a list so we can mix-and-match shift-and-stack across instruments(!).\\\n",
+    "NOTE: we will leave this as a list for future-proofing purposes."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 564,
+   "id": "0228bb4d",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def getInstruments(butler, vdr_ids, first_instrument_only=True):\n",
+    "    \"\"\"Iterate through our records to determine which instrument(s) are involved.\n",
+    "    Return a list of the identified instruments.\n",
+    "    If first_instrument_only is True, stop as soon as we find an instrument.\n",
+    "    \"\"\"\n",
+    "    # KLUDGE: snag the instrument name of the first record we find in a visitInfo query (uses the notebook-level desired_collections).\n",
+    "    instrument_names = []\n",
+    "    for i, dataId in enumerate(vdr_ids):\n",
+    "        visitInfo = butler.get(\"calexp.visitInfo\", dataId=dataId, collections=desired_collections)\n",
+    "        instrument_name = visitInfo.instrumentLabel\n",
+    "        if instrument_name not in instrument_names:\n",
+    "            print(f'Found {instrument_name}. Adding to \"desired_instruments\" now.')\n",
+    "            instrument_names.append(instrument_name)\n",
+    "        if first_instrument_only == True and len(instrument_names) > 0:\n",
+    "            print(\n",
+    "                f\"WARNING: we are not iterating over all rows to find instruments, just taking the first one.\"\n",
+    "            )\n",
+    "            break\n",
+    "    return instrument_names"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 613,
+   "id": "6c3bb244",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Found DECam. Adding to \"desired_instruments\" now.\n",
+      "WARNING: we are not iterating over all rows to find instruments, just taking the first one.\n",
+      "CPU times: user 140 ms, sys: 19 ms, total: 159 ms\n",
+      "Wall time: 199 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "desired_instruments = getInstruments(butler=butler, vdr_ids=df[\"data_id\"])"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "47a434b2",
+   "metadata": {},
+   "source": [
+    "### Butler Retrieval Example\n",
+    "\n",
+    "A quick stop to see how we can grab the full Butler record via a dataId."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 614,
+   "id": "dfc37b54",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 875 ms, sys: 108 ms, total: 983 ms\n",
+      "Wall time: 1.02 s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "# Back to the dataId, we can actually fetch the image from the Butler\n",
+    "# TIMING NOTE: it takes 1 to 2 seconds to do this, so we won't be able to do this at scale\n",
+    "\n",
+    "example_butler_get = butler.get(\n",
+    "    desired_datasetTypes[0], collections=desired_collections, dataId=example_vdr_ref.dataId\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 529,
+   "id": "789f1d42",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "62"
+      ]
+     },
+     "execution_count": 529,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "example_butler_get.detector.getId()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 530,
+   "id": "351e8d03",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'VR'"
+      ]
+     },
+     "execution_count": 530,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "example_butler_get.filterLabel.bandLabel"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 531,
+   "id": "1c1e5431",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       ""
+      ]
+     },
+     "execution_count": 531,
+     "metadata": {},
+     "output_type": "execute_result"
+    },
+    {
+     "data": {
+      "image/png": "",
+      "text/plain": [
+       "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# we can even view the image right here\n", + "plt.imshow(example_butler_get.image.array, cmap=\"gray\")" + ] + }, + { + "cell_type": "code", + "execution_count": 532, + "id": "ba1b7ab6", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "FITS standard SkyWcs:\n", + "Sky Origin: (352.4630539808, -4.8516830845)\n", + "Pixel Origin: (1126.14, 1991.36)\n", + "Pixel Scale: 0.262593 arcsec/pixel" + ] + }, + "execution_count": 532, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# There IS a WCS here, which we did not see in the earlier VDR\n", + "example_butler_get.wcs" + ] + }, + { + "cell_type": "code", + "execution_count": 503, + "id": "4270995e", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Here are all the keywords available from this image:\n", + "NEXTEND\n", + "PROCTYPE\n", + "PRODTYPE\n", + "PIXSCAL1\n", + "PIXSCAL2\n", + "FILENAME\n", + "TELESCOP\n", + "OBSERVAT\n", + "INSTRUME\n", + "EXPREQ\n", + "OBSID\n", + "TIME-OBS\n", + "OPENSHUT\n", + "EXPNUM\n", + "OBJECT\n", + "OBSTYPE\n", + "CAMSHUT\n", + "PROGRAM\n", + "OBSERVER\n", + "PROPOSER\n", + "DTPI\n", + "PROPID\n", + "EXCLUDED\n", + "SEQID\n", + "SEQNUM\n", + "SEQTOT\n", + "AOS\n", + "BCAM\n", + "GUIDER\n", + "SKYSTAT\n", + "FILTER\n", + "INSTANCE\n", + "ERRORS\n", + "TELEQUIN\n", + "TELSTAT\n", + "RA\n", + "DEC\n", + "TELRA\n", + "TELDEC\n", + "HA\n", + "ZD\n", + "AZ\n", + "DOMEAZ\n", + "ZPDELRA\n", + "ZPDELDEC\n", + "TELFOCUS\n", + "VSUB\n", + "GSKYPHOT\n", + "LSKYPHOT\n", + "WINDSPD\n", + "WINDDIR\n", + "PRESSURE\n", + "DIMMSEE\n", + "DIMM2SEE\n", + "MASS2\n", + "ASTIG1\n", + "ASTIG2\n", + "OUTTEMP\n", + "AIRMASS\n", + "GSKYVAR\n", + "GSKYHOT\n", + "LSKYVAR\n", + "LSKYHOT\n", + "LSKYPOW\n", + "MSURTEMP\n", + "MAIRTEMP\n", + "UPTRTEMP\n", + "LWTRTEMP\n", + "PMOSTEMP\n", + "UTN-TEMP\n", + 
"UTS-TEMP\n", + "UTW-TEMP\n", + "UTE-TEMP\n", + "PMN-TEMP\n", + "PMS-TEMP\n", + "PMW-TEMP\n", + "PME-TEMP\n", + "DOMELOW\n", + "DOMEHIGH\n", + "DOMEFLOR\n", + "G-MEANX\n", + "G-MEANY\n", + "DONUTFS4\n", + "DONUTFS3\n", + "DONUTFS2\n", + "DONUTFS1\n", + "G-FLXVAR\n", + "G-MEANXY\n", + "DONUTFN1\n", + "DONUTFN2\n", + "DONUTFN3\n", + "DONUTFN4\n", + "TIME_RECORDED\n", + "G-FEEDBK\n", + "G-CCDNUM\n", + "DOXT\n", + "G-MAXX\n", + "FADZ\n", + "FADY\n", + "FADX\n", + "G-MODE\n", + "FAYT\n", + "DODZ\n", + "DODY\n", + "DODX\n", + "MULTIEXP\n", + "SKYUPDAT\n", + "G-SEEING\n", + "G-TRANSP\n", + "G-MEANY2\n", + "DOYT\n", + "G-LATENC\n", + "LUTVER\n", + "FAXT\n", + "G-MAXY\n", + "G-MEANX2\n", + "SISPIVER\n", + "CONSTVER\n", + "HDRVER\n", + "DTPROPID\n", + "DTCALDAT\n", + "DTSITE\n", + "DTTELESC\n", + "DTACQNAM\n", + "DTINSTRU\n", + "ODATEOBS\n", + "DTNSANAM\n", + "HISTORY\n", + "COMMENT\n", + "ZTENSION\n", + "ZPCOUNT\n", + "ZGCOUNT\n", + "BUNIT\n", + "DETSIZE\n", + "DETSEC\n", + "CCDSEC\n", + "DETSECA\n", + "CCDSECA\n", + "AMPSECA\n", + "DETSECB\n", + "CCDSECB\n", + "AMPSECB\n", + "DETECTOR\n", + "CCDNUM\n", + "DETPOS\n", + "EXTNAME\n", + "GAINA\n", + "RDNOISEA\n", + "SATURATA\n", + "GAINB\n", + "RDNOISEB\n", + "SATURATB\n", + "FPA\n", + "INHERIT\n", + "CCDBIN1\n", + "CCDBIN2\n", + "DHEINF\n", + "DHEFIRM\n", + "SLOT00\n", + "SLOT01\n", + "SLOT02\n", + "SLOT03\n", + "SLOT04\n", + "SLOT05\n", + "LTV2\n", + "LTV1\n", + "VALIDA\n", + "VALIDB\n", + "NDONUTS\n", + "CHECKVER\n", + "ASTRO METADATA FIX MODIFIED\n", + "ASTRO METADATA FIX DATE\n", + "ISR_OSCAN_LEVELA\n", + "ISR_OSCAN_SIGMAA\n", + "OVERSCAN\n", + "ISR_OSCAN_LEVELB\n", + "ISR_OSCAN_SIGMAB\n", + "SKYLEVEL\n", + "SKYSIGMA\n", + "FLATNESS_PP\n", + "FLATNESS_RMS\n", + "FLATNESS_NGRIDS\n", + "FLATNESS_MESHX\n", + "FLATNESS_MESHY\n", + "BGMEAN\n", + "BGVAR\n", + "SFM_ASTROM_OFFSET_MEAN\n", + "SFM_ASTROM_OFFSET_STD\n", + "MAGZERO\n", + "MAGZERO_RMS\n", + "MAGZERO_NOBJ\n", + "COLORTERM1\n", + "COLORTERM2\n", + "COLORTERM3\n" + ] + } 
+ ], + "source": [ + "# We can access all kinds of metadata this way.\n", + "# NOTE: keywords are source data-dependent.\n", + "# NOTE: this linkage works with butler.get() but not necessarily elsewhere.\n", + "meta = example_butler_get.getInfo().getMetadata()\n", + "\n", + "print(f\"Here are all the keywords available from this image:\")\n", + "for k in meta.keys():\n", + " print(k)" + ] + }, + { + "cell_type": "markdown", + "id": "d4f8d811", + "metadata": {}, + "source": [ + "### URI / URL / Path Handling\n", + "Here we grab URIs for the dataIds we need." + ] + }, + { + "cell_type": "code", + "execution_count": 272, + "id": "7bbc916e", + "metadata": {}, + "outputs": [], + "source": [ + "# NOTE: getURIs() does not work as you'd think (i.e., it only handles a single dataId)\n", + "# butler.getURIs(desired_datasetTypes[0], vdr_ids, collections=desired_collections)" + ] + }, + { + "cell_type": "code", + "execution_count": 567, + "id": "e0f8f8f9", + "metadata": {}, + "outputs": [], + "source": [ + "# The single-thead approach (below) requires some 2 hours to execute. 
So instead we will multiprocess.\n", + "# paths = [butler.getURI(desired_datasetTypes[0], dataId=dataId, collections=desired_collections) for dataId in vdr_ids]\n", + "\n", + "\n", + "def chunked_dataIds(dataIds, chunk_size=200):\n", + " \"\"\"Yield successive chunk_size chunks from dataIds.\"\"\"\n", + " for i in range(0, len(dataIds), chunk_size):\n", + " yield dataIds[i : i + chunk_size]\n", + "\n", + "\n", + "def get_uris(dataIds_chunk, repo_path, desired_datasetTypes, desired_collections):\n", + " \"\"\"Fetch URIs for a list of dataIds.\"\"\"\n", + " chunk_uris = []\n", + " butler = dafButler.Butler(repo_path)\n", + " for dataId in dataIds_chunk:\n", + " try:\n", + " uri = butler.getURI(desired_datasetTypes[0], dataId=dataId, collections=desired_collections)\n", + " uri = uri.geturl() # Convert to URL string\n", + " chunk_uris.append(uri)\n", + " except Exception as e:\n", + " print(f\"Failed to retrieve path for dataId {dataId}: {e}\")\n", + " return chunk_uris\n", + "\n", + "\n", + "def getURIs(butler, dataIds, repo_path, desired_datasetTypes, desired_collections, overwrite=False):\n", + " \"\"\"\n", + " Get URIs from a Butler for a set of dataIDs.\n", + " Cache results to disk for future runs.\n", + " TODO: consider exporting as CSV so we can validate URIs against dataIds. 
2/6/2024 COC\n", + " Updated 2/5/2024 COC\n", + " \"\"\"\n", + " paths = []\n", + "\n", + " cache_file = f\"{basedir}/uri_cache.lst\"\n", + " cached_exists = False\n", + " if len(glob.glob(cache_file)) > 0:\n", + " cached_exists = True\n", + "\n", + " if cached_exists == True and overwrite == False:\n", + " with open(cache_file, \"r\") as f:\n", + " for line in f:\n", + " paths.append(line.strip())\n", + " print(f\"Recycled {len(paths)} paths from {cache_file} as overwrite was {overwrite}.\")\n", + " return paths\n", + "\n", + " # Prepare dataId chunks\n", + " dataId_chunks = list(chunked_dataIds(dataIds))\n", + "\n", + " # Execute get_uris in parallel and preserve order\n", + " with ProcessPoolExecutor() as executor:\n", + " # Initialize progress bar\n", + " with progressbar.ProgressBar(max_value=len(dataId_chunks)) as bar:\n", + " # Use map to execute get_uris on each chunk and maintain order\n", + " result_chunks = list(\n", + " executor.map(\n", + " get_uris,\n", + " dataId_chunks,\n", + " [repo_path] * len(dataId_chunks),\n", + " [desired_datasetTypes] * len(dataId_chunks),\n", + " [desired_collections] * len(dataId_chunks),\n", + " )\n", + " )\n", + "\n", + " for i, chunk_uris in enumerate(result_chunks):\n", + " paths.extend(chunk_uris) # Add the retrieved URIs to the main list\n", + " bar.update(i)\n", + "\n", + " with open(cache_file, \"w\") as f:\n", + " for path in paths:\n", + " print(path, file=f)\n", + " print(f\"Wrote {len(paths)} paths to disk for caching purposes.\")\n", + "\n", + " return paths" + ] + }, + { + "cell_type": "code", + "execution_count": 628, + "id": "6dd2ea6a", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Recycled 47383 paths from /astro/users/coc123/kbmod_tmp/uri_cache.lst as overwrite was False.\n", + "CPU times: user 45 ms, sys: 32.1 ms, total: 77.1 ms\n", + "Wall time: 76.7 ms\n" + ] + } + ], + "source": [ + "%%time\n", + "\n", + "# TIMING NOTE: This required 90s uncached 
2/5/2024 COC\n", + "\n", + "df[\"uri\"] = getURIs(\n", + " butler=butler,\n", + " dataIds=df[\"data_id\"],\n", + " repo_path=repo_path,\n", + " desired_datasetTypes=desired_datasetTypes,\n", + " desired_collections=desired_collections,\n", + " overwrite=False,\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 617, + "id": "eae8d366", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'file:///epyc/users/smotherh/DEEP/PointingGroups/butler-repo/PointingGroup021/imdiff_r/20210723T174135Z/deepDiff_differenceExp/20190927/VR/VR_DECam_c0007_6300.0_2600.0/898286/deepDiff_differenceExp_DECam_VR_VR_DECam_c0007_6300_0_2600_0_898286_S29_PointingGroup021_imdiff_r_20210723T174135Z.fits'" + ] + }, + "execution_count": 617, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# example URI\n", + "df[\"uri\"].iloc()[0]" + ] + }, + { + "cell_type": "markdown", + "id": "fb728cee", + "metadata": {}, + "source": [ + "### Timestamp Handling\n", + "Here we will access the timestamp (datetime) information from the Butler for our records." + ] + }, + { + "cell_type": "code", + "execution_count": 619, + "id": "df7ff31f", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0 DateTime(\"2019-09-27T00:20:59.932016000\", TAI) 120.0 (351.3806941054, -5.2403083277)\n", + "CPU times: user 126 ms, sys: 12 ms, total: 138 ms\n", + "Wall time: 175 ms\n" + ] + } + ], + "source": [ + "%%time\n", + "# Now we want to get metadata like datetime, exposure time, etc.\n", + "for i, dataId in enumerate(df[\"data_id\"]):\n", + " visitInfo = butler.get(\"calexp.visitInfo\", dataId=dataId, collections=desired_collections)\n", + " print(i, visitInfo.date, visitInfo.exposureTime, visitInfo.boresightRaDec)\n", + " break\n", + "# We have the visitInfo object for the exploration below." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 572, + "id": "3ccadfaa", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "lsst.daf.base.dateTime.dateTime.DateTime" + ] + }, + "execution_count": 572, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# That visitInfo.date format may not look familiar. Let's find out why:\n", + "type(visitInfo.date)" + ] + }, + { + "cell_type": "code", + "execution_count": 573, + "id": "d73d8119", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'2019-09-27T00:20:22.932'" + ] + }, + "execution_count": 573, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Let's convert to a plain string, UTC (handles 37 s offset).\n", + "t = Time(testing, format=\"isot\", scale=\"tai\")\n", + "str(t.utc)" + ] + }, + { + "cell_type": "code", + "execution_count": 574, + "id": "89822691", + "metadata": {}, + "outputs": [], + "source": [ + "def getTimestamps(dataIds, overwrite=False):\n", + " \"\"\"Get timestamps for a bunch of dataIds.\n", + " Convert the LSST/Butler TAI to UTC in the process.\n", + " Do this all in a chunked, multiprocessing way.\n", + " Takes about 3 minutes as of 2/1/2024 (Hayden DEEP).\n", + " BUT if we have the values cached, just read those instead, unless overwrite is True.\n", + " 2/1/2024 COC\n", + " \"\"\"\n", + " # thank you ChatGPT 4 for helping parallelize\n", + "\n", + " timestamps = []\n", + "\n", + " import glob\n", + "\n", + " cache_file = f\"{basedir}/vdr_timestamps.lst\"\n", + "\n", + " cache_file_exists = False\n", + " if len(glob.glob(cache_file)) > 0:\n", + " cache_file_exists = True\n", + "\n", + " if overwrite == False and cache_file_exists == True:\n", + " print(f\"Overwrite is False, so we will read the timestamps from file now...\")\n", + " with open(cache_file, \"r\") as f:\n", + " for line in f:\n", + " timestamps.append(line.strip())\n", + " print(f\"Recycled {len(timestamps)} from 
{cache_file}.\")\n", + " return timestamps\n", + "\n", + " if overwrite or not cache_file_exists:\n", + " timestamps = [] # Re-initialize timestamps here to ensure it's fresh\n", + "\n", + " with ProcessPoolExecutor() as executor:\n", + " dataId_chunks = list(chunked_dataIds(dataIds))\n", + " # Initialize progress bar\n", + " with progressbar.ProgressBar(max_value=len(dataId_chunks)) as bar:\n", + " # Use map for preserving order and simplifying the code\n", + " results = executor.map(get_timestamps, dataId_chunks)\n", + "\n", + " # Process results and maintain the order\n", + " for i, chunk_result in enumerate(results):\n", + " timestamps.extend(chunk_result) # Correctly extend with the result of each future\n", + " bar.update(i)\n", + "\n", + " # Write to cache if necessary\n", + " if overwrite or not cache_file_exists:\n", + " with open(cache_file, \"w\") as f:\n", + " for ts in timestamps:\n", + " print(ts, file=f)\n", + " print(f\"Wrote {len(timestamps)} lines to {cache_file} for future use.\")\n", + "\n", + " print(f\"Obtained {len(timestamps)} timestamps.\")\n", + " return timestamps" + ] + }, + { + "cell_type": "code", + "execution_count": 620, + "id": "5ea2f086", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'2019-09-27T00:20:22.932'" + ] + }, + "execution_count": 620, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Double-check that we can convert Butler timestamp (TAI) to UTC string\n", + "visitInfo = butler.get(\"calexp.visitInfo\", dataId=df[\"data_id\"].iloc()[0], collections=desired_collections)\n", + "t = Time(str(visitInfo.date).split('\"')[1], format=\"isot\", scale=\"tai\")\n", + "tutc = str(t.utc)\n", + "tutc" + ] + }, + { + "cell_type": "code", + "execution_count": 621, + "id": "7e0d33c0", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Overwrite is False, so we will read the timestamps from file now...\n", + "Recycled 47383 from 
/astro/users/coc123/kbmod_tmp/vdr_timestamps.lst.\n", + "CPU times: user 24.1 ms, sys: 9.07 ms, total: 33.2 ms\n", + "Wall time: 30.1 ms\n" + ] + } + ], + "source": [ + "%%time\n", + "\n", + "# TIMING NOTE: this took < 5 minutes 2/5/2024 COC\n", + "df[\"ut\"] = getTimestamps(dataIds=df[\"data_id\"], overwrite=False)" + ] + }, + { + "cell_type": "code", + "execution_count": 622, + "id": "adddf1e4", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0 2019-09-27T00:20:22.932\n", + "1 2019-09-27T00:22:51.015\n", + "2 2019-09-27T00:25:19.136\n", + "3 2019-09-27T00:27:47.118\n", + "4 2019-09-27T00:30:15.537\n", + " ... \n", + "47378 2020-10-17T04:00:51.409\n", + "47379 2020-10-17T04:03:19.873\n", + "47380 2020-10-17T04:05:48.949\n", + "47381 2020-10-17T04:08:17.445\n", + "47382 2020-10-17T04:10:46.218\n", + "Name: ut, Length: 47383, dtype: object" + ] + }, + "execution_count": 622, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[\"ut\"]" + ] + }, + { + "cell_type": "code", + "execution_count": 364, + "id": "a789a331", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0 : 2019-09-27T00:20:22.932 for {instrument: 'DECam', detector: 1, visit: 898286}. Dict had: 2019-09-27\n", + "1000 : 2019-09-27T02:24:03.066 for {instrument: 'DECam', detector: 12, visit: 898336}. Dict had: 2019-08-29\n", + "2000 : 2019-09-27T00:32:44.405 for {instrument: 'DECam', detector: 23, visit: 898291}. Dict had: 2019-08-29\n", + "3000 : 2019-09-27T02:36:24.497 for {instrument: 'DECam', detector: 33, visit: 898341}. Dict had: 2019-08-29\n", + "4000 : 2019-09-27T00:45:05.306 for {instrument: 'DECam', detector: 44, visit: 898296}. Dict had: 2019-08-29\n", + "5000 : 2019-09-27T02:51:16.295 for {instrument: 'DECam', detector: 54, visit: 898347}. Dict had: 2019-08-29\n", + "6000 : 2019-08-29T07:25:55.714 for {instrument: 'DECam', detector: 4, visit: 891512}. 
Dict had: 2019-08-30\n", + "7000 : 2019-08-29T06:36:25.673 for {instrument: 'DECam', detector: 14, visit: 891492}. Dict had: 2019-08-30\n", + "8000 : 2019-08-29T05:46:48.259 for {instrument: 'DECam', detector: 24, visit: 891472}. Dict had: 2019-08-29\n", + "9000 : 2019-08-29T09:11:52.823 for {instrument: 'DECam', detector: 33, visit: 891554}. Dict had: 2020-10-19\n", + "10000: 2019-08-29T08:24:43.475 for {instrument: 'DECam', detector: 43, visit: 891535}. Dict had: 2020-10-19\n", + "11000: 2019-08-29T07:39:44.133 for {instrument: 'DECam', detector: 53, visit: 891517}. Dict had: 2020-10-19\n", + "12000: 2020-10-19T03:57:38.040 for {instrument: 'DECam', detector: 1, visit: 946776}. Dict had: 2020-10-19\n", + "13000: 2020-10-19T03:55:07.913 for {instrument: 'DECam', detector: 13, visit: 946775}. Dict had: 2020-10-19\n", + "14000: 2020-10-19T03:52:39.901 for {instrument: 'DECam', detector: 24, visit: 946774}. Dict had: 2020-10-19\n", + "15000: 2020-10-19T03:50:11.828 for {instrument: 'DECam', detector: 35, visit: 946773}. Dict had: 2019-09-27\n", + "16000: 2020-10-19T03:47:43.087 for {instrument: 'DECam', detector: 46, visit: 946772}. Dict had: 2019-09-27\n", + "17000: 2020-10-19T03:45:14.564 for {instrument: 'DECam', detector: 57, visit: 946771}. Dict had: 2019-09-27\n", + "18000: 2019-08-30T07:36:47.123 for {instrument: 'DECam', detector: 7, visit: 891898}. Dict had: 2019-09-27\n", + "19000: 2019-08-30T07:11:50.193 for {instrument: 'DECam', detector: 17, visit: 891888}. Dict had: 2019-09-27\n", + "20000: 2019-08-30T06:47:05.343 for {instrument: 'DECam', detector: 27, visit: 891878}. Dict had: 2019-08-30\n", + "21000: 2019-08-30T06:22:19.105 for {instrument: 'DECam', detector: 37, visit: 891868}. Dict had: 2019-08-30\n", + "22000: 2019-08-30T05:57:29.152 for {instrument: 'DECam', detector: 47, visit: 891858}. Dict had: 2019-08-30\n", + "23000: 2019-08-30T05:32:32.635 for {instrument: 'DECam', detector: 57, visit: 891848}. 
Dict had: 2019-08-30\n", + "24000: 2019-09-28T01:46:11.541 for {instrument: 'DECam', detector: 6, visit: 898736}. Dict had: 2019-09-28\n", + "25000: 2019-09-28T03:00:31.172 for {instrument: 'DECam', detector: 16, visit: 898766}. Dict had: 2019-09-28\n", + "26000: 2019-09-28T00:17:03.748 for {instrument: 'DECam', detector: 27, visit: 898700}. Dict had: 2019-09-28\n", + "27000: 2019-09-28T01:31:18.723 for {instrument: 'DECam', detector: 37, visit: 898730}. Dict had: 2019-09-28\n", + "28000: 2019-09-28T02:45:39.745 for {instrument: 'DECam', detector: 47, visit: 898760}. Dict had: 2019-09-28\n", + "29000: 2019-09-28T04:00:09.666 for {instrument: 'DECam', detector: 57, visit: 898790}. Dict had: 2019-08-28\n", + "30000: 2019-08-28T06:43:48.523 for {instrument: 'DECam', detector: 7, visit: 891114}. Dict had: 2019-08-28\n", + "31000: 2019-08-28T05:29:20.494 for {instrument: 'DECam', detector: 17, visit: 891084}. Dict had: 2019-08-28\n", + "32000: 2019-08-28T08:31:09.143 for {instrument: 'DECam', detector: 26, visit: 891157}. Dict had: 2019-08-28\n", + "33000: 2019-08-28T07:21:26.793 for {instrument: 'DECam', detector: 36, visit: 891129}. Dict had: 2019-08-28\n", + "34000: 2019-08-28T06:06:34.210 for {instrument: 'DECam', detector: 46, visit: 891099}. Dict had: 2019-08-28\n", + "35000: 2019-08-28T09:08:44.560 for {instrument: 'DECam', detector: 55, visit: 891172}. Dict had: 2019-09-28\n", + "36000: 2019-09-29T00:19:06.349 for {instrument: 'DECam', detector: 5, visit: 899020}. Dict had: 2019-09-29\n", + "37000: 2019-09-29T01:58:29.441 for {instrument: 'DECam', detector: 15, visit: 899060}. Dict had: 2019-09-29\n", + "38000: 2019-09-29T03:37:44.590 for {instrument: 'DECam', detector: 25, visit: 899100}. Dict had: 2019-09-29\n", + "39000: 2019-09-29T01:18:42.912 for {instrument: 'DECam', detector: 36, visit: 899044}. Dict had: 2019-09-29\n", + "40000: 2019-09-29T02:58:02.739 for {instrument: 'DECam', detector: 46, visit: 899084}. 
Dict had: 2019-09-29\n", + "41000: 2019-09-29T00:38:58.257 for {instrument: 'DECam', detector: 57, visit: 899028}. Dict had: 2019-09-29\n", + "42000: 2020-10-17T03:45:59.925 for {instrument: 'DECam', detector: 6, visit: 946166}. Dict had: 2020-10-17\n", + "43000: 2020-10-17T01:26:44.472 for {instrument: 'DECam', detector: 17, visit: 946110}. Dict had: 2020-10-17\n", + "44000: 2020-10-17T03:06:21.338 for {instrument: 'DECam', detector: 27, visit: 946150}. Dict had: 2020-10-17\n", + "45000: 2020-10-17T00:46:58.038 for {instrument: 'DECam', detector: 38, visit: 946094}. Dict had: 2020-10-17\n", + "46000: 2020-10-17T02:26:33.210 for {instrument: 'DECam', detector: 48, visit: 946134}. Dict had: 2020-10-17\n", + "47000: 2020-10-17T04:05:48.949 for {instrument: 'DECam', detector: 58, visit: 946174}. Dict had: 2020-10-17\n" + ] + } + ], + "source": [ + "# This is for coming back to later to make sure the stamps line up\n", + "# IGNORE FOR NOW 2/6/2024 COC\n", + "# for i in range(0,len(vdr_ids),1000):\n", + "# dataId = vdr_ids[i]\n", + "# visitInfo = butler.get(\"calexp.visitInfo\", dataId=dataId, collections=desired_collections)\n", + "# t = Time(str(visitInfo.date).split('\"')[1], format=\"isot\", scale=\"tai\")\n", + "# tutc = str(t.utc)\n", + "# print(f\"{i!s:5}: {tutc} for {dataId}. Dict had: {id_to_date[dataId]}\")" + ] + }, + { + "cell_type": "markdown", + "id": "6f355bcf", + "metadata": {}, + "source": [ + "### Working with the Regions\n", + "\n", + "We still don't know what will be ideal to do for Region Search.\\\n", + "So, to start with, we will work on extracting the (RA, Dec) of (1) the center coordinate of a chip, and (2) the four corners associated with a chip." 
+ ] + }, + { + "cell_type": "markdown", + "id": "f060a724", + "metadata": {}, + "source": [ + "#### We will start with corners (i.e., quadrilateral vertices from the convexPolygon sphgeom.regions)" + ] + }, + { + "cell_type": "code", + "execution_count": 578, + "id": "e45d7199", + "metadata": {}, + "outputs": [], + "source": [ + "def getRegionCorners(region):\n", + " \"\"\"\n", + " Using the 2D boundingBox() from an input region (convexPolygon), we\n", + " extract the (RA, Dec) coordinates of each vertex.\n", + " As there are four vertices, the input object is a quadrilateral.\n", + " 2/2/2024 COC\n", + " \"\"\"\n", + " corners = []\n", + " bbox = region.getBoundingBox()\n", + " corners.append((bbox.getLon().getA().asDegrees(), bbox.getLat().getA().asDegrees()))\n", + " corners.append((bbox.getLon().getA().asDegrees(), bbox.getLat().getB().asDegrees()))\n", + " corners.append((bbox.getLon().getB().asDegrees(), bbox.getLat().getA().asDegrees()))\n", + " corners.append((bbox.getLon().getB().asDegrees(), bbox.getLat().getB().asDegrees()))\n", + " return corners" + ] + }, + { + "cell_type": "code", + "execution_count": 579, + "id": "9b278b50", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[(352.30950511932116, -4.930880058593892),\n", + " (352.30950511932116, -4.7450820235469715),\n", + " (352.64644359666477, -4.930880058593892),\n", + " (352.64644359666477, -4.7450820235469715)]" + ] + }, + "execution_count": 579, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Example\n", + "corners = getRegionCorners(example_vdr_ref.region)\n", + "corners" + ] + }, + { + "cell_type": "code", + "execution_count": 580, + "id": "b37bfe47", + "metadata": {}, + "outputs": [], + "source": [ + "def getMinMaxRaDec(ra_dec_touples, verbose=False):\n", + " \"\"\"\n", + " Highly unoptimized way to find and return\n", + " (minRA, maxRA) and (minDec, MaxDec).\n", + " 2/2/2024 COC\n", + " \"\"\"\n", + " min_ra = min([i[0] for i in 
ra_dec_touples])\n", + " min_dec = min([i[1] for i in ra_dec_touples])\n", + " max_ra = max([i[0] for i in ra_dec_touples])\n", + " max_dec = max([i[1] for i in ra_dec_touples])\n", + " if verbose:\n", + " print(f\"RA range: {min_ra} to {max_ra}\")\n", + " print(f\"Dec range: {min_dec} to {max_dec}\")\n", + " return (min_ra, max_ra), (min_dec, max_dec)" + ] + }, + { + "cell_type": "code", + "execution_count": 581, + "id": "ef329736", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "((352.30950511932116, 352.64644359666477),\n", + " (-4.930880058593892, -4.7450820235469715))" + ] + }, + "execution_count": 581, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Example\n", + "getMinMaxRaDec(ra_dec_touples=corners)" + ] + }, + { + "cell_type": "markdown", + "id": "d95593bb", + "metadata": {}, + "source": [ + "#### Centers\n", + "\n", + "It may be easier to just work with center (RA, Dec) coordinates.\\\n", + "We can later store this in a DB (e.g., Postgres) for cone searches." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 582, + "id": "4c89be9e", + "metadata": {}, + "outputs": [], + "source": [ + "def getCenterRaDec(region):\n", + " \"\"\"\n", + " We pull the 2D boundingBox (not the boundingBox3d) from a region.\n", + " Then we extract the center's (RA, Dec) coordinates.\n", + " 2/2/2024 COC\n", + " \"\"\"\n", + " bbox_center = region.getBoundingBox().getCenter()\n", + " ra = bbox_center.getLon().asDegrees()\n", + " dec = bbox_center.getLat().asDegrees()\n", + " return (ra, dec)" + ] + }, + { + "cell_type": "code", + "execution_count": 182, + "id": "8e1e764c", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(352.477974357993, -4.837981041070432)" + ] + }, + "execution_count": 182, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "getCenterRaDec(tmpref.region)" + ] + }, + { + "cell_type": "code", + "execution_count": 624, + "id": "8e54db29", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 363 ms, sys: 19 ms, total: 382 ms\n", + "Wall time: 379 ms\n" + ] + } + ], + "source": [ + "%%time\n", + "df[\"center_coord\"] = [getCenterRaDec(i) for i in df[\"region\"]]" + ] + }, + { + "cell_type": "code", + "execution_count": 625, + "id": "64908868", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "47383" + ] + }, + "execution_count": 625, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(df[\"center_coord\"])" + ] + }, + { + "cell_type": "code", + "execution_count": 626, + "id": "625de417", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(351.0694028401149, -4.336598368890197)" + ] + }, + "execution_count": 626, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[\"center_coord\"].iloc()[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 627, + "id": "67b57215", + "metadata": {}, + "outputs": [ + { + "name": 
"stdout", + "output_type": "stream", + "text": [ + "CPU times: user 1.2 s, sys: 26 ms, total: 1.23 s\n", + "Wall time: 1.22 s\n" + ] + }, + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 627, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "%%time\n", + "# Let us visualize where on the sky our chip centers reside\n", + "fig = plt.figure(figsize=(4, 4))\n", + "plt.xlabel(\"RA\")\n", + "plt.ylabel(\"Dec\")\n", + "plt.scatter(\n", + " [i[0] for i in df[\"center_coord\"].iloc()], [i[1] for i in df[\"center_coord\"].iloc()], s=1, alpha=0.5\n", + ")" + ] + }, + { + "cell_type": "markdown", + "id": "41d4fd38", + "metadata": {}, + "source": [ + "The DECam mosaic shape is clearly visible, thrice.\\\n", + "There is an offset from each of the three pointings, too.\n", + "\n", + "In the most simple approach, each of these \"dots\" represents a set of images that can be fed to KBMOD." + ] + }, + { + "cell_type": "code", + "execution_count": 554, + "id": "c2dc4e1a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{instrument: 'DECam', detector: 1, visit: 898286}" + ] + }, + "execution_count": 554, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# look at the first dataId, which does not show up in a pretty way in the DF\n", + "df[\"data_id\"].iloc[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 435, + "id": "580ac4ed", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 435, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Let us look at just detector 62 pointings.\n", + "# This will give us a decent idea of how many pointings there are (here, 8).\n", + "\n", + "df62 = df[df[\"detector\"] == 62]\n", + "plt.clf()\n", + "plt.scatter(*zip(*df62[\"center_coord\"]), s=1, alpha=0.5)" + ] + }, + { + "cell_type": "code", + "execution_count": 237, + "id": "6ee544b8", + "metadata": {}, + "outputs": [], + "source": [ + "# chip62_coord0 = df62['center_coord'][0]" + ] + }, + { + "cell_type": "markdown", + "id": "df7d441d", + "metadata": {}, + "source": [ + "### Region Matching\n", + "Here region matching means comparing two lsst.sphgeom.region objects.\\\n", + "Purpose: to see if they have any overlap whatsoever. \\\n", + "NOTE: a partial or full overlap is called an \"intersection\" in sphgeom lingo.\n", + "\n", + "NOTE: Work in progress, but pausing this avenue for now. 2/2/2024 COC" + ] + }, + { + "cell_type": "code", + "execution_count": 589, + "id": "2c770982", + "metadata": {}, + "outputs": [], + "source": [ + "# manual region-region matching between all chips\n", + "# NOTE: estimate time is 1 hour, so skipping this for now\n", + "\n", + "doit = False\n", + "if doit == True:\n", + " lastTime = time.time()\n", + "\n", + " matches = {}\n", + "\n", + " with progressbar.ProgressBar(max_value=len(vdr_regions)) as bar:\n", + " for i, l in enumerate(vdr_regions):\n", + " my_id = vdr_ids[i]\n", + " matches[my_id] = []\n", + " for j, r in enumerate(vdr_regions):\n", + " if i == j:\n", + " continue\n", + " if l.intersects(r):\n", + " matches[my_id].append(vdr_ids[j])\n", + " bar.update(i)\n", + " elapsed = round(time.time() - lastTime, 1)\n", + " print(f\"It took {elapsed} seconds.\")" + ] + }, + { + "cell_type": "markdown", + "id": "ba8db514", + "metadata": {}, + "source": [ + "To be continued..." 
+ ] + }, + { + "cell_type": "markdown", + "id": "f00d9b2f", + "metadata": {}, + "source": [ + "### HTM Exploration" + ] + }, + { + "cell_type": "code", + "execution_count": 202, + "id": "2fcdd8b3", + "metadata": {}, + "outputs": [], + "source": [ + "# Colin playing 1/15/2024 COC\n", + "def getHTMstuff(ra, dec, level=7, verbose=False):\n", + " \"\"\"\n", + " 1/16/2024 COC inception.\n", + " A function that\n", + " 1. Fetches an HTM ID for a pixelization of a user-supplied level.\n", + " 2. Determines the angular size (radius, in arcseconds) of the pixelization level.\n", + " LSST stores the unique HTM ID for level 7 pixelization in the Butler, hence the default level=7.\n", + " \"\"\"\n", + " pixelization = lsst.sphgeom.HtmPixelization(level)\n", + "\n", + " try: # kludges; use the Butler way, but if being passed normal numbers, use those\n", + " ra = ra.asDegrees()\n", + " except AttributeError as msg:\n", + " pass\n", + " try:\n", + " dec = dec.asDegrees()\n", + " except AttributeError as msg:\n", + " pass\n", + "\n", + " htm_id = pixelization.index(\n", + " lsst.sphgeom.UnitVector3d(\n", + " # sphgeom.LonLat.fromDegrees(ra.asDegrees(), dec.asDegrees())\n", + " lsst.sphgeom.LonLat.fromDegrees(ra, dec)\n", + " )\n", + " )\n", + " circle = pixelization.triangle(htm_id).getBoundingCircle()\n", + " scale = circle.getOpeningAngle().asDegrees() * 3600.0\n", + " level = pixelization.getLevel()\n", + " if verbose:\n", + " print(f\"HTM ID={htm_id} at level={level} is bounded by a circle of radius ~{scale:0.2f} arcsec.\")\n", + " return (htm_id, scale)" + ] + }, + { + "cell_type": "code", + "execution_count": 204, + "id": "c0916372", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "HTM ID=189361 at level=7 is bounded by a circle of radius ~1895.11 arcsec.\n" + ] + }, + { + "data": { + "text/plain": [ + "(189361, 1895.111766130883)" + ] + }, + "execution_count": 204, + "metadata": {}, + "output_type": "execute_result" + } + 
], + "source": [ + "getHTMstuff(vdr_centers[0][0], vdr_centers[0][1], verbose=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 588, + "id": "47c447c5", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0\n" + ] + } + ], + "source": [ + "dsRefs = butler.registry.queryDatasets(\n", + " datasetType=desired_datasetTypes[0], htm7=147116, collections=desired_collections\n", + ")\n", + "print(len(sorted(dsRefs)))" + ] + }, + { + "cell_type": "markdown", + "id": "d59bcdde", + "metadata": {}, + "source": [ + "To be continued..." + ] + }, + { + "cell_type": "markdown", + "id": "10339ac6", + "metadata": {}, + "source": [ + "### Brute force approach for (small) discrete datasets\n", + "\n", + "The idea here is that we can organize discrete piles of images, such as DEEP, DDF." + ] + }, + { + "cell_type": "code", + "execution_count": 441, + "id": "048e38e1", + "metadata": {}, + "outputs": [], + "source": [ + "def find_overlapping_coords(df, uncertainty_radius, overwrite=False):\n", + " \"\"\"\n", + "\n", + " Added caching 2/5/2024 COC\n", + " \"\"\"\n", + " import glob\n", + "\n", + " cache_file = f\"{basedir}/overlapping_sets.pickle\"\n", + "\n", + " cache_exists = False\n", + " if len(glob.glob(cache_file)) > 0:\n", + " cache_exists = True\n", + "\n", + " if overwrite == False and cache_exists == True:\n", + " with open(cache_file, \"rb\") as f:\n", + " print(f\"Recycling {cache_file} as overwrite={overwrite}.\")\n", + " overlapping_sets = pickle.load(f)\n", + " return overlapping_sets\n", + "\n", + " df_copy = df.copy()\n", + "\n", + " # Assuming uncertainty_radius is provided as a float in arcseconds\n", + " uncertainty_radius_as = uncertainty_radius * u.arcsec\n", + "\n", + " all_coords = SkyCoord(\n", + " ra=[x[0] for x in df_copy[\"center_coord\"]] * u.degree,\n", + " dec=[x[1] for x in df_copy[\"center_coord\"]] * u.degree,\n", + " )\n", + "\n", + " overlapping_sets = {}\n", + " set_counter = 1\n", + " 
processed_data_ids = []\n", + "\n", + " periodic_update_counter = 0\n", + " with progressbar.ProgressBar(max_value=len(all_coords)) as bar:\n", + " for index, coord in enumerate(all_coords):\n", + " data_id = df_copy.iloc[index][\"data_id\"]\n", + " if data_id not in processed_data_ids:\n", + " distances = (\n", + " coord.separation(all_coords).to(u.arcsec).value\n", + " ) # Convert distances to arcseconds as numeric values\n", + "\n", + " # Perform comparison as numeric values, bypassing direct unit comparison\n", + " within_radius = (distances <= uncertainty_radius_as.value) & (distances > 0)\n", + "\n", + " if any(within_radius):\n", + " overlapping_indices = [\n", + " i\n", + " for i, distance in enumerate(distances)\n", + " if (distance <= uncertainty_radius_as.value) and i != index\n", + " ]\n", + " overlapping_data_ids = df_copy.iloc[overlapping_indices][\"data_id\"].tolist()\n", + " overlapping_data_ids.append(data_id)\n", + "\n", + " processed_data_ids.extend(overlapping_data_ids)\n", + "\n", + " overlapping_sets[f\"set_{set_counter}\"] = overlapping_data_ids\n", + " set_counter += 1\n", + " #\n", + " # mitigate too much output 2/5/2024 COC\n", + " periodic_update_counter += 1\n", + " if periodic_update_counter >= 250:\n", + " periodic_update_counter = 0\n", + " bar.update(index)\n", + "\n", + " with open(cache_file, \"wb\") as f:\n", + " pickle.dump(overlapping_sets, f, protocol=pickle.HIGHEST_PROTOCOL)\n", + " print(f\"Saved overlapping_sets to {cache_file} for caching purposes.\")\n", + "\n", + " return overlapping_sets" + ] + }, + { + "cell_type": "code", + "execution_count": 442, + "id": "25710a99", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Recycling /astro/users/coc123/kbmod_tmp/overlapping_sets.pickle as overwrite=False.\n", + "CPU times: user 173 ms, sys: 22.1 ms, total: 195 ms\n", + "Wall time: 192 ms\n" + ] + } + ], + "source": [ + "%%time\n", + "\n", + "# TIMING NOTE: this takes about 1.25 
hours [TODO update that number]\n", + "# TODO test caching\n", + "\n", + "overlapping_sets = find_overlapping_coords(df=df, uncertainty_radius=30, overwrite=False)" + ] + }, + { + "cell_type": "code", + "execution_count": 590, + "id": "5f2d5a03", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "There are 488 discrete chip-level pointings.\n" + ] + } + ], + "source": [ + "print(f\"There are {len(overlapping_sets.keys())} discrete chip-level pointings.\") # should be 488" + ] + }, + { + "cell_type": "code", + "execution_count": 591, + "id": "9ed24e28", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 503 ms, sys: 24.9 ms, total: 527 ms\n", + "Wall time: 526 ms\n" + ] + }, + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 591, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "%%time\n", + "\n", + "# Looking at the processed data.\n", + "\n", + "# Create a lookup table for data_id to center_coord\n", + "id_to_coord = df.set_index(\"data_id\")[\"center_coord\"].to_dict()\n", + "\n", + "# Preparing for bulk plotting (if every point uses the same label, adjust as needed)\n", + "coords = [id_to_coord[overlapping_sets[p][0]] for p in overlapping_sets]\n", + "x_coords, y_coords = zip(*coords) # Assuming coords are tuples or lists\n", + "\n", + "# Plotting in bulk\n", + "plt.scatter(x_coords, y_coords, s=1)" + ] + }, + { + "cell_type": "code", + "execution_count": 594, + "id": "55ffd374", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'2019-09-27T00:20:22.932'" + ] + }, + "execution_count": 594, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[\"ut\"].iloc()[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 595, + "id": "fcd39c41", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + ":19: MatplotlibDeprecationWarning: The get_cmap function was deprecated in Matplotlib 3.7 and will be removed two minor releases later. Use ``matplotlib.colormaps[name]`` or ``matplotlib.colormaps.get_cmap(obj)`` instead.\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 6.24 s, sys: 526 ms, total: 6.77 s\n", + "Wall time: 6.24 s\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "%%time\n", + "\n", + "# TIMING NOTE: this requires about 7 seconds\n", + "\n", + "from matplotlib.cm import get_cmap\n", + "from matplotlib.colors import Normalize\n", + "\n", + "# Convert \"ut\" column to datetime\n", + "df[\"ut_datetime\"] = pd.to_datetime(df[\"ut\"])\n", + "\n", + "# Create lookup tables for data_id to center_coord and ut_datetime\n", + "id_to_coord = df.set_index(\"data_id\")[\"center_coord\"].to_dict()\n", + "id_to_date = df.set_index(\"data_id\")[\"ut_datetime\"].dt.date.to_dict()\n", + "\n", + "# Extract unique dates and create a color map\n", + "unique_dates = sorted(set(id_to_date.values()))\n", + "date_to_color = {date: i for i, date in enumerate(unique_dates)}\n", + "norm = Normalize(vmin=0, vmax=len(unique_dates) - 1)\n", + "cmap = get_cmap(\"tab20\", len(unique_dates)) # Choose a colormap that fits the data\n", + "\n", + "# Preparing data for plotting\n", + "coords = [id_to_coord[overlapping_sets[p][0]] for p in overlapping_sets]\n", + "dates = [id_to_date[overlapping_sets[p][0]] for p in overlapping_sets]\n", + "colors = [cmap(norm(date_to_color[date])) for date in dates]\n", + "\n", + "# Plotting\n", + "lcount = 0\n", + "for (x, y), color, date in zip(coords, colors, dates):\n", + " lcount += 1\n", + " plt.scatter(x, y, color=color, label=date.strftime(\"%Y-%m-%d\"), alpha=0.75, s=2)\n", + "\n", + "# To avoid duplicate labels in the legend, handle legend entries manually\n", + "handles, labels = plt.gca().get_legend_handles_labels()\n", + "by_label = dict(zip(labels, handles)) # Removing duplicates\n", + "plt.legend(by_label.values(), by_label.keys())\n", + "plt.savefig(f\"{basedir}/pointings.pdf\")\n", + "# plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": 596, + "id": "418c97ee", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Index(['data_id', 'region', 'detector', 'uri', 'center_coord', 'ut',\n", + " 
'ut_datetime'],\n", + " dtype='object')" + ] + }, + "execution_count": 596, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.columns" + ] + }, + { + "cell_type": "code", + "execution_count": 597, + "id": "d06ed515", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[datetime.date(2019, 8, 28),\n", + " datetime.date(2019, 8, 29),\n", + " datetime.date(2019, 8, 30),\n", + " datetime.date(2019, 9, 27),\n", + " datetime.date(2019, 9, 28),\n", + " datetime.date(2019, 9, 29),\n", + " datetime.date(2020, 10, 17),\n", + " datetime.date(2020, 10, 19)]" + ] + }, + "execution_count": 597, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Here are the unique dates found in the discrete dataset\n", + "unique_dates = sorted(set(id_to_date.values()))\n", + "unique_dates" + ] + }, + { + "cell_type": "markdown", + "id": "3dc0bb58", + "metadata": {}, + "source": [ + "##### Double-checking a single date" + ] + }, + { + "cell_type": "code", + "execution_count": 598, + "id": "58158f47", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "data_id (instrument, detector, visit)\n", + "region ConvexPolygon([UnitVector3d(0.9847372525065534...\n", + "detector 1\n", + "uri file:///epyc/users/smotherh/DEEP/PointingGroup...\n", + "center_coord (351.0694028401149, -4.336598368890197)\n", + "ut 2019-09-27T00:20:22.932\n", + "ut_datetime 2019-09-27 00:20:22.932000\n", + "Name: 0, dtype: object" + ] + }, + "execution_count": 598, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.iloc()[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 599, + "id": "2ff625e7", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "datetime.date(2019, 9, 27)" + ] + }, + "execution_count": 599, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "id_to_date[df[\"data_id\"].iloc()[0]]" + ] + }, + { + "cell_type": "code", + 
"execution_count": 600, + "id": "c3b48b13", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(351.0694028401149, -4.336598368890197)" + ] + }, + "execution_count": 600, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "id_to_coord[df[\"data_id\"].iloc()[0]]" + ] + }, + { + "cell_type": "code", + "execution_count": 601, + "id": "16506478", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "6267" + ] + }, + "execution_count": 601, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# We will make a dataframe with just the date we are checking\n", + "df20190828 = df[df[\"ut_datetime\"].dt.date == parser.parse(\"2019-08-28\").date()]\n", + "len(df20190828)" + ] + }, + { + "cell_type": "code", + "execution_count": 603, + "id": "166c9137", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 933 ms, sys: 33 ms, total: 966 ms\n", + "Wall time: 962 ms\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAjgAAAGxCAYAAABvIsx7AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAA0xUlEQVR4nO3de3xU1b3///cQkiFEMgVGSFImhKJIy0UuUQSsgGDAclOUS6FaHiKtp6LSAxWwxyZYa5CKN/S0tqVIkRZogUIFWpBbKxx/QhAFeowQCASTkCI4w81JgPX9oz/mMOQ2g0wms3g9H4/9eMzsvfbe67Mmm3mz954ZhzHGCAAAwCINot0BAACAq42AAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADoEobN27UQw89pPbt2yspKUlf/epXNXz4cOXl5VVqu3PnTg0YMEDXXXedvvKVr2jEiBE6cOBApXYvv/yyRowYoTZt2sjhcKhv377V7v9vf/ubevfurcTERLlcLg0dOlR79+4Nq4ZQ+1VSUqLx48erRYsWatSokTp37qx58+aFvJ9wxsoYo1//+tfq3r27kpOT1bx5c/Xp00erV68OqzYANSPgAKjSL37xCxUWFuqJJ57QmjVr9Morr6isrEy33XabNm7cGGj38ccfq2/fviovL9fSpUv129/+Vp988om++c1v6l//+lfQNn/5y1/q0KFDuvPOO3X99ddXu++VK1fq7rvvVosWLbRs2TL98pe/1L59+/TNb35TBQUFIfU/1H55vV7dfvvt2rBhg2bPnq2VK1eqW7duevjhh/Xiiy9e1bGSpOzsbH3ve9/TrbfeqmXLlunNN9+U0+nUkCFDtHz58pD2ByAEBgCqcPTo0UrzTp48aVq2bGn69+8fmDdy5EjjdruN1+sNzCssLDTx8fHmySefDFr//PnzgccdOnQwffr0qXLfN910k+ncubO5cOFC0DYTEhLM2LFjQ+p/qP3Kzc01ksyOHTuC1s/KyjJJSUnmxIkTte4r1LEyxpivfvWr5vbbbw+ad/bsWeNyucywYcNCKQ1ACDiDA6BKLVq0qDTvuuuu0ze+8Q0VFRVJks6dO6e3335b9913n5KTkwPtWrdurX79+mnFihVB6zdoUPs/OZ999pny8/N19913y+FwBG2zY8eO+vOf/6zz58/XuI1w+rV161a1bNlS3bt3D9rGkCFDdPr0af31r3+ttc+hjNVF8fHxcrlcQfMaNWoUmABcHQQcACHzer3auXOnOnToIEkqKCjQ2bNn1blz50ptO3furP379+uLL74Iax/l5eWSJKfTWWmZ0+nUmTNnar1MFU6/ysvLq92XJH300Udh9f+iy8fqoieeeEJ//etfNW/ePJ04cUIlJSX6z//8T3m9Xj3++ONXtC8AlRFwAITs0Ucf1enTp/XjH/9Y0r/PtkhSs2bNKrVt1qyZjDE6ceJEWPto2bKlmjVrpq1btwbN//zzz7Vnz56g/VYnnH594xvf0JEjR3T48OGgdu+++25I+6rO5WN10eTJk/X666/r0UcfVbNmzZSWlqYFCxboL3/5i3r37n1F+wJQGQEHQEiefvppLVq0SC+99FKlyzmXXkq6XE3LqtKgQQM9+uij2rBhg37605+qrKxM+/fv13e+8x2dOXMm0EaSLly4oHPnzgWmyy9dhdKv733ve4qPj9e4ceO0d+9effbZZ3r99de1ZMmSoH0ZY4L2de7cuWq3XdNYzZ8/X0888YQmTZqkd955R2vWrFFWVpaGDx+uv/3tb2GNFYAaRPkeIAAxICcnx0gyP/vZz4Lmf/zxx0aSef311yutM3XqVONwOMzZs2er3GZNNxlXVFSYH/7whyYhIcFIMp
LM4MGDzcMPP2wkmaKiImOMMd/97ncDyyUFthduv9asWWM8Hk9gOx6Px8ydO9dIMj/96U+NMcZs2rQpaF+SzMGDB0MeK2OMOX78uElMTDSPPvpopWV9+vQxGRkZVY4HgPA1rPNEBSCmzJw5Uzk5OcrJydFTTz0VtKxt27ZKTEzU7t27K623e/du3XDDDVd042zDhg314osv6plnntHBgwfldruVmpqqgQMHqk2bNmrVqpUkKScnR5MmTQqs16RJkyvq1913361Dhw5p//79OnfunNq1a6elS5dKku644w5JUvfu3bV9+/agbaWlpQU9r2msJCk/P19nz57VLbfcUmlZZmamtmzZolOnTum6664LaZwA1CDaCQtA/fXMM88YSea//uu/qm0zatQo06JFC+Pz+QLzDh06ZBISEsy0adOqXa+mMzhVycvLM3Fxcebll18Oqf2V9ssYY/x+v+nRo4fp0qVLyP0LZawOHTpkJJlHHnkkaP6FCxdM7969TdOmTYM+Gg/gynEGB0CV5syZo5/85CcaNGiQBg8erPfeey9o+W233Sbp32ctbrnlFg0ZMkTTp0/XF198oZ/85Cdyu92aMmVK0Do7duxQYWGhJMnn88kYoz/96U+SpFtuuUWtW7eWJG3evFnbt29X586dZYzR+++/r+eff16DBg0KOmNTk3D69dhjj6lv375q3ry5Dhw4oFdffVVHjhzRli1brupYpaena8SIEfrVr34lp9Opb33rW/L7/VqwYIG2bt2qn/70p2HfswSgGtFOWADqpz59+lS65+TS6VI7duww/fv3N40bNzbJycnmnnvuMfv376+0zcvvmbl0mj9/fqDd1q1bTY8ePUxycrJxOp2mY8eO5oUXXjDl5eVh1RBqv4YPH25SU1NNfHy8SUlJMePHjzeFhYUh7yecsTp79qz5+c9/bjp37myaNGlimjVrZm677Tbz1ltvcfYGuIocxhhTt5EKAAAgsviYOAAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAda7JL/q7cOGCiouL1aRJE75UCwCAGGGM0cmTJ5WWlhb4IdzqXJMBp7i4WB6PJ9rdAAAAV6CoqCjwm3TVuSYDzsUf5CsqKlJycnKUewMAAELh8/nk8XgC7+M1uSYDzsXLUsnJyQQcAABiTCi3l3CTMQAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWuSZ/bBMAIGVMXx147JB0cNbg6HUGuMoIOEAMuPSNqJA3IUSAiXYHgKuMS1QAAMA6EQs4hYWFmjBhgtq0aaPExES1bdtW2dnZKi8vr3E9h8NR5fTzn/880KZv376Vlo8ZMyZSpQCAlbK+0UJxDikxvoEm978h2t0BrqqIXaL6+OOPdeHCBb3xxhu64YYbtGfPHk2cOFGnT5/WCy+8UO16JSUlQc/Xrl2rCRMm6L777guaP3HiRD3zzDOB54mJiVe3AKAe4bIUIuFXD94S7S4AEROxgDNo0CANGjQo8PxrX/ua8vPz9Ytf/KLGgJOSkhL0fOXKlerXr5++9rWvBc1v3LhxpbYAAABSHd+D4/V61axZs5DbHz16VKtXr9aECRMqLVu0aJHcbrc6dOigqVOn6uTJk9Vux+/3y+fzBU0AAMBedfYpqoKCAs2dO1dz5swJeZ0FCxaoSZMmGjFiRND8cePGqU2bNkpJSdGePXs0Y8YMffjhh1q/fn2V28nNzdXMmTO/VP8BAEDscBhjwvp0YE5OTq1hYfv27crMzAw8Ly4uVp8+fdSnTx/95je/CXlf7du311133aW5c+fW2C4vL0+ZmZnKy8tTt27dKi33+/3y+/2B5z6fTx6PR16vV8nJySH3BwAARI/P55PL5Qrp/TvsMziTJk2q9RNLGRkZgcfFxcXq16+fevbsqV/96lch7+cf//iH8vPztWTJklrbdu
vWTfHx8dq3b1+VAcfpdMrpdIa8bwAAENvCDjhut1tutzuktp9++qn69eun7t27a/78+WrQIPRbfubNm6fu3bvr5ptvrrXt3r17VVFRodTU1JC3DwAA7BWxm4yLi4vVt29feTwevfDCC/rXv/6l0tJSlZaWBrVr3769VqxYETTP5/Ppj3/8ox5++OFK2y0oKNAzzzyjHTt2qLCwUGvWrNHIkSPVtWtX9e7dO1LlAACAGBKxm4zXrVun/fv3a//+/WrVqlXQsktv+8nPz5fX6w1avnjxYhlj9O1vf7vSdhMSErRhwwa98sorOnXqlDwejwYPHqzs7GzFxcVFphgAABBTwr7J2Abh3KQEAADqh3Dev/ktKgAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWIeAAAADrEHAAAIB1CDgAAMA6BBwAAGCdhtHuAFDfZExfHXhcOGtwFHtS/zFWoWOsQsdY4WrgDA4AALAOAQcAAFjHYYwx0e5EXfP5fHK5XPJ6vUpOTo52dwAAQAjCef/mDA4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOhENOMOGDVN6eroaNWqk1NRUPfDAAyouLq5xHWOMcnJylJaWpsTERPXt21d79+4NauP3+/XYY4/J7XYrKSlJw4YN05EjRyJZCgAAiCERDTj9+vXT0qVLlZ+fr2XLlqmgoED3339/jevMnj1bL774ol577TVt375dKSkpuuuuu3Ty5MlAm8mTJ2vFihVavHix3n33XZ06dUpDhgzR+fPnI1kOAACIEQ5jjKmrna1atUr33HOP/H6/4uPjKy03xigtLU2TJ0/WtGnTJP37bE3Lli31/PPP6/vf/768Xq+uv/56LVy4UKNHj5YkFRcXy+PxaM2aNRo4cGCt/fD5fHK5XPJ6vUpOTr66RQIAgIgI5/27zu7BOX78uBYtWqRevXpVGW4k6eDBgyotLVVWVlZgntPpVJ8+fbRt2zZJUl5enioqKoLapKWlqWPHjoE2l/P7/fL5fEETAACwV8QDzrRp05SUlKTmzZvr8OHDWrlyZbVtS0tLJUktW7YMmt+yZcvAstLSUiUkJKhp06bVtrlcbm6uXC5XYPJ4PF+mJAAAUM+FHXBycnLkcDhqnHbs2BFo/6Mf/UgffPCB1q1bp7i4OD344IOq7aqYw+EIem6MqTTvcjW1mTFjhrxeb2AqKioKsVoAABCLGoa7wqRJkzRmzJga22RkZAQeu91uud1utWvXTl//+tfl8Xj03nvvqWfPnpXWS0lJkfTvszSpqamB+WVlZYGzOikpKSovL9eJEyeCzuKUlZWpV69eVfbH6XTK6XSGXCMAAIhtYQeci4HlSlw8c+P3+6tc3qZNG6WkpGj9+vXq2rWrJKm8vFxbtmzR888/L0nq3r274uPjtX79eo0aNUqSVFJSoj179mj27NlX1C8AAGCXsANOqN5//329//77uv3229W0aVMdOHBAP/nJT9S2bdugszft27dXbm6u7r33XjkcDk2ePFnPPfecbrzxRt1444167rnn1LhxY40dO1aS5HK5NGHCBE2ZMkXNmzdXs2bNNHXqVHXq1EkDBgyIVDkAACCGRCzgJCYmavny5crOztbp06eVmpqqQYMGafHixUGXi/Lz8+X1egPPn3zySZ09e1Y/+MEPdOLECfXo0UPr1q1TkyZNAm1eeuklNWzYUKNGjdLZs2fVv39/vfnmm4qLi4tUOQAAIIbU6ffg1Bd8Dw4AALEnnPfviJ3BAXD1ZExfHXhcOGtwFHtS/zFWobt0rCTGC3Yh4CBqeCMCECsIg7GHXxMHAADW4QwOEAP432LoGKvQMVawGTcZc5MxAAAxoV
7+2CYAAEBdIeAAAADrEHAAAIB1CDgAAMA6BBwAAGAdAg4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWIeAAAADrNIx2B1A3MqavDjwunDU4ij2p3y4dJ4mxqg1/V6FjrELHWIWOsaoeZ3AAAIB1CDgAAMA6DmOMiXYn6prP55PL5ZLX61VycnK0uwMAAEIQzvt3RM/gDBs2TOnp6WrUqJFSU1P1wAMPqLi4uNr2FRUVmjZtmjp16qSkpCSlpaXpwQcfrLRO37595XA4gqYxY8ZEshQAABBDIhpw+vXrp6VLlyo/P1/Lli1TQUGB7r///mrbnzlzRjt37tTTTz+tnTt3avny5frkk080bNiwSm0nTpyokpKSwPTGG29EshQAABBD6vQS1apVq3TPPffI7/crPj4+pHW2b9+uW2+9VYcOHVJ6erqkf5/B6dKli15++eUr6geXqAAAiD315hLVpY4fP65FixapV69eIYcbSfJ6vXI4HPrKV74SNH/RokVyu93q0KGDpk6dqpMnT1a7Db/fL5/PFzQBAAB7RTzgTJs2TUlJSWrevLkOHz6slStXhrzuF198oenTp2vs2LFBSW3cuHH6wx/+oM2bN+vpp5/WsmXLNGLEiGq3k5ubK5fLFZg8Hs+XqgkAANRvYV+iysnJ0cyZM2tss337dmVmZkqSjh07puPHj+vQoUOaOXOmXC6X3n77bTkcjhq3UVFRoZEjR+rw4cPavHlzjaei8vLylJmZqby8PHXr1q3Scr/fL7/fH3ju8/nk8Xi4RAUAQAwJ5xJV2AHn2LFjOnbsWI1tMjIy1KhRo0rzjxw5Io/Ho23btqlnz57Vrl9RUaFRo0bpwIED2rhxo5o3b17j/owxcjqdWrhwoUaPHl1rDdyDAwBA7Ann/Tvsn2pwu91yu91X1LGLWerSsymXuxhu9u3bp02bNtUabiRp7969qqioUGpq6hX1CwAA2CVi9+C8//77eu2117Rr1y4dOnRImzZt0tixY9W2bdugszft27fXihUrJEnnzp3T/fffrx07dmjRokU6f/68SktLVVpaqvLycklSQUGBnnnmGe3YsUOFhYVas2aNRo4cqa5du6p3796RKgcAAMSQiP3YZmJiopYvX67s7GydPn1aqampGjRokBYvXiyn0xlol5+fL6/XK+nfl7BWrVolSerSpUvQ9jZt2qS+ffsqISFBGzZs0CuvvKJTp07J4/Fo8ODBys7OVlxcXKTKAQAAMYSfauAeHAAAYkK9/B4cAACAukLAAQAA1iHgAAAA6xBwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWIeAAAADrEHAAAIB1CDgAAMA6BBwAAGAdAg4AALBOw2h3AACuBRnTVwceF84aHMWeANcGAs41gn9cQ3PpOEmMVW34u0Ik8HcVOsaqelyiAgAA1uEMDgDUAf53DdQthzHGRLsTdc3n88nlcsnr9So5OTna3QEAACEI5/2bS1QAAMA6BBwAAGAdAg4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdSIacIYNG6b09HQ1atRIqampeuCBB1RcXFzjOuPHj5fD4QiabrvttqA2fr9fjz32mNxut5KSkjRs2DAdOXIkkqUAAIAYEtGA069fPy1dulT5+flatmyZCgoKdP/999e63qBBg1RSUhKY1qxZE7R88uTJWrFihRYvXqx3331Xp06d0pAhQ3T+/PlIlQIAAGKIwxhj6mpnq1at0j333CO/36/4+Pgq24wfP16ff/65/vznP1e53Ov16vrrr9
fChQs1evRoSVJxcbE8Ho/WrFmjgQMH1toPn88nl8slr9er5OTkK64HAADUnXDev+vsHpzjx49r0aJF6tWrV7Xh5qLNmzerRYsWateunSZOnKiysrLAsry8PFVUVCgrKyswLy0tTR07dtS2bduq3J7f75fP5wuaAACAvSIecKZNm6akpCQ1b95chw8f1sqVK2tsf/fdd2vRokXauHGj5syZo+3bt+vOO++U3++XJJWWliohIUFNmzYNWq9ly5YqLS2tcpu5ublyuVyByePxXJ3iAABAvRR2wMnJyal0E/Dl044dOwLtf/SjH+mDDz7QunXrFBcXpwcffFA1XRUbPXq0Bg8erI4dO2ro0KFau3atPvnkE61evbrGfhlj5HA4qlw2Y8YMeb3ewFRUVBRu2QAAIIY0DHeFSZMmacyYMTW2ycjICDx2u91yu91q166dvv71r8vj8ei9995Tz549Q9pfamqqWrdurX379kmSUlJSVF5erhMnTgSdxSkrK1OvXr2q3IbT6ZTT6QxpfwAAIPaFHXAuBpYrcfHMzcXLTaH47LPPVFRUpNTUVElS9+7dFR8fr/Xr12vUqFGSpJKSEu3Zs0ezZ8++on4BAAC7ROwenPfff1+vvfaadu3apUOHDmnTpk0aO3as2rZtG3T2pn379lqxYoUk6dSpU5o6dar+53/+R4WFhdq8ebOGDh0qt9ute++9V5Lkcrk0YcIETZkyRRs2bNAHH3yg73znO+rUqZMGDBgQqXIAAEAMCfsMTqgSExO1fPlyZWdn6/Tp00pNTdWgQYO0ePHioMtF+fn58nq9kqS4uDjt3r1bv/vd7/T5558rNTVV/fr105IlS9SkSZPAOi+99JIaNmyoUaNG6ezZs+rfv7/efPNNxcXFRaocAAAQQ+r0e3Dqi0h+D07G9P+7Gbpw1uCrum3bMFahY6xCd+lYSYxXbfjbCh1jFbpIjVW9/B4cAACAukLAAQAA1uESFT/VAABATOASFQAAuKYRcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWIeAAAADrEHAAAIB1CDgAAMA6BBwAAGAdAg4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoNo90B22RMXx14XDhrcBR7Uv8xVqFjrELHWIVu9Bvb9P8dPBF4znjVjL+t0NWHseIMDgBco3YUnqi9ERCjCDgAcI3KzGga7S4AEeMwxphod6Ku+Xw+uVwueb1eJScnR7s7AAAgBOG8f3MGBwAAWCeiAWfYsGFKT09Xo0aNlJqaqgceeEDFxcU1ruNwOKqcfv7znwfa9O3bt9LyMWPGRLIUAAAQQyIacPr166elS5cqPz9fy5YtU0FBge6///4a1ykpKQmafvvb38rhcOi+++4Lajdx4sSgdm+88UYkSwEAADEkoh8T/+EPfxh43Lp1a02fPl333HOPKioqFB8fX+U6KSkpQc9Xrlypfv366Wtf+1rQ/MaNG1dqCwAAINXhPTjHjx/XokWL1KtXr2rDzeWOHj2q1atXa8KECZWWLVq0SG63Wx06dNDUqVN18uTJarfj9/vl8/mCJgAAYK+IB5xp06YpKSlJzZs31+HDh7Vy5cqQ112wYIGaNGmiESNGBM0fN26c/vCHP2jz5s16+umntWzZskptLpWbmyuXyxWYPB7PFdcDAADqv7A/Jp6Tk6OZM2fW2Gb79u3KzMyUJB07dkzHjx/XoUOHNHPmTLlcLr399ttyOBy17qt9+/a66667NHfu3Brb5eXlKTMzU3l5eerWrVul5X6/X36/P/Dc5/PJ4/HwMXEAAGJIOB8TDzvgHDt2TMeOHauxTUZGhho1alRp/pEjR+TxeLRt2zb17Nmzxm384x//0B133KFdu3bp5ptvrrGtMUZOp1MLFy7U6N
Gja62B78EBACD2hPP+HfZNxm63W263+4o6djFLXXo2pTrz5s1T9+7daw03krR3715VVFQoNTX1ivoFAADsErF7cN5//3299tpr2rVrlw4dOqRNmzZp7Nixatu2bdDZm/bt22vFihVB6/p8Pv3xj3/Uww8/XGm7BQUFeuaZZ7Rjxw4VFhZqzZo1GjlypLp27arevXtHqhwAABBDIhZwEhMTtXz5cvXv31833XSTHnroIXXs2FFbtmyR0+kMtMvPz5fX6w1ad/HixTLG6Nvf/nal7SYkJGjDhg0aOHCgbrrpJj3++OPKysrSO++8o7i4uEiVAwAAYgi/RcU9OAAAxAR+iwoAAFzTCDgAAMA6BBwAAGAdAg4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArNMw2h1A5GVMXx14PGdkZ93X3RPF3tRvl45V4azBUexJbGC8QvfRkc/17v5juv0Gtzq3+kq0u1Ov8XcVOsaqepzBucas/LA42l0ArknDXtuq2X/N17DXtka7K8A1gYBzjRl+c1q0uwAAQMQ5jDEm2p2oaz6fTy6XS16vV8nJydHuDoBrAJcSgC8vnPdv7sEBgDpAqAHqFpeoAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWIeAAAADrEHAAAIB1CDgAAMA6BBwAAGAdAg4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHXqJOD4/X516dJFDodDu3btqrGtMUY5OTlKS0tTYmKi+vbtq71791ba3mOPPSa3262kpCQNGzZMR44ciWAFAAAgltRJwHnyySeVlpYWUtvZs2frxRdf1Guvvabt27crJSVFd911l06ePBloM3nyZK1YsUKLFy/Wu+++q1OnTmnIkCE6f/58pEoAAAAxJOIBZ+3atVq3bp1eeOGFWtsaY/Tyyy/rxz/+sUaMGKGOHTtqwYIFOnPmjH7/+99Lkrxer+bNm6c5c+ZowIAB6tq1q9566y3t3r1b77zzTqTLAQAAMSCiAefo0aOaOHGiFi5cqMaNG9fa/uDBgyotLVVWVlZgntPpVJ8+fbRt2zZJUl5enioqKoLapKWlqWPHjoE2l/P7/fL5fEETAACwV8QCjjFG48eP1yOPPKLMzMyQ1iktLZUktWzZMmh+y5YtA8tKS0uVkJCgpk2bVtvmcrm5uXK5XIHJ4/GEWw4AAIghYQecnJwcORyOGqcdO3Zo7ty58vl8mjFjRtidcjgcQc+NMZXmXa6mNjNmzJDX6w1MRUVFYfcJAADEjobhrjBp0iSNGTOmxjYZGRl69tln9d5778npdAYty8zM1Lhx47RgwYJK66WkpEj691ma1NTUwPyysrLAWZ2UlBSVl5frxIkTQWdxysrK1KtXryr743Q6K/UDAADYK+yA43a75Xa7a2336quv6tlnnw08Ly4u1sCBA7VkyRL16NGjynXatGmjlJQUrV+/Xl27dpUklZeXa8uWLXr++eclSd27d1d8fLzWr1+vUaNGSZJKSkq0Z88ezZ49O9xyAACAhcIOOKFKT08Pen7ddddJktq2batWrVoF5rdv3165ubm699575XA4NHnyZD333HO68cYbdeONN+q5555T48aNNXbsWEmSy+XShAkTNGXKFDVv3lzNmjXT1KlT1alTJw0YMCBS5QAAgBgSsYATqvz8fHm93sDzJ598UmfPntUPfvADnThxQj169NC6devUpEmTQJuXXnpJDRs21KhRo3T27Fn1799fb775puLi4qJRQr2XMX114HHhrMFR7En9x1iFh/EKHWMVOsYqdIxV9eos4GRkZMgYU2n+5fMcDodycnKUk5NT7bYaNWqkuXPnau7cuVe7mwAAwAL8FhUAALCOw1R1WsVyPp9PLpdLXq9XycnJ0e4OAAAIQTjv35zBAQAA1iHgAAAA6xBwAA
CAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWIeAAAADrEHAAAIB1CDgAAMA6BBwAAGAdAg4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6zSMdgdw7cqYvjrwuHDW4Cj2BABqx79ZsYWAA8QA/mEN3aVjNWdkZ93X3RPF3tR//G3BVlyiAmCtlR8WR7sLAKKEMziIGv63iEgbfnNatLsAi/BvVmxxGGNMtDtR13w+n1wul7xer5KTk6PdHQAAEIJw3r+5RAUAAKxDwAEAANapk4Dj9/vVpUsXORwO7dq1q9p2FRUVmjZtmjp16qSkpCSlpaXpwQcfVHFx8I2Cffv2lcPhCJrGjBkT4SoAAECsqJOA8+STTyotrfab/c6cOaOdO3fq6aef1s6dO7V8+XJ98sknGjZsWKW2EydOVElJSWB64403ItF1AAAQgyL+Kaq1a9dq3bp1WrZsmdauXVtjW5fLpfXr1wfNmzt3rm699VYdPnxY6enpgfmNGzdWSkpKRPoMAABiW0TP4Bw9elQTJ07UwoUL1bhx4yvahtfrlcPh0Fe+8pWg+YsWLZLb7VaHDh00depUnTx5stpt+P1++Xy+oAkAANgrYmdwjDEaP368HnnkEWVmZqqwsDDsbXzxxReaPn26xo4dG/RxsHHjxqlNmzZKSUnRnj17NGPGDH344YeVzv5clJubq5kzZ15pKQAAIMaE/T04OTk5tYaF7du3a9u2bVqyZIn+/ve/Ky4uToWFhWrTpo0++OADdenSpdb9VFRUaOTIkTp8+LA2b95c4+fd8/LylJmZqby8PHXr1q3Scr/fL7/fH3ju8/nk8Xj4HhwAAGJION+DE3bAOXbsmI4dO1Zjm4yMDI0ZM0Z/+ctf5HA4AvPPnz+vuLg4jRs3TgsWLKh2/YqKCo0aNUoHDhzQxo0b1bx58xr3Z4yR0+nUwoULNXr06Fpr4Iv+AACIPeG8f4d9icrtdsvtdtfa7tVXX9Wzzz4beF5cXKyBAwdqyZIl6tGjR7XrXQw3+/bt06ZNm2oNN5K0d+9eVVRUKDU1NbQiAACA1SJ2D86ln3iSpOuuu06S1LZtW7Vq1Sowv3379srNzdW9996rc+fO6f7779fOnTv19ttv6/z58yotLZUkNWvWTAkJCSooKNCiRYv0rW99S263W//85z81ZcoUde3aVb17945UOQAAIIZE/cc28/Pz5fV6JUlHjhzRqlWrJKnSfTqbNm1S3759lZCQoA0bNuiVV17RqVOn5PF4NHjwYGVnZysuLq6uuw8AAOohfmyTe3AAAIgJ/NgmAAC4phFwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWIeAAAADrEHAAAIB1CDgAAMA6BBwAAGAdAg4AALBOw2h3AKhvMqavDjwunDU4ij2p/xir0DFWoWOscDVwBgcAAFiHgAMAAKzjMMaYaHeirvl8PrlcLnm9XiUnJ0e7OwAAIAThvH9zBgcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOgQcAABgHQIOAACwDgEHAABYh4ADAACsQ8ABAADWqZOA4/f71aVLFzkcDu3atavGtuPHj5fD4Qiabrvttkrbe+yxx+R2u5WUlKRhw4bpyJEjEawAAADEkjoJOE8++aTS0tJCbj9o0CCVlJQEpjVr1gQtnzx5slasWKHFixfr3Xff1alTpzRkyBCdP3/+ancdAADEoIaR3sHatWu1bt06LVu2TGvXrg1pHafTqZSUlCqXeb1ezZs3TwsXLtSAAQMkSW+99ZY8Ho/eeecdDRw48Kr1HQAAxKaInsE5evSoJk6cqIULF6px48Yhr7
d582a1aNFC7dq108SJE1VWVhZYlpeXp4qKCmVlZQXmpaWlqWPHjtq2bVuV2/P7/fL5fEETAACwV8QCjjFG48eP1yOPPKLMzMyQ17v77ru1aNEibdy4UXPmzNH27dt15513yu/3S5JKS0uVkJCgpk2bBq3XsmVLlZaWVrnN3NxcuVyuwOTxeK68MAAAUO+FHXBycnIq3QR8+bRjxw7NnTtXPp9PM2bMCGv7o0eP1uDBg9WxY0cNHTpUa9eu1SeffKLVq1fXuJ4xRg6Ho8plM2bMkNfrDUxFRUVh9QkAAMSWsO/BmTRpksaMGVNjm4yMDD377LN677335HQ6g5ZlZmZq3LhxWrBgQUj7S01NVevWrbVv3z5JUkpKisrLy3XixImgszhlZWXq1atXldtwOp2V+gEAAOwVdsBxu91yu921tnv11Vf17LPPBp4XFxdr4MCBWrJkiXr06BHy/j777DMVFRUpNTVVktS9e3fFx8dr/fr1GjVqlCSppKREe/bs0ezZs8OsBogNGdP/7wxm4azBUexJ/cdYhYfxgq0i9imq9PT0oOfXXXedJKlt27Zq1apVYH779u2Vm5ure++9V6dOnVJOTo7uu+8+paamqrCwUE899ZTcbrfuvfdeSZLL5dKECRM0ZcoUNW/eXM2aNdPUqVPVqVOnwKeqAADAtS3iHxOvTX5+vrxeryQpLi5Ou3fv1u9+9zt9/vnnSk1NVb9+/bRkyRI1adIksM5LL72khg0batSoUTp79qz69++vN998U3FxcdEqAwAA1CMOY4yJdifqms/nk8vlktfrVXJycrS7AwAAQhDO+ze/RQUAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYB0CDgAAsA4BBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4AADAOg2j3YFouPgD6j6fL8o9AQAAobr4vn3xfbwm12TAOXnypCTJ4/FEuScAACBcJ0+elMvlqrGNw4QSgyxz4cIFFRcXq0mTJnI4HBHbj8/nk8fjUVFRkZKTkyO2n/riWqtXuvZqvtbqla69mqnXfrFcszFGJ0+eVFpamho0qPkum2vyDE6DBg3UqlWrOttfcnJyzP0RfRnXWr3StVfztVavdO3VTL32i9WaaztzcxE3GQMAAOsQcAAAgHUIOBHkdDqVnZ0tp9MZ7a7UiWutXunaq/laq1e69mqmXvtdKzVfkzcZAwAAu3EGBwAAWIeAAwAArEPAAQAA1iHgAAAA6xBwAACAdQg4kn7xi1+oc+fOgW917Nmzp9auXRtYPn78eDkcjqDptttuCyw/fvy4HnvsMd10001q3Lix0tPT9fjjj8vr9da67//+7/9WmzZt1KhRI3Xv3l3/+Mc/gpYbY5STk6O0tDQlJiaqb9++2rt3b0zWm5ubq1tuuUVNmjRRixYtdM899yg/Pz+oTW37jrWac3JyKm03JSUlqI1Nr3FGRkal7TocDj366KMh7zsa9UrS97//fbVt21aJiYm6/vrrNXz4cH388ce17jsax3A0a47WcRytemP1GL7SeqN1DEeEgVm1apVZvXq1yc/PN/n5+eapp54y8fHxZs+ePcYYY7773e+aQYMGmZKSksD02WefBdbfvXu3GTFihFm1apXZv3+/2bBhg7nxxhvNfffdV+N+Fy9ebOLj482vf/1r889//tM88cQTJikpyRw6dCjQZtasWaZJkyZm2bJlZvfu3Wb06NEmNTXV+Hy+mKt34MCBZv78+WbPnj1m165dZvDgwSY9Pd2cOnUq0Ka2fcdazdnZ2aZDhw5B2y0rKwtqY9NrXFZWFrTN9evXG0lm06ZNgTaReI2/bL3GGPPGG2+YLVu2mIMHD5q8vDwzdOhQ4/F4zLlz56rdb7SO4WjWHK3jOFr1xuoxfKX1RusYjgQCTjWaNm1qfvOb3xhj/v1iDh8+PKz1ly5dahISEkxFRUW1bW699VbzyCOPBM1r3769mT59ujHGmA
sXLpiUlBQza9aswPIvvvjCuFwu88tf/jKs/tSmLuq9XFlZmZFktmzZEph3Jfu+UnVRc3Z2trn55purXW77a/zEE0+Ytm3bmgsXLgTm1dVr/GXr/fDDD40ks3///mrb1Kdj2Ji6qfly0TyO66Jem47hK3l9o3kMf1lcorrM+fPntXjxYp0+fVo9e/YMzN+8ebNatGihdu3aaeLEiSorK6txO16vV8nJyWrYsOrfMy0vL1deXp6ysrKC5mdlZWnbtm2SpIMHD6q0tDSojdPpVJ8+fQJtvqy6qre6dSSpWbNmQfPD3Xe46rrmffv2KS0tTW3atNGYMWN04MCBwDKbX+Py8nK99dZbeuihh+RwOIKWRfI1vhr1nj59WvPnz1ebNm3k8XiqbFNfjmGp7mquSjSO47qu14Zj+Epe32gdw1dNtBNWffHRRx+ZpKQkExcXZ1wul1m9enVg2eLFi83bb79tdu/ebVatWmVuvvlm06FDB/PFF19Uua1jx46Z9PR08+Mf/7ja/X366adGktm6dWvQ/J/97GemXbt2xhhjtm7daiSZTz/9NKjNxIkTTVZW1pWWaoyp+3ovd+HCBTN06FBz++23B80Pd9/hiEbNa9asMX/605/MRx99ZNavX2/69OljWrZsaY4dO2aMsfs1XrJkiYmLi6tUW6Re46tR7+uvv26SkpKMJNO+ffsa/6cb7WPYmLqv+XJ1fRxHo95YP4a/zOtb18fw1UbA+f/5/X6zb98+s337djN9+nTjdrvN3r17q2xbXFxs4uPjzbJlyyot83q9pkePHmbQoEGmvLy82v1d/Mdx27ZtQfOfffZZc9NNNxlj/u/AKS4uDmrz8MMPm4EDB4ZbYpC6rvdyP/jBD0zr1q1NUVFRje1q2ne4ol2zMcacOnXKtGzZ0syZM8cYY/drnJWVZYYMGVJru6v1Gl+Nej///HPzySefmC1btpihQ4eabt26mbNnz1a5jWgfw8bUfc2Xq+vjONr1GhN7x/CXqbeuj+GrjYBTjf79+5vvfe971S6/4YYbgq65GmOMz+czPXv2NP3796/1D8jv95u4uDizfPnyoPmPP/64ueOOO4wxxhQUFBhJZufOnUFthg0bZh588MFwyqlVpOu91KRJk0yrVq3MgQMHQmpf1b6vhrqs+VIDBgwI3Ldh62tcWFhoGjRoYP785z+H1D4Sr/GV1Hspv99vGjdubH7/+99Xu7w+HcPGRL7mS9WH47gu671ULB3Dlwqn3vpwDH9Z3INTDWOM/H5/lcs+++wzFRUVKTU1NTDP5/MpKytLCQkJWrVqlRo1alTj9hMSEtS9e3etX78+aP769evVq1cvSVKbNm2UkpIS1Ka8vFxbtmwJtLlaIl3vxX1MmjRJy5cv18aNG9WmTZta16lq31dLXdR8Ob/fr//93/8NbNe21/ii+fPnq0WLFho8eHCtbSP1Godbb7jbqG/HcG39vRo1X1xeX47juqj3crF0DIe7jUvVh2P4S4tGqqpvZsyYYf7+97+bgwcPmo8++sg89dRTpkGDBmbdunXm5MmTZsqUKWbbtm3m4MGDZtOmTaZnz57mq1/9auAjgD6fz/To0cN06tTJ7N+/P+ijc5d+HO/OO+80c+fODTy/+BHTefPmmX/+859m8uTJJikpyRQWFgbazJo1y7hcLrN8+XKze/du8+1vf/tLf/wwWvX+x3/8h3G5XGbz5s1B65w5c8YYY0Lad6zVPGXKFLN582Zz4MAB895775khQ4aYJk2aWPsaG2PM+fPnTXp6upk2bVqlfkXqNf6y9RYUFJjnnnvO7Nixwxw6dMhs27bNDB8+3DRr1swcPXq02nqjdQxHs+ZoHcfRqjdWj+ErrdeY6BzDkUDAMcY89NBDpnXr1iYhIcFcf/31pn///mbdunXGGGPOnDljsrKyzPXXX2/i4+NNenq6+e53v2sOHz4cWH/Tpk1GUpXTwYMHA+1at25tsrOzg/b9+uuvB/bdrVu3oI9aGv
Pvm/iys7NNSkqKcTqd5o477jC7d++OyXqrW2f+/Pkh7zvWar74fRjx8fEmLS3NjBgxotI1dJteY2OM+dvf/mYkmfz8/Er9itRr/GXr/fTTT83dd99tWrRoYeLj402rVq3M2LFjzccffxy0n/pyDEez5mgdx9GqN1aP4S/zNx2NYzgSHMYYE8kzRAAAAHWNe3AAAIB1CDgAAMA6BBwAAGAdAg4AALAOAQcAAFiHgAMAAKxDwAEAANYh4AAAAOsQcAAAgHUIOAAAwDoEHAAAYJ3/B6FEIRJUNX7LAAAAAElFTkSuQmCC", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "%%time\n", + "# Visualize all of the unique dates, one at a time.\n", + "for dt in unique_dates:\n", + " fig = plt.figure()\n", + " tmpdf = df[df[\"ut_datetime\"].dt.date == parser.parse(\"2019-08-28\").date()]\n", + " plt.scatter(*zip(*tmpdf[\"center_coord\"]), s=1, alpha=0.5)\n", + " plt.title(f\"{dt}\")\n", + "del tmpdf" + ] + }, + { + "cell_type": "markdown", + "id": "337ceedc", + "metadata": {}, + "source": [ + "# Recap and Master Function\n", + "Here is a master function that takes a repo_path and returns \\\n", + "(1) a Pandas dataframe with needed info, and\\\n", + "(2) a dictionary with the images in discrete piles (sets)." + ] + }, + { + "cell_type": "code", + "execution_count": 634, + "id": "fccdee6b", + "metadata": {}, + "outputs": [], + "source": [ + "def retrieve_image_sets(\n", + " repo_path,\n", + " basedir=\"default\",\n", + " desired_datasetTypes=[\"deepDiff_differenceExp\"],\n", + " overwrite=False,\n", + " overlap_uncertainty_radius_arcsec=30,\n", + "):\n", + " \"\"\"2/6/2024 COC\"\"\"\n", + " import lsst\n", + " import lsst.daf.butler as dafButler\n", + " import os\n", + " import time\n", + " from matplotlib import pyplot as plt\n", + " import progressbar\n", + " from concurrent.futures import ProcessPoolExecutor, as_completed\n", + " from astropy.time import Time # for converting Butler visitInfo.date (TAI) to UTC strings\n", + " from astropy import units as u\n", + " import pandas as pd\n", + " import pickle\n", + " from dateutil import parser\n", + "\n", + " if basedir == \"default\":\n", + " basedir = f'{os.environ[\"HOME\"]}/kbmod_tmp'\n", + " print(f'Changing \"default\" basedir to {basedir} now.')\n", + "\n", + " os.makedirs(basedir, exist_ok=True)\n", + "\n", + " # repo_path = f\"/epyc/users/smotherh/DEEP/PointingGroups/butler-repo\"\n", + " butler = dafButler.Butler(repo_path)\n", + "\n", + " all_collection_names = get_collection_names(butler=butler, 
basedir=basedir, verbose=True, export=True)\n", + " desired_collections = get_desired_collections(all_collections_list=all_collection_names)\n", + " # datasetTypes = getDatasetTypeStats(butler=butler, overwrite=False) # not used 2/6/2024 COC\n", + " # desired_datasetTypes = [\"deepDiff_differenceExp\"]\n", + " df, example_vdr_ref = get_vdr_data(\n", + " butler=butler, desired_collections=desired_collections, desired_datasetTypes=desired_datasetTypes\n", + " )\n", + " desired_instruments = getInstruments(butler=butler, vdr_ids=df[\"data_id\"])\n", + " df[\"uri\"] = getURIs(\n", + " butler=butler,\n", + " dataIds=df[\"data_id\"],\n", + " repo_path=repo_path,\n", + " desired_datasetTypes=desired_datasetTypes,\n", + " desired_collections=desired_collections,\n", + " overwrite=overwrite,\n", + " )\n", + "\n", + " df[\"ut\"] = getTimestamps(dataIds=df[\"data_id\"], overwrite=overwrite)\n", + " df[\"ut_datetime\"] = pd.to_datetime(df[\"ut\"])\n", + " overlapping_sets = find_overlapping_coords(\n", + " df=df, uncertainty_radius=overlap_uncertainty_radius_arcsec, overwrite=overwrite\n", + " )\n", + " return df, overlapping_sets" + ] + }, + { + "cell_type": "code", + "execution_count": 638, + "id": "cf221f77", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Changing \"default\" basedir to /astro/users/coc123/kbmod_tmp now.\n", + "Found 1292 collections in the Butler. Wrote to \"/astro/users/coc123/kbmod_tmp/all_collection_names.lst\".\n", + "Found DECam. 
Adding to \"desired_instruments\" now.\n", + "WARNING: we are not iterating over all rows to find instruments, just taking the first one.\n", + "Recycled 47383 paths from /astro/users/coc123/kbmod_tmp/uri_cache.lst as overwrite was False.\n", + "Overwrite is False, so we will read the timestamps from file now...\n", + "Recycled 47383 from /astro/users/coc123/kbmod_tmp/vdr_timestamps.lst.\n", + "Recycling /astro/users/coc123/kbmod_tmp/overlapping_sets.pickle as overwrite=False.\n", + "CPU times: user 3.91 s, sys: 413 ms, total: 4.32 s\n", + "Wall time: 5.54 s\n" + ] + } + ], + "source": [ + "%%time\n", + "# TIMING NOTE: this requires about 7 seconds to run ***with everything already cached***.\n", + "df1, overlapping_sets1 = retrieve_image_sets(\n", + " repo_path=f\"/epyc/users/smotherh/DEEP/PointingGroups/butler-repo\"\n", + ")" + ] + }, + { + "cell_type": "markdown", + "id": "3df17bc4", + "metadata": {}, + "source": [ + "# Next Steps\n", + "\n", + "In no particular order:\n", + "\n", + "1. User-specified (RA, Dec) pair.\n", + "2. Heat map / histogrammed results.\n", + "3. Sky patches approach.\n", + "4. Reflex correction." 
+ ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "LSST w_2022_06", + "language": "python", + "name": "opt_lsst_w_2022_06" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.18" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/region_search/coc/RegionSearchTesting.ipynb b/notebooks/region_search/coc/RegionSearchTesting.ipynb new file mode 100644 index 000000000..4fd1681be --- /dev/null +++ b/notebooks/region_search/coc/RegionSearchTesting.ipynb @@ -0,0 +1,973 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "ab967f8a-b2eb-4af9-9b28-3552c80f2801", + "metadata": {}, + "outputs": [], + "source": [ + "# NOTE: must do this before launching Jupyter Notebook!\n", + "# (1) source setupLSST.zsh\n", + "# (2) run the demodata/pipeline_check setup -r .\n", + "# (3) run the setup -r . 
for rc2_subset" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "71fb6969-878e-48d3-901b-47468694bfbb", + "metadata": {}, + "outputs": [], + "source": [ + "from lsst.daf.butler import Butler\n", + "import os\n", + "import time\n", + "from lsst import sphgeom" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "2c3dcb5d-8bf6-4073-b332-70342da9a847", + "metadata": {}, + "outputs": [], + "source": [ + "repo_path = os.path.join(os.environ[\"RC2_SUBSET_DIR\"], \"SMALL_HSC\")\n", + "butler = Butler(repo_path)\n", + "registry = butler.registry\n", + "# collection = f\"u/{os.environ['USER']}/single_frame\"\n", + "# d = butler.registry.queryDatasets('calexp', physical_filter='HSC-R', collections=collection, instrument='HSC')\n", + "# calexp = butler.get('calexp', visit=23718, detector=41, collections=collection, instrument='HSC')\n", + "# calexp.visitInfo.boresightRaDec" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "2f94e6a3-d7b4-45b0-9ba5-6a784559f604", + "metadata": {}, + "outputs": [], + "source": [ + "collection = f\"u/{os.environ['USER']}/single_frame\"\n", + "# vdr = butler.registry.queryDimensionRecords(\"visit_detector_region\")\n", + "# vdr = butler.registry.queryDimensionRecords(\"visit_detector_region\", collections=collection)\n", + "vdr = butler.registry.queryDimensionRecords(\n", + " \"visit_detector_region\",\n", + " datasets=\"calexp\",\n", + " collections=collection,\n", + " instrument=\"HSC\",\n", + " physical_filter=\"HSC-R\",\n", + ") # more specific, just the calex stuff" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "3c65104b-fd14-4344-9b62-7c4eea2485d5", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "First VDR record:\n", + "{instrument: 'HSC', detector: 41, visit: 1204}\n", + "ConvexPolygon([UnitVector3d(-0.8685370178854345, 0.49439163180184836, 0.03493369386397754), UnitVector3d(-0.8684746456459038, 
0.4943508977169074, 0.036999726981556666), UnitVector3d(-0.8665881263897214, 0.4976505625849847, 0.036999145384733166), UnitVector3d(-0.8666527966506773, 0.4976875474603122, 0.03492900171060283)])\n" + ] + } + ], + "source": [ + "print(f\"First VDR record:\")\n", + "for i in vdr:\n", + " first_vdr_rec = i\n", + " break\n", + "print(first_vdr_rec.dataId) # {instrument: 'HSC', detector: 41, visit: 1204}\n", + "print(\n", + " first_vdr_rec.region\n", + ") # ConvexPolygon([UnitVector3d(-0.8685370178854345, 0.49439163180184836, 0.03493369386397754), UnitVector3d(-0.8684746456459038, 0.4943508977169074, 0.036999726981556666), UnitVector3d(-0.8665881263897214, 0.4976505625849847, 0.036999145384733166), UnitVector3d(-0.8666527966506773, 0.4976875474603122, 0.03492900171060283)])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "83e23099-2e0f-4e35-81c3-c64b05e77a24", + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "9ce47103-6350-47b0-a91d-369180706388", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Last VDR record:\n", + "{instrument: 'HSC', detector: 58, visit: 23718}\n", + "ConvexPolygon([UnitVector3d(-0.8652234119418918, 0.49972867464192744, 0.04073940559524716), UnitVector3d(-0.8652923227482628, 0.4997734451226977, 0.03867427753825506), UnitVector3d(-0.8671859739320048, 0.49648028531881305, 0.03867574052749735), UnitVector3d(-0.8671146883772648, 0.4964392228880602, 0.04074573816606947)])\n" + ] + } + ], + "source": [ + "print(f\"Last VDR record:\")\n", + "for i in vdr:\n", + " last_vdr_rec = i\n", + "print(last_vdr_rec.dataId) # {instrument: 'HSC', detector: 58, visit: 23718}\n", + "print(\n", + " last_vdr_rec.region\n", + ") # ConvexPolygon([UnitVector3d(-0.8652234119418918, 0.49972867464192744, 0.04073940559524716), UnitVector3d(-0.8652923227482628, 0.4997734451226977, 0.03867427753825506), UnitVector3d(-0.8671859739320048, 
0.49648028531881305, 0.03867574052749735), UnitVector3d(-0.8671146883772648, 0.4964392228880602, 0.04074573816606947)])" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "5894c666-be1b-474e-86b4-0f16009b0415", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "first_vdr_rec.region.contains(first_vdr_rec.region) = True\n", + "first_vdr_rec.region.contains(last_vdr_rec.region) = False\n" + ] + } + ], + "source": [ + "# silly test first\n", + "print(\n", + " f\"first_vdr_rec.region.contains(first_vdr_rec.region) = {first_vdr_rec.region.contains(first_vdr_rec.region)}\"\n", + ") # should be True!!\n", + "print(\n", + " f\"first_vdr_rec.region.contains(last_vdr_rec.region) = {first_vdr_rec.region.contains(last_vdr_rec.region)}\"\n", + ") # False" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "060b973b-5591-42ba-ae65-5bf1e4c4f825", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Checking matches of first_vdr.region against all records region for matchces...\n", + "There were 1 matches:\n", + "{instrument: 'HSC', detector: 41, visit: 1204}\n" + ] + } + ], + "source": [ + "print(f\"Checking matches of first_vdr.region against all records region for matchces...\")\n", + "matches = []\n", + "for vdr_rec in vdr:\n", + " if vdr_rec.region.contains(first_vdr_rec.region):\n", + " matches.append(vdr_rec.dataId)\n", + "print(f\"There were {len(matches)} matches:\")\n", + "for i in matches:\n", + " print(i)" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "507ce759-1e30-4be7-ac44-fbc434d8e753", + "metadata": {}, + "outputs": [], + "source": [ + "# TODO: find all corners, and double-check the overlap 11/16/2023 COC\n", + "# HSC/calib/gen2/20180117" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "09020453-1b37-4538-9aaf-a725bc979858", + "metadata": {}, + "outputs": [], + "source": [ + "# datasetRefs = 
registry.queryDatasets(datasetType='calexp', collections='HSC/calib/gen2/20180117')" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "1e34d83b-eb07-4e2d-961c-8e9e47355ab2", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "calexp@{instrument: 'HSC', detector: 41, visit: 1204, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=4d673e07-c749-4d80-9dcf-b39615a802a4)\n", + "calexp@{instrument: 'HSC', detector: 41, visit: 1206, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=9f3ea177-6daa-4e00-9bcb-8b0616c9b855)\n", + "calexp@{instrument: 'HSC', detector: 41, visit: 1214, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=b3965daf-39b4-43f1-a1ac-49f6dd399c6f)\n", + "calexp@{instrument: 'HSC', detector: 41, visit: 1220, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=b65a71c7-6c0f-476d-9c52-4c93e4d8b12a)\n", + "calexp@{instrument: 'HSC', detector: 41, visit: 23694, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=bef09c5b-3fb5-49c2-80d1-327bc1120fd2)\n", + "calexp@{instrument: 'HSC', detector: 41, visit: 23704, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=f061d55c-64a5-4d74-8ce2-3eb822c6ffbd)\n", + "calexp@{instrument: 'HSC', detector: 41, visit: 23706, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=4a509cbe-f46a-46e6-85bc-f3274dd59524)\n", + "calexp@{instrument: 'HSC', detector: 41, visit: 23718, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=91b1f763-f776-42f4-a474-5ff3492acc0b)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 1204, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=87055aa3-9e11-4d64-b2ed-e0233c24c403)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 1206, ...} [sc=ExposureF] 
(run=u/colinchandler/single_frame/20231110T234552Z id=5b87e4f6-5a95-4a3b-af93-22c4b8c0e6e0)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 1214, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=945468ce-3d0e-4030-b823-dd1d5a532876)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 1220, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=9d42d8cd-a07b-4b1e-b0d8-79666a1464b9)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 23694, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=df6a6120-72d3-43b0-b392-a83fdaf69398)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 23704, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=096f41bd-4216-4424-9681-104fde395d2c)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 23706, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=aa208f29-6d2f-4d78-b940-3250c7c50fb7)\n", + "calexp@{instrument: 'HSC', detector: 42, visit: 23718, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=733f733e-6a8d-4125-89fd-45624e8c71bc)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 1204, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=07536c48-b4c8-4c32-961f-b6261015d417)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 1206, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=de2250b1-920a-47ff-bf17-41ee4bcdbb2c)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 1214, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=7f2fc43c-ae5c-434e-b738-d58677e028a1)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 1220, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=9140c30b-654e-4f46-9cfe-56ce57877d5d)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 23694, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z 
id=022f049f-7369-4514-9372-dbfd2fa764ef)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 23704, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=4aa4a48b-35d9-4979-a33a-7355c032942e)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 23706, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=56320e78-6121-4047-913a-6fe064cd16ab)\n", + "calexp@{instrument: 'HSC', detector: 47, visit: 23718, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=596b32cb-5e35-4257-b9c7-2b45fc36630f)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 1204, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=53963b41-b927-461d-bf0e-5986a0471ecb)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 1206, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=f66b0a47-4135-4fd7-a317-da8a8d1d6170)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 1214, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=e8774d73-3efa-4076-bac8-b84a59f6605b)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 1220, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=ae7dde19-9233-42ef-8f91-e6428511d660)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 23694, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=6b05023d-86cf-4e77-a9a8-7d8591fc195c)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 23704, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=199133f5-8823-4458-a20a-0dbfaa2bbc3e)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 23706, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=05e57fc0-4ef1-46f5-bb62-38a08b1c4201)\n", + "calexp@{instrument: 'HSC', detector: 49, visit: 23718, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=b24c2672-2512-4e65-9740-74022802f82c)\n", + "calexp@{instrument: 'HSC', detector: 50, 
visit: 1204, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=81e47e75-83c4-4341-9a07-c35a6cb38a9a)\n", + "calexp@{instrument: 'HSC', detector: 50, visit: 1206, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=2c3d592f-9bba-48e3-abac-80fc92a7283a)\n", + "calexp@{instrument: 'HSC', detector: 50, visit: 1214, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=4978031c-4bde-4f2f-ba4c-8069e4afac53)\n", + "calexp@{instrument: 'HSC', detector: 50, visit: 1220, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=064a52d4-68b1-4d12-b3e8-65fa945cb518)\n", + "calexp@{instrument: 'HSC', detector: 50, visit: 23694, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=a3e09cb0-3304-4a6b-9e5a-251b96c857c5)\n", + "calexp@{instrument: 'HSC', detector: 50, visit: 23704, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=b7bca4ff-a559-4f7f-9691-3b86368dbf28)\n", + "calexp@{instrument: 'HSC', detector: 50, visit: 23706, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=aa1ff092-2bd7-4d62-873d-5e5f82717b22)\n", + "calexp@{instrument: 'HSC', detector: 50, visit: 23718, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=c7b5bc6d-0991-494b-921b-76a0e9b7f2d3)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 1204, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=151a35cb-b254-4474-84d6-5c3004fe56c9)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 1206, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=1a827f6f-c666-4edd-88a5-0002524485b7)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 1214, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=51f76937-7f49-4157-aae7-fed4281e46a8)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 1220, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z 
id=1015b0f9-3470-4ab7-9dfa-729a9888db29)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 23694, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=f4256be0-f277-4a16-b656-5294017cd9a4)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 23704, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=010d7808-855d-4f6b-80ec-49bc460d8a6f)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 23706, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=b5fcbe18-caf0-4e6b-810d-b9c79a7cba16)\n", + "calexp@{instrument: 'HSC', detector: 58, visit: 23718, ...} [sc=ExposureF] (run=u/colinchandler/single_frame/20231110T234552Z id=784f36f1-98f3-4ecd-b35e-7bd04cecbdb7)\n" + ] + } + ], + "source": [ + "# using collection = f\"u/{os.environ['USER']}/single_frame\"\n", + "for ref in butler.registry.queryDatasets(\n", + " \"calexp\", physical_filter=\"HSC-R\", collections=collection, instrument=\"HSC\"\n", + "):\n", + " print(ref)\n", + "\n", + "for ref in butler.registry.queryDatasets(\n", + " \"calexp\", physical_filter=\"HSC-R\", collections=collection, instrument=\"HSC\"\n", + "):\n", + " first_dsr = ref\n", + " break" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "4351a801-39e1-405b-8d5c-add0da0933be", + "metadata": {}, + "outputs": [], + "source": [ + "# TODO do an example that spans filters and demonstrates .contains(), and also the one we have below with .intersects()." + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "eddd8177-8447-4f6c-92aa-f793351b3b2a", + "metadata": {}, + "outputs": [], + "source": [ + "# all_ds = [ ds for ds in registry.queryDatasets('calexp',collections=collection, instrument='HSC, physical_filter='HSC-R')]\n", + "# lol now it's the same as above. Result count this way is 48. 
Removing physical_filter and instrument results in 240.\n", + "# NOTE: there are 48 in the directory structure, as so from bash:\n", + "# find /Users/colinchandler/lsst_stack_w_2023_44/rc2_subset/SMALL_HSC/u/colinchandler/single_frame/20231110T234552Z/calexp -name \\*HSC-R\\*.fits" + ] + }, + { + "cell_type": "code", + "execution_count": 48, + "id": "8dc71a26-ca04-476d-8580-7862f8d4f79d", + "metadata": {}, + "outputs": [], + "source": [ + "dsq = registry.queryDatasets(\"calexp\", collections=collection, instrument=\"HSC\", physical_filter=\"HSC-R\")\n", + "dsrecords = [i for i in dsq] # 12/20/2023 COC\n", + "dataIds = [i.dataId for i in dsq]" + ] + }, + { + "cell_type": "code", + "execution_count": 64, + "id": "550bfd1a-c129-4e8e-812b-18dc5a5ff543", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{band: 'r', instrument: 'HSC', detector: 41, physical_filter: 'HSC-R', visit_system: 0, visit: 1204}" + ] + }, + "execution_count": 64, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dataIds[0].full" + ] + }, + { + "cell_type": "code", + "execution_count": 65, + "id": "bcf75eb3-0fd1-4327-a94d-aab20ac7bf98", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "DatasetRef(DatasetType('calexp', {band, instrument, detector, physical_filter, visit_system, visit}, ExposureF), {instrument: 'HSC', detector: 41, visit: 1204, ...}, run='u/colinchandler/single_frame/20231110T234552Z', id=4d673e07-c749-4d80-9dcf-b39615a802a4)" + ] + }, + "execution_count": 65, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dsrecords[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "id": "54f4ea99-6799-45b8-9dc5-3f12e1994fd6", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "UUID('4d673e07-c749-4d80-9dcf-b39615a802a4')" + ] + }, + "execution_count": 62, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# here we get unique IDs back from 
the butler 12/20/2023 COC\n", + "testid = dsrecords[0].id\n", + "testid" + ] + }, + { + "cell_type": "code", + "execution_count": 63, + "id": "b2258648-8939-4607-a408-331bc731f618", + "metadata": {}, + "outputs": [ + { + "ename": "UserExpressionSyntaxError", + "evalue": "Failed to parse user expression 'id=4d673e07-c749-4d80-9dcf-b39615a802a4'.", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mParseError\u001b[0m Traceback (most recent call last)", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/expressions/_predicate.py:136\u001b[0m, in \u001b[0;36mmake_string_expression_predicate\u001b[0;34m(string, dimensions, column_types, bind, data_id, defaults, dataset_type_name, allow_orphans)\u001b[0m\n\u001b[1;32m 135\u001b[0m parser \u001b[38;5;241m=\u001b[39m ParserYacc()\n\u001b[0;32m--> 136\u001b[0m tree \u001b[38;5;241m=\u001b[39m \u001b[43mparser\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mparse\u001b[49m\u001b[43m(\u001b[49m\u001b[43mstring\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 137\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mException\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m exc:\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/expressions/parser/parserYacc.py:270\u001b[0m, in \u001b[0;36mParserYacc.parse\u001b[0;34m(self, input, lexer, debug, tracking)\u001b[0m\n\u001b[1;32m 269\u001b[0m lexer \u001b[38;5;241m=\u001b[39m ParserLex\u001b[38;5;241m.\u001b[39mmake_lexer()\n\u001b[0;32m--> 270\u001b[0m tree \u001b[38;5;241m=\u001b[39m 
\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mparser\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mparse\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mlexer\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mlexer\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdebug\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdebug\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtracking\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mtracking\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 271\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m tree\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/expressions/parser/ply/yacc.py:349\u001b[0m, in \u001b[0;36mLRParser.parse\u001b[0;34m(self, input, lexer, debug, tracking, tokenfunc)\u001b[0m\n\u001b[1;32m 348\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 349\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mparseopt_notrack\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mlexer\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdebug\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtracking\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtokenfunc\u001b[49m\u001b[43m)\u001b[49m\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/expressions/parser/ply/yacc.py:1214\u001b[0m, in \u001b[0;36mLRParser.parseopt_notrack\u001b[0;34m(self, input, lexer, debug, tracking, tokenfunc)\u001b[0m\n\u001b[1;32m 1213\u001b[0m 
\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstate \u001b[38;5;241m=\u001b[39m state\n\u001b[0;32m-> 1214\u001b[0m tok \u001b[38;5;241m=\u001b[39m \u001b[43mcall_errorfunc\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43merrorfunc\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43merrtoken\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1215\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39merrorok:\n\u001b[1;32m 1216\u001b[0m \u001b[38;5;66;03m# User must have done some kind of panic\u001b[39;00m\n\u001b[1;32m 1217\u001b[0m \u001b[38;5;66;03m# mode recovery on their own. The\u001b[39;00m\n\u001b[1;32m 1218\u001b[0m \u001b[38;5;66;03m# returned token is the next lookahead\u001b[39;00m\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/expressions/parser/ply/yacc.py:202\u001b[0m, in \u001b[0;36mcall_errorfunc\u001b[0;34m(errorfunc, token, parser)\u001b[0m\n\u001b[1;32m 201\u001b[0m _restart \u001b[38;5;241m=\u001b[39m parser\u001b[38;5;241m.\u001b[39mrestart\n\u001b[0;32m--> 202\u001b[0m r \u001b[38;5;241m=\u001b[39m \u001b[43merrorfunc\u001b[49m\u001b[43m(\u001b[49m\u001b[43mtoken\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 203\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/expressions/parser/parserYacc.py:450\u001b[0m, in \u001b[0;36mParserYacc.p_error\u001b[0;34m(self, p)\u001b[0m\n\u001b[1;32m 449\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 450\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m ParseError(p\u001b[38;5;241m.\u001b[39mlexer\u001b[38;5;241m.\u001b[39mlexdata, 
p\u001b[38;5;241m.\u001b[39mvalue, p\u001b[38;5;241m.\u001b[39mlexpos, p\u001b[38;5;241m.\u001b[39mlineno)\n", + "\u001b[0;31mParseError\u001b[0m: Syntax error at or near 'd673e07' (line: 1, pos: 5)", + "\nThe above exception was the direct cause of the following exception:\n", + "\u001b[0;31mUserExpressionSyntaxError\u001b[0m Traceback (most recent call last)", + "Cell \u001b[0;32mIn[63], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m bulteridtest \u001b[38;5;241m=\u001b[39m \u001b[43mregistry\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mqueryDatasets\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mcalexp\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mcollections\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcollection\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mwhere\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;124;43mf\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mid=\u001b[39;49m\u001b[38;5;132;43;01m{\u001b[39;49;00m\u001b[43mtestid\u001b[49m\u001b[38;5;132;43;01m}\u001b[39;49;00m\u001b[38;5;124;43m'\u001b[39;49m\u001b[43m)\u001b[49m\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/_registry_shim.py:312\u001b[0m, in \u001b[0;36mRegistryShim.queryDatasets\u001b[0;34m(self, datasetType, collections, dimensions, dataId, where, findFirst, components, bind, check, **kwargs)\u001b[0m\n\u001b[1;32m 297\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mqueryDatasets\u001b[39m(\n\u001b[1;32m 298\u001b[0m \u001b[38;5;28mself\u001b[39m,\n\u001b[1;32m 299\u001b[0m datasetType: Any,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 310\u001b[0m ) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m DatasetQueryResults:\n\u001b[1;32m 311\u001b[0m \u001b[38;5;66;03m# Docstring inherited from a base class.\u001b[39;00m\n\u001b[0;32m--> 
312\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_registry\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mqueryDatasets\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 313\u001b[0m \u001b[43m \u001b[49m\u001b[43mdatasetType\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 314\u001b[0m \u001b[43m \u001b[49m\u001b[43mcollections\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcollections\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 315\u001b[0m \u001b[43m \u001b[49m\u001b[43mdimensions\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdimensions\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 316\u001b[0m \u001b[43m \u001b[49m\u001b[43mdataId\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdataId\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 317\u001b[0m \u001b[43m \u001b[49m\u001b[43mwhere\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mwhere\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 318\u001b[0m \u001b[43m \u001b[49m\u001b[43mfindFirst\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mfindFirst\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 319\u001b[0m \u001b[43m \u001b[49m\u001b[43mcomponents\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcomponents\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 320\u001b[0m \u001b[43m \u001b[49m\u001b[43mbind\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mbind\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 321\u001b[0m \u001b[43m \u001b[49m\u001b[43mcheck\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcheck\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 322\u001b[0m \u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 323\u001b[0m \u001b[43m \u001b[49m\u001b[43m)\u001b[49m\n", + "File 
\u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/sql_registry.py:2097\u001b[0m, in \u001b[0;36mSqlRegistry.queryDatasets\u001b[0;34m(self, datasetType, collections, dimensions, dataId, where, findFirst, components, bind, check, **kwargs)\u001b[0m\n\u001b[1;32m 2094\u001b[0m dimension_names\u001b[38;5;241m.\u001b[39mupdate(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdimensions\u001b[38;5;241m.\u001b[39mextract(dimensions)\u001b[38;5;241m.\u001b[39mnames)\n\u001b[1;32m 2095\u001b[0m \u001b[38;5;66;03m# Construct the summary structure needed to construct a\u001b[39;00m\n\u001b[1;32m 2096\u001b[0m \u001b[38;5;66;03m# QueryBuilder.\u001b[39;00m\n\u001b[0;32m-> 2097\u001b[0m summary \u001b[38;5;241m=\u001b[39m \u001b[43mqueries\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mQuerySummary\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 2098\u001b[0m \u001b[43m \u001b[49m\u001b[43mrequested\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mDimensionGraph\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdimensions\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mnames\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdimension_names\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2099\u001b[0m \u001b[43m \u001b[49m\u001b[43mcolumn_types\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_managers\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mcolumn_types\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2100\u001b[0m \u001b[43m \u001b[49m\u001b[43mdata_id\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdata_id\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2101\u001b[0m \u001b[43m 
\u001b[49m\u001b[43mexpression\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mwhere\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2102\u001b[0m \u001b[43m \u001b[49m\u001b[43mbind\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mbind\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2103\u001b[0m \u001b[43m \u001b[49m\u001b[43mdefaults\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdefaults\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdataId\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2104\u001b[0m \u001b[43m \u001b[49m\u001b[43mcheck\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcheck\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2105\u001b[0m \u001b[43m \u001b[49m\u001b[43mdatasets\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43m[\u001b[49m\u001b[43mparent_dataset_type\u001b[49m\u001b[43m]\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2106\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 2107\u001b[0m builder \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_makeQueryBuilder(summary)\n\u001b[1;32m 2108\u001b[0m \u001b[38;5;66;03m# Add the dataset subquery to the query, telling the QueryBuilder\u001b[39;00m\n\u001b[1;32m 2109\u001b[0m \u001b[38;5;66;03m# to include the rank of the selected collection in the results\u001b[39;00m\n\u001b[1;32m 2110\u001b[0m \u001b[38;5;66;03m# only if we need to findFirst. 
Note that if any of the\u001b[39;00m\n\u001b[1;32m 2111\u001b[0m \u001b[38;5;66;03m# collections are actually wildcard expressions, and\u001b[39;00m\n\u001b[1;32m 2112\u001b[0m \u001b[38;5;66;03m# findFirst=True, this will raise TypeError for us.\u001b[39;00m\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/_structs.py:384\u001b[0m, in \u001b[0;36mQuerySummary.__init__\u001b[0;34m(self, requested, column_types, data_id, expression, region, bind, defaults, datasets, order_by, limit, check)\u001b[0m\n\u001b[1;32m 382\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 383\u001b[0m dataset_type_name \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n\u001b[0;32m--> 384\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mwhere \u001b[38;5;241m=\u001b[39m \u001b[43mQueryWhereClause\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mcombine\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 385\u001b[0m \u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrequested\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 386\u001b[0m \u001b[43m \u001b[49m\u001b[43mexpression\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mexpression\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 387\u001b[0m \u001b[43m \u001b[49m\u001b[43mcolumn_types\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcolumn_types\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 388\u001b[0m \u001b[43m \u001b[49m\u001b[43mbind\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mbind\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 389\u001b[0m \u001b[43m \u001b[49m\u001b[43mdata_id\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdata_id\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 390\u001b[0m \u001b[43m 
\u001b[49m\u001b[43mregion\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mregion\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 391\u001b[0m \u001b[43m \u001b[49m\u001b[43mdefaults\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdefaults\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 392\u001b[0m \u001b[43m \u001b[49m\u001b[43mdataset_type_name\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdataset_type_name\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 393\u001b[0m \u001b[43m \u001b[49m\u001b[43mallow_orphans\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;129;43;01mnot\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mcheck\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 394\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 395\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39morder_by \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m \u001b[38;5;28;01mif\u001b[39;00m order_by \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m \u001b[38;5;28;01melse\u001b[39;00m OrderByClause\u001b[38;5;241m.\u001b[39mparse_general(order_by, requested)\n\u001b[1;32m 396\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlimit \u001b[38;5;241m=\u001b[39m limit\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/_structs.py:114\u001b[0m, in \u001b[0;36mQueryWhereClause.combine\u001b[0;34m(cls, dimensions, expression, column_types, bind, data_id, region, defaults, dataset_type_name, allow_orphans)\u001b[0m\n\u001b[1;32m 112\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m defaults \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m 113\u001b[0m defaults \u001b[38;5;241m=\u001b[39m DataCoordinate\u001b[38;5;241m.\u001b[39mmakeEmpty(dimensions\u001b[38;5;241m.\u001b[39muniverse)\n\u001b[0;32m--> 114\u001b[0m expression_predicate, governor_constraints 
\u001b[38;5;241m=\u001b[39m \u001b[43mmake_string_expression_predicate\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 115\u001b[0m \u001b[43m \u001b[49m\u001b[43mexpression\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 116\u001b[0m \u001b[43m \u001b[49m\u001b[43mdimensions\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 117\u001b[0m \u001b[43m \u001b[49m\u001b[43mcolumn_types\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcolumn_types\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 118\u001b[0m \u001b[43m \u001b[49m\u001b[43mbind\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mbind\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 119\u001b[0m \u001b[43m \u001b[49m\u001b[43mdata_id\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdata_id\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 120\u001b[0m \u001b[43m \u001b[49m\u001b[43mdefaults\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdefaults\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 121\u001b[0m \u001b[43m \u001b[49m\u001b[43mdataset_type_name\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdataset_type_name\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 122\u001b[0m \u001b[43m \u001b[49m\u001b[43mallow_orphans\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mallow_orphans\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 123\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 124\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m QueryWhereClause(\n\u001b[1;32m 125\u001b[0m expression_predicate,\n\u001b[1;32m 126\u001b[0m data_id,\n\u001b[1;32m 127\u001b[0m region\u001b[38;5;241m=\u001b[39mregion,\n\u001b[1;32m 128\u001b[0m governor_constraints\u001b[38;5;241m=\u001b[39mgovernor_constraints,\n\u001b[1;32m 129\u001b[0m )\n", + "File \u001b[0;32m~/lsst_stack_w_2023_44/stack/miniconda3-py38_4.9.2-7.0.1/DarwinX86/daf_butler/ge89626a060+c4141ea9c4/python/lsst/daf/butler/registry/queries/expressions/_predicate.py:138\u001b[0m, in \u001b[0;36mmake_string_expression_predicate\u001b[0;34m(string, dimensions, 
column_types, bind, data_id, defaults, dataset_type_name, allow_orphans)\u001b[0m\n\u001b[1;32m 136\u001b[0m tree \u001b[38;5;241m=\u001b[39m parser\u001b[38;5;241m.\u001b[39mparse(string)\n\u001b[1;32m 137\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mException\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m exc:\n\u001b[0;32m--> 138\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m UserExpressionSyntaxError(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mFailed to parse user expression \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mstring\u001b[38;5;132;01m!r}\u001b[39;00m\u001b[38;5;124m.\u001b[39m\u001b[38;5;124m\"\u001b[39m) \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mexc\u001b[39;00m\n\u001b[1;32m 139\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m bind \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m 140\u001b[0m bind \u001b[38;5;241m=\u001b[39m {}\n", + "\u001b[0;31mUserExpressionSyntaxError\u001b[0m: Failed to parse user expression 'id=4d673e07-c749-4d80-9dcf-b39615a802a4'." + ] + } + ], + "source": [ + "bulteridtest = registry.queryDatasets(\"calexp\", collections=collection, where=f\"id={testid}\")" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "id": "9beca3d0-2e1d-4459-a6ad-d859c12b64fa", + "metadata": {}, + "outputs": [], + "source": [ + "# vdr2 = butler.registry.queryDimensionRecords(\"visit_detector_region\", datasets='calexp', collections=collection, instrument='HSC', physical_filter='HSC-R')\n", + "# all_vdr = butler.registry.queryDatasets('calexp', physical_filter='HSC-R', collections=collection, instrument='HSC') # nope 11/27/2023 COC" + ] + }, + { + "cell_type": "code", + "execution_count": 40, + "id": "8249ccc7-e595-44ce-8f33-2b2c74e10a56", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "There are 240 records in all_vdr.\n", + "Rate was 21614.0134 matches/second. 
(We performed 21406 matches in 0.9903759956359863 seconds.)\n" + ] + } + ], + "source": [ + "match_dict = {}\n", + "match_by_keys = {}\n", + "\n", + "# all_vdr = vdr\n", + "all_vdr = butler.registry.queryDimensionRecords(\n", + " \"visit_detector_region\", datasets=\"calexp\", collections=collection, instrument=\"HSC\"\n", + ") # removing , physical_filter='HSC-R'\n", + "all_vdr_count = 0\n", + "\n", + "for i in all_vdr:\n", + " all_vdr_count += 1\n", + "print(f\"There are {all_vdr_count} records in all_vdr.\")\n", + "\n", + "\n", + "def make_key(vdr):\n", + " this_key = f'{this_vdr.dataId[\"instrument\"]}_{this_vdr.dataId[\"detector\"]}_{this_vdr.dataId[\"visit\"]}'\n", + " return this_key\n", + "\n", + "\n", + "check_count = 0\n", + "start_time = time.time()\n", + "for i, this_vdr in enumerate(all_vdr):\n", + " this_key = make_key(this_vdr)\n", + " # print(this_key)\n", + " matches_ = []\n", + " matches_by_keys_ = []\n", + " # print(this_vdr.region)\n", + " for j, other_vdr in enumerate(all_vdr):\n", + " other_key = make_key(other_vdr)\n", + " if j == i:\n", + " continue\n", + " # if this_vdr.region.contains(other_vdr.region):\n", + " if this_vdr.region.intersects(other_vdr.region):\n", + " check_count += 1\n", + " # print('hi') # testing; many showed up here but not in dict?\n", + " matches.append(this_vdr)\n", + " matches_by_keys_.append(f\"{this_key} intersects {other_key}\")\n", + " match_dict[this_vdr] = matches_\n", + " match_by_keys[this_key] = matches_by_keys_\n", + "\n", + "elapsed = time.time() - start_time\n", + "rate = check_count / elapsed # seeing ~20,000/s on my MBP 11/27/2023 COC\n", + "print(f\"Rate was {round(rate,4)} matches/second. 
(We performed {check_count} matches in {elapsed} seconds.)\")" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "id": "892331f6-f907-4eeb-aeb2-a963e7d20cc6", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Reminder: all_vdr_count = 240\n", + "HSC_41_322: 134\n", + "HSC_41_346: 95\n", + "HSC_41_358: 141\n", + "HSC_41_1178: 70\n", + "HSC_41_1184: 100\n", + "HSC_41_1204: 71\n", + "HSC_41_1206: 91\n", + "HSC_41_1214: 70\n", + "HSC_41_1220: 100\n", + "HSC_41_1242: 97\n", + "HSC_41_1248: 138\n", + "HSC_41_11690: 90\n", + "HSC_41_11694: 93\n", + "HSC_41_11696: 139\n", + "HSC_41_11698: 96\n", + "HSC_41_11704: 48\n", + "HSC_41_11710: 131\n", + "HSC_41_11724: 139\n", + "HSC_41_11738: 131\n", + "HSC_41_11740: 122\n", + "HSC_41_17900: 90\n", + "HSC_41_17904: 93\n", + "HSC_41_17906: 139\n", + "HSC_41_17926: 64\n", + "HSC_41_17948: 107\n", + "HSC_41_17950: 135\n", + "HSC_41_19680: 139\n", + "HSC_41_19684: 64\n", + "HSC_41_19694: 41\n", + "HSC_41_19696: 48\n", + "HSC_41_22632: 90\n", + "HSC_41_22662: 72\n", + "HSC_41_23694: 69\n", + "HSC_41_23704: 93\n", + "HSC_41_23706: 139\n", + "HSC_41_23718: 64\n", + "HSC_41_29336: 134\n", + "HSC_41_29350: 69\n", + "HSC_41_30482: 107\n", + "HSC_41_30490: 69\n", + "HSC_42_322: 107\n", + "HSC_42_346: 139\n", + "HSC_42_358: 100\n", + "HSC_42_1178: 74\n", + "HSC_42_1184: 60\n", + "HSC_42_1204: 72\n", + "HSC_42_1206: 122\n", + "HSC_42_1214: 74\n", + "HSC_42_1220: 60\n", + "HSC_42_1242: 139\n", + "HSC_42_1248: 103\n", + "HSC_42_11690: 81\n", + "HSC_42_11694: 128\n", + "HSC_42_11696: 110\n", + "HSC_42_11698: 57\n", + "HSC_42_11704: 94\n", + "HSC_42_11710: 107\n", + "HSC_42_11724: 110\n", + "HSC_42_11738: 107\n", + "HSC_42_11740: 118\n", + "HSC_42_17900: 81\n", + "HSC_42_17904: 128\n", + "HSC_42_17906: 110\n", + "HSC_42_17926: 92\n", + "HSC_42_17948: 134\n", + "HSC_42_17950: 88\n", + "HSC_42_19680: 110\n", + "HSC_42_19684: 92\n", + "HSC_42_19694: 69\n", + "HSC_42_19696: 94\n", + 
"HSC_42_22632: 141\n", + "HSC_42_22662: 68\n", + "HSC_42_23694: 72\n", + "HSC_42_23704: 128\n", + "HSC_42_23706: 110\n", + "HSC_42_23718: 92\n", + "HSC_42_29336: 63\n", + "HSC_42_29350: 42\n", + "HSC_42_30482: 134\n", + "HSC_42_30490: 42\n", + "HSC_47_322: 41\n", + "HSC_47_346: 37\n", + "HSC_47_358: 39\n", + "HSC_47_1178: 33\n", + "HSC_47_1184: 37\n", + "HSC_47_1204: 33\n", + "HSC_47_1206: 38\n", + "HSC_47_1214: 33\n", + "HSC_47_1220: 37\n", + "HSC_47_1242: 37\n", + "HSC_47_1248: 39\n", + "HSC_47_11690: 36\n", + "HSC_47_11694: 37\n", + "HSC_47_11696: 39\n", + "HSC_47_11698: 36\n", + "HSC_47_11704: 21\n", + "HSC_47_11710: 25\n", + "HSC_47_11724: 39\n", + "HSC_47_11738: 25\n", + "HSC_47_11740: 36\n", + "HSC_47_17900: 36\n", + "HSC_47_17904: 37\n", + "HSC_47_17906: 39\n", + "HSC_47_17926: 33\n", + "HSC_47_17948: 21\n", + "HSC_47_17950: 15\n", + "HSC_47_19680: 39\n", + "HSC_47_19684: 33\n", + "HSC_47_19694: 31\n", + "HSC_47_19696: 21\n", + "HSC_47_22632: 38\n", + "HSC_47_22662: 33\n", + "HSC_47_23694: 33\n", + "HSC_47_23704: 37\n", + "HSC_47_23706: 39\n", + "HSC_47_23718: 33\n", + "HSC_47_29336: 32\n", + "HSC_47_29350: 36\n", + "HSC_47_30482: 21\n", + "HSC_47_30490: 36\n", + "HSC_49_322: 137\n", + "HSC_49_346: 89\n", + "HSC_49_358: 148\n", + "HSC_49_1178: 113\n", + "HSC_49_1184: 145\n", + "HSC_49_1204: 116\n", + "HSC_49_1206: 96\n", + "HSC_49_1214: 113\n", + "HSC_49_1220: 145\n", + "HSC_49_1242: 92\n", + "HSC_49_1248: 142\n", + "HSC_49_11690: 113\n", + "HSC_49_11694: 94\n", + "HSC_49_11696: 134\n", + "HSC_49_11698: 149\n", + "HSC_49_11704: 68\n", + "HSC_49_11710: 87\n", + "HSC_49_11724: 134\n", + "HSC_49_11738: 87\n", + "HSC_49_11740: 89\n", + "HSC_49_17900: 113\n", + "HSC_49_17904: 94\n", + "HSC_49_17906: 134\n", + "HSC_49_17926: 99\n", + "HSC_49_17948: 55\n", + "HSC_49_17950: 68\n", + "HSC_49_19680: 134\n", + "HSC_49_19684: 99\n", + "HSC_49_19694: 82\n", + "HSC_49_19696: 68\n", + "HSC_49_22632: 81\n", + "HSC_49_22662: 116\n", + "HSC_49_23694: 113\n", + "HSC_49_23704: 
94\n", + "HSC_49_23706: 134\n", + "HSC_49_23718: 99\n", + "HSC_49_29336: 102\n", + "HSC_49_29350: 141\n", + "HSC_49_30482: 55\n", + "HSC_49_30490: 141\n", + "HSC_50_322: 122\n", + "HSC_50_346: 149\n", + "HSC_50_358: 117\n", + "HSC_50_1178: 128\n", + "HSC_50_1184: 91\n", + "HSC_50_1204: 127\n", + "HSC_50_1206: 144\n", + "HSC_50_1214: 128\n", + "HSC_50_1220: 91\n", + "HSC_50_1242: 149\n", + "HSC_50_1248: 118\n", + "HSC_50_11690: 119\n", + "HSC_50_11694: 144\n", + "HSC_50_11696: 119\n", + "HSC_50_11698: 90\n", + "HSC_50_11704: 125\n", + "HSC_50_11710: 78\n", + "HSC_50_11724: 119\n", + "HSC_50_11738: 78\n", + "HSC_50_11740: 100\n", + "HSC_50_17900: 119\n", + "HSC_50_17904: 144\n", + "HSC_50_17906: 119\n", + "HSC_50_17926: 150\n", + "HSC_50_17948: 81\n", + "HSC_50_17950: 55\n", + "HSC_50_19680: 119\n", + "HSC_50_19684: 150\n", + "HSC_50_19694: 141\n", + "HSC_50_19696: 125\n", + "HSC_50_22632: 151\n", + "HSC_50_22662: 122\n", + "HSC_50_23694: 127\n", + "HSC_50_23704: 144\n", + "HSC_50_23706: 119\n", + "HSC_50_23718: 150\n", + "HSC_50_29336: 57\n", + "HSC_50_29350: 85\n", + "HSC_50_30482: 81\n", + "HSC_50_30490: 85\n", + "HSC_58_322: 76\n", + "HSC_58_346: 86\n", + "HSC_58_358: 74\n", + "HSC_58_1178: 119\n", + "HSC_58_1184: 77\n", + "HSC_58_1204: 125\n", + "HSC_58_1206: 94\n", + "HSC_58_1214: 119\n", + "HSC_58_1220: 77\n", + "HSC_58_1242: 90\n", + "HSC_58_1248: 74\n", + "HSC_58_11690: 91\n", + "HSC_58_11694: 91\n", + "HSC_58_11696: 73\n", + "HSC_58_11698: 79\n", + "HSC_58_11704: 83\n", + "HSC_58_11710: 31\n", + "HSC_58_11724: 73\n", + "HSC_58_11738: 31\n", + "HSC_58_11740: 50\n", + "HSC_58_17900: 91\n", + "HSC_58_17904: 91\n", + "HSC_58_17906: 73\n", + "HSC_58_17926: 117\n", + "HSC_58_17948: 27\n", + "HSC_58_17950: 17\n", + "HSC_58_19680: 73\n", + "HSC_58_19684: 117\n", + "HSC_58_19694: 149\n", + "HSC_58_19696: 83\n", + "HSC_58_22632: 87\n", + "HSC_58_22662: 116\n", + "HSC_58_23694: 123\n", + "HSC_58_23704: 91\n", + "HSC_58_23706: 73\n", + "HSC_58_23718: 117\n", + 
"HSC_58_29336: 30\n", + "HSC_58_29350: 102\n", + "HSC_58_30482: 27\n", + "HSC_58_30490: 101\n" + ] + } + ], + "source": [ + "# for i, a_vdr in enumerate(match_dict.keys()): print(f'{i}: {len(match_dict[a_vdr])}')\n", + "# for i, a_vdr in enumerate(match_dict.keys()): print(f'{len(match_dict[a_vdr])!s:>5} matches for {a_vdr.dataId}')\n", + "# print(match_by_keys.keys())\n", + "print(f\"Reminder: all_vdr_count = {all_vdr_count}\")\n", + "for i, a_key in enumerate(match_by_keys.keys()):\n", + " print(f\"{a_key}: {len(match_by_keys[a_key])}\")" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "id": "6f87f462-789b-424b-b2a6-85080d7e3bab", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "6000000" + ] + }, + "execution_count": 26, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "n_chips_month_lsst = 1000 * 30 * 200\n", + "n_chips_month_lsst" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "id": "f2f388e6-763a-4127-b731-fa9ac48b6dab", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Brute force chip-chip (all): 51.1 years (single-thread) to match 1 month of LSST chips.\n" + ] + } + ], + "source": [ + "compute_yrs_for_lsst_month = ((n_chips_month_lsst * n_chips_month_lsst) / rate) / 60 / 60 / 24 / 365\n", + "print(\n", + " f\"Brute force chip-chip (all): {round(compute_yrs_for_lsst_month,1)} years (single-thread) to match 1 month of LSST chips.\"\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "id": "2326484e-d4c1-4f3b-a01d-d78136d24af5", + "metadata": {}, + "outputs": [], + "source": [ + "# vdr = butler.registry.queryDimensionRecords(\"visit_detector_region\", datasets='calexp', collections=collection, instrument='HSC', physical_filter='HSC-R') # more specific, just the calex stuff\n", + "# butler.registry.queryDatasets('calexp', physical_filter='HSC-R', collections=collection, instrument='HSC')\n", + "datasetRefs = 
butler.registry.queryDatasets(\n", + " \"calexp\",\n", + " # physical_filter='HSC-R',\n", + " collections=collection,\n", + " instrument=\"HSC\",\n", + ")\n", + "# datasetRefs = butler.registry.queryDatasets(datasetType='calexp',\n", + "# collection = f\"u/{os.environ['USER']}/single_frame\", # recall\n", + "# # band='i', detector=175,\n", + "# # where='visit > 192000 and visit < 193000'\n", + "# )" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "id": "6e129012-cf56-4b50-a543-a7b8d5c378a5", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "{band: 'y', instrument: 'HSC', detector: 41, physical_filter: 'HSC-Y', visit_system: 0, visit: 322}\n", + "{band: 'y', instrument: 'HSC', detector: 41, physical_filter: 'HSC-Y', visit_system: 0, visit: 346}\n", + "{band: 'y', instrument: 'HSC', detector: 41, physical_filter: 'HSC-Y', visit_system: 0, visit: 358}\n", + "{band: 'z', instrument: 'HSC', detector: 41, physical_filter: 'HSC-Z', visit_system: 0, visit: 1178}\n", + "{band: 'z', instrument: 'HSC', detector: 41, physical_filter: 'HSC-Z', visit_system: 0, visit: 1184}\n", + "...\n", + "There are 239 records total.\n" + ] + } + ], + "source": [ + "thiscounter = 0\n", + "for i, ref in enumerate(datasetRefs.expanded()):\n", + " thiscounter = i\n", + " if i < 5:\n", + " print(ref.dataId.full)\n", + "print(\"...\") # like this idea in the DP0.2 notebook 12/4/2023 COC\n", + "print(f\"There are {thiscounter} records total.\")" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "id": "69cf7f05-1373-4054-94fc-fc7273596723", + "metadata": {}, + "outputs": [], + "source": [ + "# for i, ref in enumerate(datasetRefs.expanded()):\n", + "# bbox = butler.get('calexp.bbox', dataId=ref.dataId)\n", + "# wcs = butler.get('calexp.wcs', dataId=ref.dataId)\n", + "# crnr_ra, crnr_dec = get_corners_radec(wcs, bbox)\n", + "# tmp = ''\n", + "# for c in range(4):\n", + "# tmp += f'({crnr_ra[c]:.3f},{crnr_dec[c]:.3f}) '\n", + 
"# print(i, tmp)" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "id": "5a8e930d-7b9c-4bb0-95a1-ab5e5abbf284", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Example region: ConvexPolygon([UnitVector3d(-0.8679157412883791, 0.4953768322146207, 0.03638763703307745), UnitVector3d(-0.8678508112373716, 0.49533452653358495, 0.038453559762199246), UnitVector3d(-0.8659604515352447, 0.49863199273540854, 0.03845298684875526), UnitVector3d(-0.8660276891555382, 0.4986705548678019, 0.036382953752507885)])\n" + ] + } + ], + "source": [ + "pointing_regions = []\n", + "for i, ref in enumerate(datasetRefs.expanded()):\n", + " if i == 0:\n", + " print(f\"Example region: {ref.dataId.region}\")\n", + " tmpref = ref\n", + " pointing_regions.append(ref.dataId.region)" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "id": "64834ef2-eba6-4512-a117-1acc14425bbf", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "ConvexPolygon([UnitVector3d(-0.8679157412883791, 0.4953768322146207, 0.03638763703307745), UnitVector3d(-0.8678508112373716, 0.49533452653358495, 0.038453559762199246), UnitVector3d(-0.8659604515352447, 0.49863199273540854, 0.03845298684875526), UnitVector3d(-0.8660276891555382, 0.4986705548678019, 0.036382953752507885)])" + ] + }, + "execution_count": 32, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "tmpref.dataId.region" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "id": "06ce5618-40e8-46e7-b825-ea0fe0c5e847", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Box(NormalizedAngleInterval.fromRadians(0.0, 0.05235987755982989), AngleInterval.fromRadians(-1.5707963267948966, -1.5184364492350666))" + ] + }, + "execution_count": 36, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# from separate Patches on Sky Notebook\n", + "r = 
b\"b\\x00\\x00\\x00\\x00\\x00\\x00\\x00\\x00\\xd6\\xeb{\\xf3\\xe9\\xce\\xaa?\\x18-DT\\xfb!\\xf9\\xbf\\xb9M\\xa8\\x04\\x84K\\xf8\\xbf\"\n", + "rd = sphgeom.Region.decode(r)\n", + "rd" + ] + }, + { + "cell_type": "code", + "execution_count": 39, + "id": "870f142c-d186-4880-b782-3c03da562276", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Checked 240 times, found 0 matches.\n" + ] + } + ], + "source": [ + "c = 0\n", + "intersect_count = 0\n", + "for i in pointing_regions:\n", + " c += 1\n", + " if i.intersects(rd):\n", + " print(f\"Intersects!\")\n", + " intersect_count += 1\n", + "print(f\"Checked {c} times, found {intersect_count} matches.\")" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.6" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/region_search/sky_patches.ipynb b/notebooks/region_search/sky_patches.ipynb index ee4ec036b..105295c5e 100644 --- a/notebooks/region_search/sky_patches.ipynb +++ b/notebooks/region_search/sky_patches.ipynb @@ -66,6 +66,7 @@ "source": [ "# We will set up a dictionary with some values we will need for a given \"instrument\" here.\n", "chipDict = {}\n", + "# matches_per_sec refers to how fast we can compare region hashes using LSST sphgeom\n", "\n", "# Dark Energy Camera; Cerro Tololo Inter-American Observatory (CTIO), Chile\n", "chipDict[\"DECam\"] = {\"chipsize_arcmin\": [9, 18]} # 0.263\"/pixel, (2048,4096) pix/chip = (8.98,17.95')/chip\n", @@ -221,7 +222,7 @@ } ], "source": [ - "# test very confined Dec case\n", + "# test very confined Declination case\n", "patches_result, patches_centers, info = generate_patches(\n", " 
arcminutes=(15, 15), overlap_percentage=0, decRange=[-90, -89.75], export=False\n", ")\n", @@ -279,7 +280,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 1, "id": "52946064", "metadata": {}, "outputs": [], @@ -342,7 +343,7 @@ " ax.set_xlim(xrange[0], xrange[1])\n", " ax.set_ylim(yrange[0], yrange[1])\n", "\n", - " plt.grid(True)\n", + " plt.grid(False)\n", "\n", " outfile_base = f\"{subfolder}/patches\"\n", " if title != None:\n", From d7bacfad20405900bab4d0c28c2b0796909e73c2 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Wed, 7 Feb 2024 15:17:28 -0500 Subject: [PATCH 22/27] Implementation --- data/demo_config.yml | 1 - docs/source/user_manual/search_params.rst | 3 + src/kbmod/analysis_utils.py | 143 ------------------ src/kbmod/configuration.py | 1 + src/kbmod/filters/stamp_filters.py | 170 +++++++++++++++++++++- src/kbmod/run_search.py | 21 ++- src/kbmod/search/common.h | 17 +++ src/kbmod/search/raw_image.cpp | 18 ++- tests/test_analysis_utils.py | 126 ---------------- tests/test_configuration.py | 1 + tests/test_raw_image.py | 16 ++ tests/test_stamp_filters.py | 124 ++++++++++++++++ 12 files changed, 353 insertions(+), 288 deletions(-) diff --git a/data/demo_config.yml b/data/demo_config.yml index 1d88e80c5..12d8b8585 100644 --- a/data/demo_config.yml +++ b/data/demo_config.yml @@ -55,7 +55,6 @@ mom_lims: - 37.5 - 37.5 - 1.5 -- 1.5 - 1.0 - 1.0 num_cores: 1 diff --git a/docs/source/user_manual/search_params.rst b/docs/source/user_manual/search_params.rst index 32efcce6c..c6f48e94f 100644 --- a/docs/source/user_manual/search_params.rst +++ b/docs/source/user_manual/search_params.rst @@ -155,6 +155,9 @@ This document serves to provide a quick overview of the existing parameters and | | | Can be use used in addition to | | | | outputting individual result files. 
| +------------------------+-----------------------------+----------------------------------------+ +| ``save_all_stamps`` | True | Save the individual stamps for each | +| | | result and timestep. | ++------------------------+-----------------------------+----------------------------------------+ | ``sigmaG_lims`` | [25, 75] | The percentiles to use in sigmaG | | | | filtering, if | | | | ``filter_type= clipped_sigmaG``. | diff --git a/src/kbmod/analysis_utils.py b/src/kbmod/analysis_utils.py index 4da73ca78..709e7a66f 100644 --- a/src/kbmod/analysis_utils.py +++ b/src/kbmod/analysis_utils.py @@ -121,149 +121,6 @@ def load_and_filter_results( res_num += chunk_size return keep - def get_all_stamps(self, result_list, search, stamp_radius): - """Get the stamps for the final results from a kbmod search. - - Parameters - ---------- - result_list : `ResultList` - The values from trajectories. The stamps are inserted into this data structure. - search : `kbmod.StackSearch` - The search object - stamp_radius : int - The radius of the stamps to create. - """ - stamp_edge = stamp_radius * 2 + 1 - for row in result_list.results: - stamps = kb.StampCreator.get_stamps(search.get_imagestack(), row.trajectory, stamp_radius) - # TODO: a way to avoid a copy here would be to do - # np.array([s.image for s in stamps], dtype=np.single, copy=False) - # but that could cause a problem with reference counting at the m - # moment. The real fix is to make the stamps return Image not - # RawImage, return the Image and avoid a reference to a private - # attribute. This risks collecting RawImage but leaving a dangling - # ref to its private field. That's a fix for another time. 
- row.all_stamps = np.array([stamp.image for stamp in stamps]) - - def apply_stamp_filter( - self, - result_list, - search, - center_thresh=0.03, - peak_offset=[2.0, 2.0], - mom_lims=[35.5, 35.5, 1.0, 0.25, 0.25], - chunk_size=1000000, - stamp_type="sum", - stamp_radius=10, - ): - """This function filters result postage stamps based on their Gaussian - Moments. Results with stamps that are similar to a Gaussian are kept. - - Parameters - ---------- - result_list : `ResultList` - The values from trajectories. This data gets modified directly by - the filtering. - search : `kbmod.StackSearch` - The search object. - center_thresh : float - The fraction of the total flux that must be contained in a single - central pixel. - peak_offset : list of floats - How far the brightest pixel in the stamp can be from the central - pixel. - mom_lims : list of floats - The maximum limit of the xx, yy, xy, x, and y central moments of - the stamp. - chunk_size : int - How many stamps to load and filter at a time. - stamp_type : string - Which method to use to generate stamps. - One of 'median', 'cpp_median', 'mean', 'cpp_mean', or 'sum'. - stamp_radius : int - The radius of the stamp. - """ - # Set the stamp creation and filtering parameters. - params = kb.StampParameters() - params.radius = stamp_radius - params.do_filtering = True - params.center_thresh = center_thresh - params.peak_offset_x = peak_offset[0] - params.peak_offset_y = peak_offset[1] - params.m20_limit = mom_lims[0] - params.m02_limit = mom_lims[1] - params.m11_limit = mom_lims[2] - params.m10_limit = mom_lims[3] - params.m01_limit = mom_lims[4] - - if stamp_type == "cpp_median" or stamp_type == "median": - params.stamp_type = kb.StampType.STAMP_MEDIAN - elif stamp_type == "cpp_mean" or stamp_type == "mean": - params.stamp_type = kb.StampType.STAMP_MEAN - else: - params.stamp_type = kb.StampType.STAMP_SUM - - # Save some useful helper data. 
- num_times = search.get_num_images() - all_valid_inds = [] - - # Run the stamp creation and filtering in batches of chunk_size. - print("---------------------------------------") - print("Applying Stamp Filtering") - print("---------------------------------------", flush=True) - start_time = time.time() - start_idx = 0 - if result_list.num_results() <= 0: - print("Skipping. Nothing to filter.") - return - - print("Stamp filtering %i results" % result_list.num_results()) - while start_idx < result_list.num_results(): - end_idx = min([start_idx + chunk_size, result_list.num_results()]) - - # Create a subslice of the results and the Boolean indices. - # Note that the sum stamp type does not filter out lc_index. - inds_to_use = [i for i in range(start_idx, end_idx)] - trj_slice = [result_list.results[i].trajectory for i in inds_to_use] - if params.stamp_type != kb.StampType.STAMP_SUM: - bool_slice = [result_list.results[i].valid_indices_as_booleans() for i in inds_to_use] - else: - # For the sum stamp, use all the indices for each trajectory. - all_true = [True] * num_times - bool_slice = [all_true for _ in inds_to_use] - - # Create and filter the results, using the GPU if there is one and enough - # trajectories to make it worthwhile. - stamps_slice = kb.StampCreator.get_coadded_stamps( - search.get_imagestack(), - trj_slice, - bool_slice, - params, - kb.HAS_GPU and len(trj_slice) > 100, - ) - # TODO: a way to avoid a copy here would be to do - # np.array([s.image for s in stamps], dtype=np.single, copy=False) - # but that could cause a problem with reference counting at the m - # moment. The real fix is to make the stamps return Image not - # RawImage and avoid reference to an private attribute and risking - # collecting RawImage but leaving a dangling ref to the attribute. 
- # That's a fix for another time so I'm leaving it as a copy here - for ind, stamp in enumerate(stamps_slice): - if stamp.width > 1: - result_list.results[ind + start_idx].stamp = np.array(stamp.image) - all_valid_inds.append(ind + start_idx) - - # Move to the next chunk. - start_idx += chunk_size - - # Do the actual filtering of results - result_list.filter_results(all_valid_inds) - print("Keeping %i results" % result_list.num_results(), flush=True) - - end_time = time.time() - time_elapsed = end_time - start_time - print("{:.2f}s elapsed".format(time_elapsed)) - def apply_clustering(self, result_list, cluster_params): """This function clusters results that have similar trajectories. diff --git a/src/kbmod/configuration.py b/src/kbmod/configuration.py index c6fdeeba4..88e59063b 100644 --- a/src/kbmod/configuration.py +++ b/src/kbmod/configuration.py @@ -74,6 +74,7 @@ def __init__(self): "repeated_flag_keys": default_repeated_flag_keys, "res_filepath": None, "result_filename": None, + "save_all_stamps": True, "sigmaG_lims": [25, 75], "stamp_radius": 10, "stamp_type": "sum", diff --git a/src/kbmod/filters/stamp_filters.py b/src/kbmod/filters/stamp_filters.py index 3d5db49aa..4354c26c5 100644 --- a/src/kbmod/filters/stamp_filters.py +++ b/src/kbmod/filters/stamp_filters.py @@ -5,9 +5,20 @@ """ import abc +import numpy as np +import time +from kbmod.configuration import SearchConfiguration from kbmod.result_list import ResultRow -from kbmod.search import KB_NO_DATA, RawImage +from kbmod.search import ( + HAS_GPU, + KB_NO_DATA, + ImageStack, + RawImage, + StampCreator, + StampParameters, + StampType, +) class BaseStampFilter(abc.ABC): @@ -237,3 +248,160 @@ def keep_row(self, row: ResultRow): """ image = RawImage(row.stamp) return image.center_is_local_max(self.flux_thresh, self.local_max) + + +def extract_search_parameters_from_config(config): + """Create an initialized StampParameters object from the configuration settings + while doing some validity checking. 
+ + Parameters + ---------- + config : `SearchConfiguration` + The configuration object. + + Returns + ------- + params : `StampParameters` + The StampParameters object with all fields set. + + Raises + ------ + Raises a ``ValueError`` if parameter validation fails. + Raises a ``KeyError`` if a required parameter is not found. + """ + params = StampParameters() + + # Construction parameters + params.radius = config["stamp_radius"] + if params.radius < 0: + raise ValueError(f"Invalid stamp radius {params.radius}") + + stamp_type = config["stamp_type"] + if stamp_type == "cpp_median" or stamp_type == "median": + params.stamp_type = StampType.STAMP_MEDIAN + elif stamp_type == "cpp_mean" or stamp_type == "mean": + params.stamp_type = StampType.STAMP_MEAN + elif stamp_type == "cpp_sum" or stamp_type == "sum": + params.stamp_type = StampType.STAMP_SUM + else: + raise ValueError(f"Unrecognized stamp type: {stamp_type}") + + # Filtering parameters (with validity checking) + params.do_filtering = config["do_stamp_filter"] + params.center_thresh = config["center_thresh"] + + peak_offset = config["peak_offset"] + if len(peak_offset) != 2: + raise ValueError(f"Expected length 2 list for peak_offset. Found {peak_offset}") + params.peak_offset_x = peak_offset[0] + params.peak_offset_y = peak_offset[1] + + mom_lims = config["mom_lims"] + if len(mom_lims) != 5: + raise ValueError(f"Expected length 5 list for mom_lims. Found {mom_lims}") + params.m20_limit = mom_lims[0] + params.m02_limit = mom_lims[1] + params.m11_limit = mom_lims[2] + params.m10_limit = mom_lims[3] + params.m01_limit = mom_lims[4] + + return params + + +def get_coadds_and_filter(result_list, im_stack, stamp_params, chunk_size=1000000, debug=False): + """Create the co-added postage stamps and filter them based on their statistical + properties. Results with stamps that are similar to a Gaussian are kept. + + Parameters + ---------- + result_list : `ResultList` + The current set of results. Modified directly. 
+ im_stack : `ImageStack` + The images from which to build the co-added stamps. + stamp_params : `StampParameters` or `SearchConfiguration` + The filtering parameters for the stamps. + chunk_size : `int` + How many stamps to load and filter at a time. Used to control memory. + debug : `bool` + Output verbose debugging messages. + """ + if type(stamp_params) is SearchConfiguration: + stamp_params = extract_search_parameters_from_config(stamp_params) + + if debug: + print("---------------------------------------") + print("Applying Stamp Filtering") + print("---------------------------------------") + if result_list.num_results() <= 0: + print("Skipping. Nothing to filter.") + else: + print(f"Stamp filtering {result_list.num_results()} results.") + print(stamp_params) + print(f"Using chunksize = {chunk_size}") + + # Run the stamp creation and filtering in batches of chunk_size. + start_time = time.time() + start_idx = 0 + all_valid_inds = [] + while start_idx < result_list.num_results(): + end_idx = min([start_idx + chunk_size, result_list.num_results()]) + + # Create a subslice of the results and the Boolean indices. + # Note that the sum stamp type does not filter out lc_index. + inds_to_use = [i for i in range(start_idx, end_idx)] + trj_slice = [result_list.results[i].trajectory for i in inds_to_use] + if stamp_params.stamp_type != StampType.STAMP_SUM: + bool_slice = [result_list.results[i].valid_indices_as_booleans() for i in inds_to_use] + else: + # For the sum stamp, use all the indices for each trajectory. + all_true = [True] * im_stack.img_count() + bool_slice = [all_true for _ in inds_to_use] + + # Create and filter the results, using the GPU if there is one and enough + # trajectories to make it worthwhile. 
+ stamps_slice = StampCreator.get_coadded_stamps( + im_stack, + trj_slice, + bool_slice, + stamp_params, + HAS_GPU and len(trj_slice) > 100, + ) + # TODO: a way to avoid a copy here would be to do + # np.array([s.image for s in stamps], dtype=np.single, copy=False) + # but that could cause a problem with reference counting at the m + # moment. The real fix is to make the stamps return Image not + # RawImage and avoid reference to an private attribute and risking + # collecting RawImage but leaving a dangling ref to the attribute. + # That's a fix for another time so I'm leaving it as a copy here + for ind, stamp in enumerate(stamps_slice): + if stamp.width > 1: + result_list.results[ind + start_idx].stamp = np.array(stamp.image) + all_valid_inds.append(ind + start_idx) + + # Move to the next chunk. + start_idx += chunk_size + + # Do the actual filtering of results + result_list.filter_results(all_valid_inds) + if debug: + print("Keeping %i results" % result_list.num_results(), flush=True) + time_elapsed = time.time() - start_time + print("{:.2f}s elapsed".format(time_elapsed)) + + +def append_all_stamps(result_list, im_stack, stamp_radius): + """Get the stamps for the final results from a kbmod search. These are appended + onto the corresponding entries in a ResultList. + + Parameters + ---------- + result_list : `ResultList` + The current set of results. Modified directly. + im_stack : `ImageStack` + The stack of images. + stamp_radius : `int` + The radius of the stamps to create. 
+ """ + for row in result_list.results: + stamps = StampCreator.get_stamps(im_stack, row.trajectory, stamp_radius) + row.all_stamps = np.array([stamp.image for stamp in stamps]) diff --git a/src/kbmod/run_search.py b/src/kbmod/run_search.py index 0065ccae3..9ca49f1ec 100644 --- a/src/kbmod/run_search.py +++ b/src/kbmod/run_search.py @@ -13,11 +13,12 @@ import kbmod.search as kb from .analysis_utils import PostProcess -from .data_interface import load_input_from_config, load_input_from_file from .configuration import SearchConfiguration +from .data_interface import load_input_from_config, load_input_from_file +from .filters.sigma_g_filter import SigmaGClipping +from .filters.stamp_filters import append_all_stamps, get_coadds_and_filter from .masking import apply_mask_operations from .result_list import * -from .filters.sigma_g_filter import SigmaGClipping from .work_unit import WorkUnit @@ -161,14 +162,11 @@ def run_search(self, config, stack): max_lh=config["max_lh"], ) if config["do_stamp_filter"]: - kb_post_process.apply_stamp_filter( + get_coadds_and_filter( keep, - search, - center_thresh=config["center_thresh"], - peak_offset=config["peak_offset"], - mom_lims=config["mom_lims"], - stamp_type=config["stamp_type"], - stamp_radius=config["stamp_radius"], + search.get_imagestack(), + config, + debug=config["debug"], ) if config["do_clustering"]: @@ -180,8 +178,9 @@ def run_search(self, config, stack): cluster_params["mjd"] = np.array(mjds) kb_post_process.apply_clustering(keep, cluster_params) - # Extract all the stamps. - kb_post_process.get_all_stamps(keep, search, config["stamp_radius"]) + # Extract all the stamps for all time steps and append them onto the result rows. + if config["save_all_stamps"]: + append_all_stamps(keep, search.get_imagestack(), config["stamp_radius"]) # TODO - Re-enable the known object counting once we have a way to pass # A WCS into the WorkUnit. 
diff --git a/src/kbmod/search/common.h b/src/kbmod/search/common.h index b7c89663e..285d51876 100644 --- a/src/kbmod/search/common.h +++ b/src/kbmod/search/common.h @@ -106,6 +106,22 @@ struct StampParameters { float m11_limit; float m02_limit; float m20_limit; + + const std::string to_string() const { + // If filtering is turned off, output the minimal information on a single line. + // Otherwise dump the full statistics on multiple lines. + if (!do_filtering) { + return ("Type: " + std::to_string(stamp_type) + " Radius: " + std::to_string(radius) + + " Filtering: false"); + } else { + return ("Type: " + std::to_string(stamp_type) + "\nRadius: " + std::to_string(radius) + + "\nFiltering: true" + "\nCenter Thresh: " + std::to_string(center_thresh) + + "\nPeak Offset: x=" + std::to_string(peak_offset_x) + " y=" + + std::to_string(peak_offset_y) + "\nMoment Limits: m01=" + std::to_string(m01_limit) + + " m10=" + std::to_string(m10_limit) + " m11=" + std::to_string(m11_limit) + + " m02=" + std::to_string(m02_limit) + " m20=" + std::to_string(m02_limit)); + } + } }; // Basic image moments use for analysis. 
@@ -162,6 +178,7 @@ static void image_moments_bindings(py::module &m) { static void stamp_parameters_bindings(py::module &m) { py::class_(m, "StampParameters", pydocs::DOC_StampParameters) .def(py::init<>()) + .def("__str__", &StampParameters::to_string) .def_readwrite("radius", &StampParameters::radius) .def_readwrite("stamp_type", &StampParameters::stamp_type) .def_readwrite("do_filtering", &StampParameters::do_filtering) diff --git a/src/kbmod/search/raw_image.cpp b/src/kbmod/search/raw_image.cpp index a2e541355..f4f40637f 100644 --- a/src/kbmod/search/raw_image.cpp +++ b/src/kbmod/search/raw_image.cpp @@ -114,13 +114,19 @@ RawImage RawImage::create_stamp(const Point& p, const int radius, const bool kee if (radius < 0) throw std::runtime_error("stamp radius must be at least 0"); const int dim = radius * 2 + 1; - // can't address this instance of non-uniform index handling with Point - // and Index, because at a base level it adopts a different definition of - // the pixel grid to coordinate system transformation. - auto [corner, anchor, w, h] = indexing::anchored_block({(int)p.y, (int)p.x}, radius, width, height); - Image stamp = Image::Constant(dim, dim, NO_DATA); - stamp.block(anchor.i, anchor.j, h, w) = image.block(corner.i, corner.j, h, w); + + // Eigen gets uphappy if the stamp does not overlap at all. In this case, skip + // the computation and leave the entire stamp set to NO_DATA. + Index idx = p.to_index(); + if ((idx.j + radius >= 0) && (idx.j - radius < (int)width) && + (idx.i + radius >= 0) && (idx.i - radius < (int)height)) { + // can't address this instance of non-uniform index handling with Point + // and Index, because at a base level it adopts a different definition of + // the pixel grid to coordinate system transformation. 
+ auto [corner, anchor, w, h] = indexing::anchored_block({(int)p.y, (int)p.x}, radius, width, height); + stamp.block(anchor.i, anchor.j, h, w) = image.block(corner.i, corner.j, h, w); + } if (!keep_no_data) stamp = (stamp.array() == NO_DATA).select(0.0, stamp); diff --git a/tests/test_analysis_utils.py b/tests/test_analysis_utils.py index 9d8523962..506202de0 100644 --- a/tests/test_analysis_utils.py +++ b/tests/test_analysis_utils.py @@ -131,132 +131,6 @@ def setUp(self): row.set_psi_phi(get_psi_curves[i], get_phi_curves[i]) self.curve_result_set.append_result(row) - @unittest.skipIf(not HAS_GPU, "Skipping test (no GPU detected)") - def test_apply_stamp_filter(self): - # object properties - self.object_flux = 250.0 - self.start_x = 4 - self.start_y = 3 - self.vxel = 2.0 - self.vyel = 1.0 - - for i in range(self.img_count): - time = i / self.img_count - add_fake_object( - self.imlist[i], - self.start_x + time * self.vxel + 0.5, - self.start_y + time * self.vyel + 0.5, - self.object_flux, - self.p, - ) - - stack = ImageStack(self.imlist) - search = StackSearch(stack) - search.search( - self.angle_steps, - self.velocity_steps, - self.min_angle, - self.max_angle, - self.min_vel, - self.max_vel, - int(self.img_count / 2), - ) - - zeroed_times = np.array(stack.build_zeroed_times()) - kb_post_process = PostProcess(self.config, zeroed_times) - - keep = kb_post_process.load_and_filter_results( - search, - self.config["lh_level"], - chunk_size=self.config["chunk_size"], - max_lh=self.config["max_lh"], - ) - - # Apply the stamp filter with default parameters. - kb_post_process.apply_stamp_filter(keep, search) - - # Check that we get at least one result and those results have stamps. - self.assertGreater(keep.num_results(), 0) - for i in range(keep.num_results()): - self.assertIsNotNone(keep.results[i].stamp) - - def test_apply_stamp_filter_2(self): - # Also confirms that apply_stamp_filter works with a chunksize < number - # of results. 
- - # object properties - self.object_flux = 250.0 - self.start_x = 4 - self.start_y = 3 - self.vxel = 2.0 - self.vyel = 1.0 - - for i in range(self.img_count): - time = i / self.img_count - add_fake_object( - self.imlist[i], - self.start_x + time * self.vxel, - self.start_y + time * self.vyel, - self.object_flux, - self.p, - ) - - stack = ImageStack(self.imlist) - search = StackSearch(stack) - - # Create a first Trajectory that matches perfectly. - trj = Trajectory() - trj.x = self.start_x - trj.y = self.start_y - trj.vx = self.vxel - trj.vy = self.vyel - - # Create a second Trajectory that isn't any good. - trj2 = Trajectory() - trj2.x = 1 - trj2.y = 1 - trj2.vx = 0 - trj2.vy = 0 - - # Create a third Trajectory that is close to good, but offset. - trj3 = Trajectory() - trj3.x = trj.x + 2 - trj3.y = trj.y + 2 - trj3.vx = trj.vx - trj3.vy = trj.vy - - # Create a fourth Trajectory that is just close enough - trj4 = Trajectory() - trj4.x = trj.x + 1 - trj4.y = trj.y + 1 - trj4.vx = trj.vx - trj4.vy = trj.vy - - # Create the ResultList. - keep = ResultList(self.time_list) - keep.append_result(ResultRow(trj, self.img_count)) - keep.append_result(ResultRow(trj2, self.img_count)) - keep.append_result(ResultRow(trj3, self.img_count)) - keep.append_result(ResultRow(trj4, self.img_count)) - - # Create the post processing object. - kb_post_process = PostProcess(self.config, self.time_list) - keep2 = kb_post_process.apply_stamp_filter( - keep, - search, - center_thresh=0.03, - peak_offset=[1.5, 1.5], - mom_lims=[35.5, 35.5, 1.0, 1.0, 1.0], - chunk_size=1, - stamp_type="cpp_mean", - stamp_radius=5, - ) - - # The check that the correct indices and number of stamps are saved. 
- self.assertEqual(keep.num_results(), 2) - self.assertEqual(keep.results[0].trajectory.x, self.start_x) - self.assertEqual(keep.results[1].trajectory.x, self.start_x + 1) - def test_clustering(self): cluster_params = {} cluster_params["x_size"] = self.dim_x diff --git a/tests/test_configuration.py b/tests/test_configuration.py index 7140352cd..da9f90761 100644 --- a/tests/test_configuration.py +++ b/tests/test_configuration.py @@ -7,6 +7,7 @@ from yaml import safe_load from kbmod.configuration import SearchConfiguration +from kbmod.search import StampParameters, StampType class test_configuration(unittest.TestCase): diff --git a/tests/test_raw_image.py b/tests/test_raw_image.py index be1a48d57..6d70434ca 100644 --- a/tests/test_raw_image.py +++ b/tests/test_raw_image.py @@ -374,6 +374,22 @@ def test_make_stamp(self): expected = np.array([[0.0, 100.0, 101.0], [0.0, 110.0, 111.0], [0.0, 0.0, 0.0]]) self.assertTrue((stamp.image == expected).all()) + # Test a stamp that is completely out of bounds. + stamp = img.create_stamp(20.5, 20.5, 1, False) + expected = np.array([[0.0, 0.0, 0.0], [0.0, 0.0, 0.0], [0.0, 0.0, 0.0]]) + self.assertTrue((stamp.image == expected).all()) + + # Test a stamp that overlaps at a single corner pixel. 
+ stamp = img.create_stamp(-1.5, -1.5, 1, True) + expected = np.array( + [ + [KB_NO_DATA, KB_NO_DATA, KB_NO_DATA], + [KB_NO_DATA, KB_NO_DATA, KB_NO_DATA], + [KB_NO_DATA, KB_NO_DATA, 0.0], + ] + ) + self.assertTrue((stamp.image == expected).all()) + def test_read_write_file(self): """Test file writes and reads correctly.""" img = RawImage(self.array, 10.0) diff --git a/tests/test_stamp_filters.py b/tests/test_stamp_filters.py index 61c44cf73..32e62272a 100644 --- a/tests/test_stamp_filters.py +++ b/tests/test_stamp_filters.py @@ -1,5 +1,8 @@ +import numpy as np import unittest +from kbmod.configuration import SearchConfiguration +from kbmod.fake_data_creator import add_fake_object, FakeDataSet from kbmod.filters.stamp_filters import * from kbmod.result_list import * from kbmod.search import * @@ -137,6 +140,127 @@ def test_center_filtering(self): self.assertFalse(StampCenterFilter(3, True, 0.4).keep_row(row)) self.assertTrue(StampCenterFilter(3, False, 0.2).keep_row(row)) + def test_extract_search_parameters_from_config(self): + config_dict = { + "center_thresh": 0.05, + "do_stamp_filter": True, + "mom_lims": [50.0, 51.0, 1.0, 2.0, 3.0], + "peak_offset": [1.5, 3.5], + "stamp_type": "median", + "stamp_radius": 7, + } + config = SearchConfiguration.from_dict(config_dict) + + params = extract_search_parameters_from_config(config) + self.assertEqual(params.radius, 7) + self.assertEqual(params.stamp_type, StampType.STAMP_MEDIAN) + self.assertEqual(params.do_filtering, True) + self.assertAlmostEqual(params.center_thresh, 0.05) + self.assertAlmostEqual(params.peak_offset_x, 1.5) + self.assertAlmostEqual(params.peak_offset_y, 3.5) + self.assertAlmostEqual(params.m20_limit, 50.0) + self.assertAlmostEqual(params.m02_limit, 51.0) + self.assertAlmostEqual(params.m11_limit, 1.0) + self.assertAlmostEqual(params.m10_limit, 2.0) + self.assertAlmostEqual(params.m01_limit, 3.0) + + # Test bad configurations + config.set("stamp_radius", -1) + self.assertRaises(ValueError, 
extract_search_parameters_from_config, config) + config.set("stamp_radius", 7) + + config.set("stamp_type", "broken") + self.assertRaises(ValueError, extract_search_parameters_from_config, config) + config.set("stamp_type", "median") + + config.set("peak_offset", [50.0]) + self.assertRaises(ValueError, extract_search_parameters_from_config, config) + config.set("peak_offset", [1.5, 3.5]) + + config.set("mom_lims", [50.0, 51.0, 1.0, 3.0]) + self.assertRaises(ValueError, extract_search_parameters_from_config, config) + config.set("mom_lims", [50.0, 51.0, 1.0, 2.0, 3.0]) + + @unittest.skipIf(not HAS_GPU, "Skipping test (no GPU detected)") + def test_get_coadds_and_filter(self): + image_count = 10 + ds = FakeDataSet( + 25, # width + 35, # height + image_count, # time steps + 1.0, # noise level + 0.5, # psf value + 1, # observations per day + True, # Use a fixed seed for testing + ) + + # Insert a single fake object with known parameters. + trj = make_trajectory(8, 7, 2.0, 1.0, flux=250.0) + ds.insert_object(trj) + + # Second Trajectory that isn't any good. + trj2 = make_trajectory(1, 1, 0.0, 0.0) + + # Third Trajectory that is close to good, but offset. + trj3 = make_trajectory(trj.x + 2, trj.y + 2, trj.vx, trj.vy) + + # Create a fourth Trajectory that is just close enough + trj4 = make_trajectory(trj.x + 1, trj.y + 1, trj.vx, trj.vy) + + # Create the ResultList. + keep = ResultList(ds.times) + keep.append_result(ResultRow(trj, image_count)) + keep.append_result(ResultRow(trj2, image_count)) + keep.append_result(ResultRow(trj3, image_count)) + keep.append_result(ResultRow(trj4, image_count)) + + # Create the stamp parameters we need. + config_dict = { + "center_thresh": 0.03, + "do_stamp_filter": True, + "mom_lims": [35.5, 35.5, 1.0, 1.0, 1.0], + "peak_offset": [1.5, 1.5], + "stamp_type": "cpp_mean", + "stamp_radius": 5, + } + config = SearchConfiguration.from_dict(config_dict) + + # Do the filtering. 
+ get_coadds_and_filter(keep, ds.stack, config, chunk_size=1, debug=False) + + # The check that the correct indices and number of stamps are saved. + self.assertEqual(keep.num_results(), 2) + self.assertEqual(keep.results[0].trajectory.x, trj.x) + self.assertEqual(keep.results[1].trajectory.x, trj.x + 1) + self.assertIsNotNone(keep.results[0].stamp) + self.assertIsNotNone(keep.results[1].stamp) + + def test_append_all_stamps(self): + image_count = 10 + ds = FakeDataSet( + 25, # width + 35, # height + image_count, # time steps + 1.0, # noise level + 0.5, # psf value + 1, # observations per day + True, # Use a fixed seed for testing + ) + + # Make a few results with different trajectories. + keep = ResultList(ds.times) + keep.append_result(ResultRow(make_trajectory(8, 7, 2.0, 1.0), image_count)) + keep.append_result(ResultRow(make_trajectory(10, 22, -2.0, -1.0), image_count)) + keep.append_result(ResultRow(make_trajectory(8, 7, -2.0, -1.0), image_count)) + + append_all_stamps(keep, ds.stack, 5) + for row in keep.results: + self.assertIsNotNone(row.all_stamps) + self.assertEqual(len(row.all_stamps), image_count) + for i in range(image_count): + self.assertEqual(np.shape(row.all_stamps[i])[0], 11) + self.assertEqual(np.shape(row.all_stamps[i])[1], 11) + if __name__ == "__main__": unittest.main() From cc2ea338d6d887d44099ee92fece97cad4c1ccc8 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Wed, 7 Feb 2024 15:21:22 -0500 Subject: [PATCH 23/27] Formatting --- src/kbmod/search/raw_image.cpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/kbmod/search/raw_image.cpp b/src/kbmod/search/raw_image.cpp index f4f40637f..019f18a85 100644 --- a/src/kbmod/search/raw_image.cpp +++ b/src/kbmod/search/raw_image.cpp @@ -116,11 +116,11 @@ RawImage RawImage::create_stamp(const Point& p, const int radius, const bool kee const int dim = radius * 2 + 1; Image stamp = Image::Constant(dim, dim, NO_DATA); - // 
Eigen gets uphappy if the stamp does not overlap at all. In this case, skip - // the computation and leave the entire stamp set to NO_DATA. + // Eigen gets uphappy if the stamp does not overlap at all. In this case, skip + // the computation and leave the entire stamp set to NO_DATA. Index idx = p.to_index(); - if ((idx.j + radius >= 0) && (idx.j - radius < (int)width) && - (idx.i + radius >= 0) && (idx.i - radius < (int)height)) { + if ((idx.j + radius >= 0) && (idx.j - radius < (int)width) && (idx.i + radius >= 0) && + (idx.i - radius < (int)height)) { // can't address this instance of non-uniform index handling with Point // and Index, because at a base level it adopts a different definition of // the pixel grid to coordinate system transformation. From 30759be71f6eda83481defb7e3b0618114e6acaa Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Wed, 7 Feb 2024 15:30:42 -0500 Subject: [PATCH 24/27] Remove unneeded import --- tests/test_configuration.py | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/test_configuration.py b/tests/test_configuration.py index da9f90761..7140352cd 100644 --- a/tests/test_configuration.py +++ b/tests/test_configuration.py @@ -7,7 +7,6 @@ from yaml import safe_load from kbmod.configuration import SearchConfiguration -from kbmod.search import StampParameters, StampType class test_configuration(unittest.TestCase): From 5cc08bd8dc0be90eebc56008cd8705a4e0467373 Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Wed, 7 Feb 2024 16:49:42 -0500 Subject: [PATCH 25/27] Fix typo --- src/kbmod/search/raw_image.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/kbmod/search/raw_image.cpp b/src/kbmod/search/raw_image.cpp index 019f18a85..739c576c8 100644 --- a/src/kbmod/search/raw_image.cpp +++ b/src/kbmod/search/raw_image.cpp @@ -116,7 +116,7 @@ RawImage RawImage::create_stamp(const Point& p, const int radius, const bool 
kee const int dim = radius * 2 + 1; Image stamp = Image::Constant(dim, dim, NO_DATA); - // Eigen gets uphappy if the stamp does not overlap at all. In this case, skip + // Eigen gets unhappy if the stamp does not overlap at all. In this case, skip // the computation and leave the entire stamp set to NO_DATA. Index idx = p.to_index(); if ((idx.j + radius >= 0) && (idx.j - radius < (int)width) && (idx.i + radius >= 0) && From 545d1073570635e518032dd37a09a8424f7131a8 Mon Sep 17 00:00:00 2001 From: Colin Orion Chandler Date: Wed, 7 Feb 2024 16:12:34 -0800 Subject: [PATCH 26/27] Region searching (#461) * Plot correction, clarifying text disable gridlines for the sky plotting * Create Region Searching Workbook.ipynb This contains the essence of Region Search for now. * Creating a structure for scratch notebooks Brainstorming, demos, and testing to share. * Update RegionSearchTesting.ipynb black --target-version py38 --line-length 110 is what works, but only if black was installed with [jupyter] * Update Region Searching Workbook.ipynb Consolidation into a single Pandas dataframe, Notebook cleanup, master function in preparation for a demo, TODO items added/updated, and a Next Steps added to the end. * Update Region Searching Workbook.ipynb Fixed broken/missing get_timestamps. Other minor fixes too. * Update Region Searching Workbook.ipynb Fixed hanging function with a pass. 
--- .../Region Searching Workbook.ipynb | 586 ++++++++++-------- 1 file changed, 311 insertions(+), 275 deletions(-) diff --git a/notebooks/region_search/Region Searching Workbook.ipynb b/notebooks/region_search/Region Searching Workbook.ipynb index 5d7e6da65..deb393ea1 100644 --- a/notebooks/region_search/Region Searching Workbook.ipynb +++ b/notebooks/region_search/Region Searching Workbook.ipynb @@ -5,7 +5,7 @@ "id": "d94d8d2b", "metadata": {}, "source": [ - "# Butler Interface for User\n", + "# Region Searching for KBMOD\n", "\n", "The point of this notebook is to do step-by-step exploration of the DEEP dataset that was first run through KBMOD for the first set of papers. That work was led by Hayden Smotherman, hence the reference to that name.\n", "\n", @@ -36,7 +36,7 @@ }, { "cell_type": "code", - "execution_count": 339, + "execution_count": 1, "id": "d0189084", "metadata": {}, "outputs": [], @@ -45,6 +45,7 @@ "import lsst\n", "import lsst.daf.butler as dafButler\n", "import os\n", + "import glob\n", "import time\n", "from matplotlib import pyplot as plt\n", "import progressbar\n", @@ -58,7 +59,7 @@ }, { "cell_type": "code", - "execution_count": 476, + "execution_count": 2, "id": "ceeec168", "metadata": {}, "outputs": [ @@ -82,7 +83,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 3, "id": "693492d4", "metadata": {}, "outputs": [], @@ -94,7 +95,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "id": "b13eb927", "metadata": {}, "outputs": [], @@ -127,7 +128,7 @@ }, { "cell_type": "code", - "execution_count": 465, + "execution_count": 5, "id": "e6a546f0", "metadata": {}, "outputs": [], @@ -157,7 +158,7 @@ }, { "cell_type": "code", - "execution_count": 466, + "execution_count": 6, "id": "3006e4fd", "metadata": {}, "outputs": [ @@ -175,7 +176,7 @@ }, { "cell_type": "code", - "execution_count": 468, + "execution_count": 7, "id": "b409c810", "metadata": {}, "outputs": [], @@ -234,7 +235,7 @@ }, { "cell_type": 
"code", - "execution_count": 473, + "execution_count": 8, "id": "dc9a4efc", "metadata": {}, "outputs": [ @@ -251,7 +252,7 @@ " 'PointingGroup023/imdiff_r']" ] }, - "execution_count": 473, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -263,7 +264,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 9, "id": "4537e06a", "metadata": {}, "outputs": [], @@ -298,7 +299,7 @@ }, { "cell_type": "code", - "execution_count": 169, + "execution_count": 10, "id": "47c8c37c", "metadata": {}, "outputs": [], @@ -369,24 +370,110 @@ }, { "cell_type": "code", - "execution_count": 170, + "execution_count": 11, "id": "b741015f", "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "100% (129 of 129) |######################| Elapsed Time: 0:02:28 Time: 0:02:28\n" - ] - }, { "name": "stdout", "output_type": "stream", "text": [ - "Saving 46 datasetTypes to /astro/users/coc123/kbmod_tmp/dataset_types.csv now...\n", - "CPU times: user 1min 57s, sys: 2.96 s, total: 2min\n", - "Wall time: 2min 28s\n" + "Recycling /astro/users/coc123/kbmod_tmp/dataset_types.csv as overwrite was False...\n", + "assembleCoadd_config,8\n", + "\n", + "assembleCoadd_log,268\n", + "\n", + "assembleCoadd_metadata,700\n", + "\n", + "cal_ref_cat,122856\n", + "\n", + "calexp,47403\n", + "\n", + "calexpBackground,47403\n", + "\n", + "calibrate_config,8\n", + "\n", + "calibrate_log,17961\n", + "\n", + "calibrate_metadata,47403\n", + "\n", + "characterizeImage_config,8\n", + "\n", + "characterizeImage_log,18290\n", + "\n", + "characterizeImage_metadata,47423\n", + "\n", + "deepCoadd,693\n", + "\n", + "deepCoadd_directWarp,167085\n", + "\n", + "deepCoadd_inputMap,693\n", + "\n", + "deepCoadd_psfMatchedWarp,167085\n", + "\n", + "deepDiff_diaSrc,47383\n", + "\n", + "deepDiff_diaSrc_schema,8\n", + "\n", + "deepDiff_differenceExp,47383\n", + "\n", + "deepDiff_warpedExp,29445\n", + "\n", + "gaia_DR1_v1,524283\n", + "\n", + 
"icExp,47423\n", + "\n", + "icExpBackground,47423\n", + "\n", + "icSrc,47423\n", + "\n", + "icSrc_schema,8\n", + "\n", + "imageDifference_config,8\n", + "\n", + "imageDifference_log,17942\n", + "\n", + "imageDifference_metadata,47383\n", + "\n", + "isr_config,8\n", + "\n", + "isr_log,18290\n", + "\n", + "isr_metadata,48422\n", + "\n", + "makeWarp_config,8\n", + "\n", + "makeWarp_log,64924\n", + "\n", + "makeWarp_metadata,167085\n", + "\n", + "overscanRaw,48422\n", + "\n", + "overscan_config,8\n", + "\n", + "overscan_log,18290\n", + "\n", + "overscan_metadata,48422\n", + "\n", + "packages,32\n", + "\n", + "postISRCCD,48422\n", + "\n", + "ps1_pv3_3pi_20170110,130924\n", + "\n", + "raw,48422\n", + "\n", + "skyMap,1\n", + "\n", + "src,47403\n", + "\n", + "srcMatch,47403\n", + "\n", + "src_schema,8\n", + "\n", + "Read 46 datasetTypes from disk.\n", + "CPU times: user 1.55 ms, sys: 1.26 ms, total: 2.81 ms\n", + "Wall time: 3.19 ms\n" ] } ], @@ -398,7 +485,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 12, "id": "6406f04c", "metadata": {}, "outputs": [ @@ -462,12 +549,12 @@ "\n", "print(f\"Across all collections, we see the following numbers by datasetType: \")\n", "for dt in datasetTypes:\n", - " print(f\"{datasetTypes[dt]!s:10} {dt.name}\")" + " print(f\"{datasetTypes[dt]!s:10} {dt}\")" ] }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 13, "id": "53a03c75", "metadata": {}, "outputs": [], @@ -492,7 +579,7 @@ }, { "cell_type": "code", - "execution_count": 608, + "execution_count": 14, "id": "c47e5588", "metadata": {}, "outputs": [], @@ -536,7 +623,7 @@ }, { "cell_type": "code", - "execution_count": 611, + "execution_count": 15, "id": "eb222e02", "metadata": {}, "outputs": [ @@ -544,8 +631,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 1.82 s, sys: 83.2 ms, total: 1.91 s\n", - "Wall time: 2.4 s\n" + "CPU times: user 2.23 s, sys: 122 ms, total: 2.35 s\n", + "Wall time: 2.87 s\n" ] } ], @@ 
-559,7 +646,7 @@ }, { "cell_type": "code", - "execution_count": 612, + "execution_count": 16, "id": "6e9462e1", "metadata": {}, "outputs": [ @@ -691,7 +778,7 @@ "[47383 rows x 3 columns]" ] }, - "execution_count": 612, + "execution_count": 16, "metadata": {}, "output_type": "execute_result" } @@ -702,7 +789,7 @@ }, { "cell_type": "code", - "execution_count": 610, + "execution_count": 17, "id": "e04e2f35", "metadata": {}, "outputs": [ @@ -720,7 +807,7 @@ }, { "cell_type": "code", - "execution_count": 559, + "execution_count": 18, "id": "08d5b443", "metadata": {}, "outputs": [ @@ -737,7 +824,7 @@ "visit_detector_region.RecordClass(instrument='DECam', detector=62, visit=946176, region=ConvexPolygon([UnitVector3d(0.9876086828694174, -0.13336028508776862, -0.08272922024438323), UnitVector3d(0.9873378171284917, -0.13332652431396907, -0.08595389916869185), UnitVector3d(0.9881047366097594, -0.12752395595185462, -0.08594573955553172), UnitVector3d(0.9883760335240734, -0.12755303452468866, -0.0827226676235914)]))" ] }, - "execution_count": 559, + "execution_count": 18, "metadata": {}, "output_type": "execute_result" } @@ -749,7 +836,7 @@ }, { "cell_type": "code", - "execution_count": 560, + "execution_count": 19, "id": "e28031c2", "metadata": {}, "outputs": [ @@ -759,7 +846,7 @@ "{instrument: 'DECam', detector: 62, visit: 946176}" ] }, - "execution_count": 560, + "execution_count": 19, "metadata": {}, "output_type": "execute_result" } @@ -771,7 +858,7 @@ }, { "cell_type": "code", - "execution_count": 561, + "execution_count": 20, "id": "761f3610", "metadata": {}, "outputs": [ @@ -794,7 +881,7 @@ }, { "cell_type": "code", - "execution_count": 562, + "execution_count": 21, "id": "5d6b2106", "metadata": {}, "outputs": [ @@ -804,7 +891,7 @@ 
"b'p\\xddnE\\x86}\\x9a\\xef?\\x0f\\xc3\\x84\\'\\xf3\\x11\\xc1\\xbf\\x80\\x8a_\\xff\\xbd-\\xb5\\xbf\\x04xUzE\\x98\\xef?\\x94\\x15\\xcf\\xf2\\xd7\\x10\\xc1\\xbf\\x9d\\xa9\\xe4!\\x13\\x01\\xb6\\xbf\\x1d_\\x18\\xd3\\x8d\\x9e\\xef?\\x80\\x87\"z\\xb4R\\xc0\\xbff\\x1d\\x9f<\\x8a\\x00\\xb6\\xbf\\xe4Z\\x84\\xc6\\xc6\\xa0\\xef?\\x1f\\x01\\xe5g\\xa8S\\xc0\\xbf\\xba\\xc9\\x14\\x10P-\\xb5\\xbf'" ] }, - "execution_count": 562, + "execution_count": 21, "metadata": {}, "output_type": "execute_result" } @@ -816,7 +903,7 @@ }, { "cell_type": "code", - "execution_count": 563, + "execution_count": 22, "id": "aa653a8b", "metadata": {}, "outputs": [ @@ -826,7 +913,7 @@ "False" ] }, - "execution_count": 563, + "execution_count": 22, "metadata": {}, "output_type": "execute_result" } @@ -849,7 +936,7 @@ }, { "cell_type": "code", - "execution_count": 587, + "execution_count": 23, "id": "acda18f4", "metadata": {}, "outputs": [ @@ -857,8 +944,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 323 ms, sys: 68 ms, total: 391 ms\n", - "Wall time: 582 ms\n" + "CPU times: user 544 ms, sys: 41.7 ms, total: 586 ms\n", + "Wall time: 649 ms\n" ] } ], @@ -874,7 +961,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 24, "id": "bb076b4b", "metadata": {}, "outputs": [], @@ -897,7 +984,7 @@ }, { "cell_type": "code", - "execution_count": 564, + "execution_count": 25, "id": "0228bb4d", "metadata": {}, "outputs": [], @@ -925,7 +1012,7 @@ }, { "cell_type": "code", - "execution_count": 613, + "execution_count": 26, "id": "6c3bb244", "metadata": {}, "outputs": [ @@ -935,8 +1022,8 @@ "text": [ "Found DECam. 
Adding to \"desired_instruments\" now.\n", "WARNING: we are not iterating over all rows to find instruments, just taking the first one.\n", - "CPU times: user 140 ms, sys: 19 ms, total: 159 ms\n", - "Wall time: 199 ms\n" + "CPU times: user 1.27 s, sys: 285 ms, total: 1.56 s\n", + "Wall time: 1.61 s\n" ] } ], @@ -957,7 +1044,7 @@ }, { "cell_type": "code", - "execution_count": 614, + "execution_count": 27, "id": "dfc37b54", "metadata": {}, "outputs": [ @@ -965,8 +1052,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 875 ms, sys: 108 ms, total: 983 ms\n", - "Wall time: 1.02 s\n" + "CPU times: user 1.16 s, sys: 135 ms, total: 1.3 s\n", + "Wall time: 1.33 s\n" ] } ], @@ -982,7 +1069,7 @@ }, { "cell_type": "code", - "execution_count": 529, + "execution_count": 28, "id": "789f1d42", "metadata": {}, "outputs": [ @@ -992,7 +1079,7 @@ "62" ] }, - "execution_count": 529, + "execution_count": 28, "metadata": {}, "output_type": "execute_result" } @@ -1003,7 +1090,7 @@ }, { "cell_type": "code", - "execution_count": 530, + "execution_count": 29, "id": "351e8d03", "metadata": {}, "outputs": [ @@ -1013,7 +1100,7 @@ "'VR'" ] }, - "execution_count": 530, + "execution_count": 29, "metadata": {}, "output_type": "execute_result" } @@ -1024,17 +1111,17 @@ }, { "cell_type": "code", - "execution_count": 531, + "execution_count": 30, "id": "1c1e5431", "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "" + "" ] }, - "execution_count": 531, + "execution_count": 30, "metadata": {}, "output_type": "execute_result" }, @@ -1056,7 +1143,7 @@ }, { "cell_type": "code", - "execution_count": 532, + "execution_count": 31, "id": "ba1b7ab6", "metadata": {}, "outputs": [ @@ -1069,7 +1156,7 @@ "Pixel Scale: 0.262593 arcsec/pixel" ] }, - "execution_count": 532, + "execution_count": 31, "metadata": {}, "output_type": "execute_result" } @@ -1081,7 +1168,7 @@ }, { "cell_type": "code", - "execution_count": 503, + "execution_count": 32, "id": "4270995e", "metadata": { 
"scrolled": true @@ -1311,7 +1398,7 @@ }, { "cell_type": "code", - "execution_count": 272, + "execution_count": 33, "id": "7bbc916e", "metadata": {}, "outputs": [], @@ -1322,7 +1409,7 @@ }, { "cell_type": "code", - "execution_count": 567, + "execution_count": 34, "id": "e0f8f8f9", "metadata": {}, "outputs": [], @@ -1404,7 +1491,7 @@ }, { "cell_type": "code", - "execution_count": 628, + "execution_count": 35, "id": "6dd2ea6a", "metadata": {}, "outputs": [ @@ -1413,8 +1500,8 @@ "output_type": "stream", "text": [ "Recycled 47383 paths from /astro/users/coc123/kbmod_tmp/uri_cache.lst as overwrite was False.\n", - "CPU times: user 45 ms, sys: 32.1 ms, total: 77.1 ms\n", - "Wall time: 76.7 ms\n" + "CPU times: user 32 ms, sys: 21.5 ms, total: 53.5 ms\n", + "Wall time: 53.7 ms\n" ] } ], @@ -1435,7 +1522,7 @@ }, { "cell_type": "code", - "execution_count": 617, + "execution_count": 36, "id": "eae8d366", "metadata": {}, "outputs": [ @@ -1445,7 +1532,7 @@ "'file:///epyc/users/smotherh/DEEP/PointingGroups/butler-repo/PointingGroup021/imdiff_r/20210723T174135Z/deepDiff_differenceExp/20190927/VR/VR_DECam_c0007_6300.0_2600.0/898286/deepDiff_differenceExp_DECam_VR_VR_DECam_c0007_6300_0_2600_0_898286_S29_PointingGroup021_imdiff_r_20210723T174135Z.fits'" ] }, - "execution_count": 617, + "execution_count": 36, "metadata": {}, "output_type": "execute_result" } @@ -1466,7 +1553,7 @@ }, { "cell_type": "code", - "execution_count": 619, + "execution_count": 37, "id": "df7ff31f", "metadata": {}, "outputs": [ @@ -1475,8 +1562,8 @@ "output_type": "stream", "text": [ "0 DateTime(\"2019-09-27T00:20:59.932016000\", TAI) 120.0 (351.3806941054, -5.2403083277)\n", - "CPU times: user 126 ms, sys: 12 ms, total: 138 ms\n", - "Wall time: 175 ms\n" + "CPU times: user 93.4 ms, sys: 11.5 ms, total: 105 ms\n", + "Wall time: 145 ms\n" ] } ], @@ -1492,7 +1579,7 @@ }, { "cell_type": "code", - "execution_count": 572, + "execution_count": 38, "id": "3ccadfaa", "metadata": {}, "outputs": [ @@ -1502,7 +1589,7 @@ 
"lsst.daf.base.dateTime.dateTime.DateTime" ] }, - "execution_count": 572, + "execution_count": 38, "metadata": {}, "output_type": "execute_result" } @@ -1514,7 +1601,7 @@ }, { "cell_type": "code", - "execution_count": 573, + "execution_count": 39, "id": "d73d8119", "metadata": {}, "outputs": [ @@ -1524,73 +1611,77 @@ "'2019-09-27T00:20:22.932'" ] }, - "execution_count": 573, + "execution_count": 39, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Let's convert to a plain string, UTC (handles 37 s offset).\n", - "t = Time(testing, format=\"isot\", scale=\"tai\")\n", + "t = Time(str(visitInfo.date).split('\"')[1], format=\"isot\", scale=\"tai\")\n", "str(t.utc)" ] }, { "cell_type": "code", - "execution_count": 574, - "id": "89822691", + "execution_count": 40, + "id": "4cb53994", "metadata": {}, "outputs": [], "source": [ - "def getTimestamps(dataIds, overwrite=False):\n", - " \"\"\"Get timestamps for a bunch of dataIds.\n", - " Convert the LSST/Butler TAI to UTC in the process.\n", - " Do this all in a chunked, multiprocessing way.\n", - " Takes about 3 minutes as of 2/1/2024 (Hayden DEEP).\n", - " BUT if we have the values cached, just read those instead, unless overwrite is True.\n", - " 2/1/2024 COC\n", - " \"\"\"\n", - " # thank you ChatGPT 4 for helping parallelize\n", + "# New parallel version with order-preservation redone 2/7/2024 COC\n", "\n", - " timestamps = []\n", "\n", - " import glob\n", + "# Define get_timestamps at the top level of your module\n", + "def get_timestamps(dataIds_chunk, repo_path, desired_collections):\n", + " chunked_data = []\n", + " butler = dafButler.Butler(repo_path)\n", + " for dataId in dataIds_chunk:\n", + " try:\n", + " visitInfo = butler.get(\"calexp.visitInfo\", dataId=dataId, collections=desired_collections)\n", + " t = Time(str(visitInfo.date).split('\"')[1], format=\"isot\", scale=\"tai\")\n", + " tutc = str(t.utc)\n", + " chunked_data.append(tutc)\n", + " except Exception as e:\n", + " print(f\"Failed 
to retrieve timestamp for dataId {dataId}: {e}\")\n", + " return chunked_data\n", "\n", - " cache_file = f\"{basedir}/vdr_timestamps.lst\"\n", "\n", - " cache_file_exists = False\n", - " if len(glob.glob(cache_file)) > 0:\n", - " cache_file_exists = True\n", + "def getTimestamps(dataIds, overwrite=False):\n", + " timestamps = []\n", + " cache_file = f\"{basedir}/vdr_timestamps.lst\"\n", "\n", - " if overwrite == False and cache_file_exists == True:\n", - " print(f\"Overwrite is False, so we will read the timestamps from file now...\")\n", + " if not overwrite and glob.glob(cache_file):\n", + " print(\"Overwrite is False, so we will read the timestamps from file now...\")\n", " with open(cache_file, \"r\") as f:\n", - " for line in f:\n", - " timestamps.append(line.strip())\n", + " timestamps = [line.strip() for line in f]\n", " print(f\"Recycled {len(timestamps)} from {cache_file}.\")\n", " return timestamps\n", "\n", - " if overwrite or not cache_file_exists:\n", - " timestamps = [] # Re-initialize timestamps here to ensure it's fresh\n", + " def chunked_dataIds(dataIds, chunk_size=200):\n", + " for i in range(0, len(dataIds), chunk_size):\n", + " yield dataIds[i : i + chunk_size]\n", "\n", - " with ProcessPoolExecutor() as executor:\n", - " dataId_chunks = list(chunked_dataIds(dataIds))\n", - " # Initialize progress bar\n", - " with progressbar.ProgressBar(max_value=len(dataId_chunks)) as bar:\n", - " # Use map for preserving order and simplifying the code\n", - " results = executor.map(get_timestamps, dataId_chunks)\n", + " dataId_chunks = list(chunked_dataIds(dataIds))\n", + "\n", + " with ProcessPoolExecutor() as executor:\n", + " # Adjust the executor.map call to pass additional arguments to get_timestamps\n", + " result_chunks = list(\n", + " executor.map(\n", + " get_timestamps,\n", + " dataId_chunks,\n", + " [repo_path] * len(dataId_chunks),\n", + " [desired_collections] * len(dataId_chunks),\n", + " )\n", + " )\n", "\n", - " # Process results and maintain 
the order\n", - " for i, chunk_result in enumerate(results):\n", - " timestamps.extend(chunk_result) # Correctly extend with the result of each future\n", - " bar.update(i)\n", + " timestamps = [timestamp for chunk in result_chunks for timestamp in chunk]\n", "\n", - " # Write to cache if necessary\n", - " if overwrite or not cache_file_exists:\n", - " with open(cache_file, \"w\") as f:\n", - " for ts in timestamps:\n", - " print(ts, file=f)\n", - " print(f\"Wrote {len(timestamps)} lines to {cache_file} for future use.\")\n", + " if overwrite or not glob.glob(cache_file):\n", + " with open(cache_file, \"w\") as f:\n", + " for ts in timestamps:\n", + " print(ts, file=f)\n", + " print(f\"Wrote {len(timestamps)} lines to {cache_file} for future use.\")\n", "\n", " print(f\"Obtained {len(timestamps)} timestamps.\")\n", " return timestamps" @@ -1598,32 +1689,7 @@ }, { "cell_type": "code", - "execution_count": 620, - "id": "5ea2f086", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "'2019-09-27T00:20:22.932'" - ] - }, - "execution_count": 620, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "# Double-check that we can convert Butler timestamp (TAI) to UTC string\n", - "visitInfo = butler.get(\"calexp.visitInfo\", dataId=df[\"data_id\"].iloc()[0], collections=desired_collections)\n", - "t = Time(str(visitInfo.date).split('\"')[1], format=\"isot\", scale=\"tai\")\n", - "tutc = str(t.utc)\n", - "tutc" - ] - }, - { - "cell_type": "code", - "execution_count": 621, + "execution_count": 41, "id": "7e0d33c0", "metadata": {}, "outputs": [ @@ -1633,8 +1699,8 @@ "text": [ "Overwrite is False, so we will read the timestamps from file now...\n", "Recycled 47383 from /astro/users/coc123/kbmod_tmp/vdr_timestamps.lst.\n", - "CPU times: user 24.1 ms, sys: 9.07 ms, total: 33.2 ms\n", - "Wall time: 30.1 ms\n" + "CPU times: user 16.8 ms, sys: 5.06 ms, total: 21.9 ms\n", + "Wall time: 21.4 ms\n" ] } ], @@ -1647,7 +1713,7 @@ }, { "cell_type": 
"code", - "execution_count": 622, + "execution_count": 42, "id": "adddf1e4", "metadata": {}, "outputs": [ @@ -1668,7 +1734,7 @@ "Name: ut, Length: 47383, dtype: object" ] }, - "execution_count": 622, + "execution_count": 42, "metadata": {}, "output_type": "execute_result" } @@ -1679,65 +1745,10 @@ }, { "cell_type": "code", - "execution_count": 364, + "execution_count": 43, "id": "a789a331", "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "0 : 2019-09-27T00:20:22.932 for {instrument: 'DECam', detector: 1, visit: 898286}. Dict had: 2019-09-27\n", - "1000 : 2019-09-27T02:24:03.066 for {instrument: 'DECam', detector: 12, visit: 898336}. Dict had: 2019-08-29\n", - "2000 : 2019-09-27T00:32:44.405 for {instrument: 'DECam', detector: 23, visit: 898291}. Dict had: 2019-08-29\n", - "3000 : 2019-09-27T02:36:24.497 for {instrument: 'DECam', detector: 33, visit: 898341}. Dict had: 2019-08-29\n", - "4000 : 2019-09-27T00:45:05.306 for {instrument: 'DECam', detector: 44, visit: 898296}. Dict had: 2019-08-29\n", - "5000 : 2019-09-27T02:51:16.295 for {instrument: 'DECam', detector: 54, visit: 898347}. Dict had: 2019-08-29\n", - "6000 : 2019-08-29T07:25:55.714 for {instrument: 'DECam', detector: 4, visit: 891512}. Dict had: 2019-08-30\n", - "7000 : 2019-08-29T06:36:25.673 for {instrument: 'DECam', detector: 14, visit: 891492}. Dict had: 2019-08-30\n", - "8000 : 2019-08-29T05:46:48.259 for {instrument: 'DECam', detector: 24, visit: 891472}. Dict had: 2019-08-29\n", - "9000 : 2019-08-29T09:11:52.823 for {instrument: 'DECam', detector: 33, visit: 891554}. Dict had: 2020-10-19\n", - "10000: 2019-08-29T08:24:43.475 for {instrument: 'DECam', detector: 43, visit: 891535}. Dict had: 2020-10-19\n", - "11000: 2019-08-29T07:39:44.133 for {instrument: 'DECam', detector: 53, visit: 891517}. Dict had: 2020-10-19\n", - "12000: 2020-10-19T03:57:38.040 for {instrument: 'DECam', detector: 1, visit: 946776}. 
Dict had: 2020-10-19\n", - "13000: 2020-10-19T03:55:07.913 for {instrument: 'DECam', detector: 13, visit: 946775}. Dict had: 2020-10-19\n", - "14000: 2020-10-19T03:52:39.901 for {instrument: 'DECam', detector: 24, visit: 946774}. Dict had: 2020-10-19\n", - "15000: 2020-10-19T03:50:11.828 for {instrument: 'DECam', detector: 35, visit: 946773}. Dict had: 2019-09-27\n", - "16000: 2020-10-19T03:47:43.087 for {instrument: 'DECam', detector: 46, visit: 946772}. Dict had: 2019-09-27\n", - "17000: 2020-10-19T03:45:14.564 for {instrument: 'DECam', detector: 57, visit: 946771}. Dict had: 2019-09-27\n", - "18000: 2019-08-30T07:36:47.123 for {instrument: 'DECam', detector: 7, visit: 891898}. Dict had: 2019-09-27\n", - "19000: 2019-08-30T07:11:50.193 for {instrument: 'DECam', detector: 17, visit: 891888}. Dict had: 2019-09-27\n", - "20000: 2019-08-30T06:47:05.343 for {instrument: 'DECam', detector: 27, visit: 891878}. Dict had: 2019-08-30\n", - "21000: 2019-08-30T06:22:19.105 for {instrument: 'DECam', detector: 37, visit: 891868}. Dict had: 2019-08-30\n", - "22000: 2019-08-30T05:57:29.152 for {instrument: 'DECam', detector: 47, visit: 891858}. Dict had: 2019-08-30\n", - "23000: 2019-08-30T05:32:32.635 for {instrument: 'DECam', detector: 57, visit: 891848}. Dict had: 2019-08-30\n", - "24000: 2019-09-28T01:46:11.541 for {instrument: 'DECam', detector: 6, visit: 898736}. Dict had: 2019-09-28\n", - "25000: 2019-09-28T03:00:31.172 for {instrument: 'DECam', detector: 16, visit: 898766}. Dict had: 2019-09-28\n", - "26000: 2019-09-28T00:17:03.748 for {instrument: 'DECam', detector: 27, visit: 898700}. Dict had: 2019-09-28\n", - "27000: 2019-09-28T01:31:18.723 for {instrument: 'DECam', detector: 37, visit: 898730}. Dict had: 2019-09-28\n", - "28000: 2019-09-28T02:45:39.745 for {instrument: 'DECam', detector: 47, visit: 898760}. Dict had: 2019-09-28\n", - "29000: 2019-09-28T04:00:09.666 for {instrument: 'DECam', detector: 57, visit: 898790}. 
Dict had: 2019-08-28\n", - "30000: 2019-08-28T06:43:48.523 for {instrument: 'DECam', detector: 7, visit: 891114}. Dict had: 2019-08-28\n", - "31000: 2019-08-28T05:29:20.494 for {instrument: 'DECam', detector: 17, visit: 891084}. Dict had: 2019-08-28\n", - "32000: 2019-08-28T08:31:09.143 for {instrument: 'DECam', detector: 26, visit: 891157}. Dict had: 2019-08-28\n", - "33000: 2019-08-28T07:21:26.793 for {instrument: 'DECam', detector: 36, visit: 891129}. Dict had: 2019-08-28\n", - "34000: 2019-08-28T06:06:34.210 for {instrument: 'DECam', detector: 46, visit: 891099}. Dict had: 2019-08-28\n", - "35000: 2019-08-28T09:08:44.560 for {instrument: 'DECam', detector: 55, visit: 891172}. Dict had: 2019-09-28\n", - "36000: 2019-09-29T00:19:06.349 for {instrument: 'DECam', detector: 5, visit: 899020}. Dict had: 2019-09-29\n", - "37000: 2019-09-29T01:58:29.441 for {instrument: 'DECam', detector: 15, visit: 899060}. Dict had: 2019-09-29\n", - "38000: 2019-09-29T03:37:44.590 for {instrument: 'DECam', detector: 25, visit: 899100}. Dict had: 2019-09-29\n", - "39000: 2019-09-29T01:18:42.912 for {instrument: 'DECam', detector: 36, visit: 899044}. Dict had: 2019-09-29\n", - "40000: 2019-09-29T02:58:02.739 for {instrument: 'DECam', detector: 46, visit: 899084}. Dict had: 2019-09-29\n", - "41000: 2019-09-29T00:38:58.257 for {instrument: 'DECam', detector: 57, visit: 899028}. Dict had: 2019-09-29\n", - "42000: 2020-10-17T03:45:59.925 for {instrument: 'DECam', detector: 6, visit: 946166}. Dict had: 2020-10-17\n", - "43000: 2020-10-17T01:26:44.472 for {instrument: 'DECam', detector: 17, visit: 946110}. Dict had: 2020-10-17\n", - "44000: 2020-10-17T03:06:21.338 for {instrument: 'DECam', detector: 27, visit: 946150}. Dict had: 2020-10-17\n", - "45000: 2020-10-17T00:46:58.038 for {instrument: 'DECam', detector: 38, visit: 946094}. Dict had: 2020-10-17\n", - "46000: 2020-10-17T02:26:33.210 for {instrument: 'DECam', detector: 48, visit: 946134}. 
Dict had: 2020-10-17\n", - "47000: 2020-10-17T04:05:48.949 for {instrument: 'DECam', detector: 58, visit: 946174}. Dict had: 2020-10-17\n" - ] - } - ], + "outputs": [], "source": [ "# This is for coming back to later to make sure the stamps line up\n", "# IGNORE FOR NOW 2/6/2024 COC\n", @@ -1770,7 +1781,7 @@ }, { "cell_type": "code", - "execution_count": 578, + "execution_count": 44, "id": "e45d7199", "metadata": {}, "outputs": [], @@ -1793,7 +1804,7 @@ }, { "cell_type": "code", - "execution_count": 579, + "execution_count": 45, "id": "9b278b50", "metadata": {}, "outputs": [ @@ -1806,7 +1817,7 @@ " (352.64644359666477, -4.7450820235469715)]" ] }, - "execution_count": 579, + "execution_count": 45, "metadata": {}, "output_type": "execute_result" } @@ -1819,7 +1830,7 @@ }, { "cell_type": "code", - "execution_count": 580, + "execution_count": 46, "id": "b37bfe47", "metadata": {}, "outputs": [], @@ -1842,7 +1853,7 @@ }, { "cell_type": "code", - "execution_count": 581, + "execution_count": 47, "id": "ef329736", "metadata": {}, "outputs": [ @@ -1853,7 +1864,7 @@ " (-4.930880058593892, -4.7450820235469715))" ] }, - "execution_count": 581, + "execution_count": 47, "metadata": {}, "output_type": "execute_result" } @@ -1876,7 +1887,7 @@ }, { "cell_type": "code", - "execution_count": 582, + "execution_count": 48, "id": "4c89be9e", "metadata": {}, "outputs": [], @@ -1895,7 +1906,7 @@ }, { "cell_type": "code", - "execution_count": 182, + "execution_count": 49, "id": "8e1e764c", "metadata": {}, "outputs": [ @@ -1905,18 +1916,18 @@ "(352.477974357993, -4.837981041070432)" ] }, - "execution_count": 182, + "execution_count": 49, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "getCenterRaDec(tmpref.region)" + "getCenterRaDec(example_vdr_ref.region)" ] }, { "cell_type": "code", - "execution_count": 624, + "execution_count": 50, "id": "8e54db29", "metadata": {}, "outputs": [ @@ -1924,8 +1935,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: 
user 363 ms, sys: 19 ms, total: 382 ms\n", - "Wall time: 379 ms\n" + "CPU times: user 403 ms, sys: 15.8 ms, total: 419 ms\n", + "Wall time: 419 ms\n" ] } ], @@ -1936,7 +1947,7 @@ }, { "cell_type": "code", - "execution_count": 625, + "execution_count": 51, "id": "64908868", "metadata": {}, "outputs": [ @@ -1946,7 +1957,7 @@ "47383" ] }, - "execution_count": 625, + "execution_count": 51, "metadata": {}, "output_type": "execute_result" } @@ -1957,7 +1968,7 @@ }, { "cell_type": "code", - "execution_count": 626, + "execution_count": 52, "id": "625de417", "metadata": {}, "outputs": [ @@ -1967,7 +1978,7 @@ "(351.0694028401149, -4.336598368890197)" ] }, - "execution_count": 626, + "execution_count": 52, "metadata": {}, "output_type": "execute_result" } @@ -1978,7 +1989,7 @@ }, { "cell_type": "code", - "execution_count": 627, + "execution_count": 53, "id": "67b57215", "metadata": {}, "outputs": [ @@ -1986,17 +1997,17 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 1.2 s, sys: 26 ms, total: 1.23 s\n", - "Wall time: 1.22 s\n" + "CPU times: user 1.62 s, sys: 71.3 ms, total: 1.69 s\n", + "Wall time: 1.72 s\n" ] }, { "data": { "text/plain": [ - "" + "" ] }, - "execution_count": 627, + "execution_count": 53, "metadata": {}, "output_type": "execute_result" }, @@ -2035,7 +2046,7 @@ }, { "cell_type": "code", - "execution_count": 554, + "execution_count": 54, "id": "c2dc4e1a", "metadata": {}, "outputs": [ @@ -2045,7 +2056,7 @@ "{instrument: 'DECam', detector: 1, visit: 898286}" ] }, - "execution_count": 554, + "execution_count": 54, "metadata": {}, "output_type": "execute_result" } @@ -2057,17 +2068,17 @@ }, { "cell_type": "code", - "execution_count": 435, + "execution_count": 55, "id": "580ac4ed", "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "" + "" ] }, - "execution_count": 435, + "execution_count": 55, "metadata": {}, "output_type": "execute_result" }, @@ -2093,7 +2104,7 @@ }, { "cell_type": "code", - "execution_count": 237, + 
"execution_count": 56, "id": "6ee544b8", "metadata": {}, "outputs": [], @@ -2116,7 +2127,7 @@ }, { "cell_type": "code", - "execution_count": 589, + "execution_count": 57, "id": "2c770982", "metadata": {}, "outputs": [], @@ -2162,7 +2173,7 @@ }, { "cell_type": "code", - "execution_count": 202, + "execution_count": 58, "id": "2fcdd8b3", "metadata": {}, "outputs": [], @@ -2203,7 +2214,7 @@ }, { "cell_type": "code", - "execution_count": 204, + "execution_count": 59, "id": "c0916372", "metadata": {}, "outputs": [ @@ -2220,18 +2231,18 @@ "(189361, 1895.111766130883)" ] }, - "execution_count": 204, + "execution_count": 59, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "getHTMstuff(vdr_centers[0][0], vdr_centers[0][1], verbose=True)" + "getHTMstuff(df[\"center_coord\"].iloc()[0][0], df[\"center_coord\"].iloc()[0][1], verbose=True)" ] }, { "cell_type": "code", - "execution_count": 588, + "execution_count": 60, "id": "47c447c5", "metadata": {}, "outputs": [ @@ -2270,7 +2281,7 @@ }, { "cell_type": "code", - "execution_count": 441, + "execution_count": 61, "id": "048e38e1", "metadata": {}, "outputs": [], @@ -2349,7 +2360,7 @@ }, { "cell_type": "code", - "execution_count": 442, + "execution_count": 62, "id": "25710a99", "metadata": {}, "outputs": [ @@ -2358,8 +2369,8 @@ "output_type": "stream", "text": [ "Recycling /astro/users/coc123/kbmod_tmp/overlapping_sets.pickle as overwrite=False.\n", - "CPU times: user 173 ms, sys: 22.1 ms, total: 195 ms\n", - "Wall time: 192 ms\n" + "CPU times: user 425 ms, sys: 134 ms, total: 559 ms\n", + "Wall time: 559 ms\n" ] } ], @@ -2374,7 +2385,7 @@ }, { "cell_type": "code", - "execution_count": 590, + "execution_count": 63, "id": "5f2d5a03", "metadata": {}, "outputs": [ @@ -2390,9 +2401,17 @@ "print(f\"There are {len(overlapping_sets.keys())} discrete chip-level pointings.\") # should be 488" ] }, + { + "cell_type": "markdown", + "id": "4e362e41", + "metadata": {}, + "source": [ + "#### Exploring the overlapping_sets" + ] + 
}, { "cell_type": "code", - "execution_count": 591, + "execution_count": 64, "id": "9ed24e28", "metadata": {}, "outputs": [ @@ -2400,17 +2419,17 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 503 ms, sys: 24.9 ms, total: 527 ms\n", - "Wall time: 526 ms\n" + "CPU times: user 481 ms, sys: 18 ms, total: 499 ms\n", + "Wall time: 503 ms\n" ] }, { "data": { "text/plain": [ - "" + "" ] }, - "execution_count": 591, + "execution_count": 64, "metadata": {}, "output_type": "execute_result" }, @@ -2443,7 +2462,7 @@ }, { "cell_type": "code", - "execution_count": 594, + "execution_count": 65, "id": "55ffd374", "metadata": {}, "outputs": [ @@ -2453,7 +2472,7 @@ "'2019-09-27T00:20:22.932'" ] }, - "execution_count": 594, + "execution_count": 65, "metadata": {}, "output_type": "execute_result" } @@ -2464,7 +2483,7 @@ }, { "cell_type": "code", - "execution_count": 595, + "execution_count": 66, "id": "fcd39c41", "metadata": {}, "outputs": [ @@ -2472,15 +2491,15 @@ "name": "stderr", "output_type": "stream", "text": [ - ":19: MatplotlibDeprecationWarning: The get_cmap function was deprecated in Matplotlib 3.7 and will be removed two minor releases later. Use ``matplotlib.colormaps[name]`` or ``matplotlib.colormaps.get_cmap(obj)`` instead.\n" + ":17: MatplotlibDeprecationWarning: The get_cmap function was deprecated in Matplotlib 3.7 and will be removed two minor releases later. 
Use ``matplotlib.colormaps[name]`` or ``matplotlib.colormaps.get_cmap(obj)`` instead.\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 6.24 s, sys: 526 ms, total: 6.77 s\n", - "Wall time: 6.24 s\n" + "CPU times: user 9.24 s, sys: 745 ms, total: 9.98 s\n", + "Wall time: 9.51 s\n" ] }, { @@ -2536,19 +2555,19 @@ }, { "cell_type": "code", - "execution_count": 596, + "execution_count": 67, "id": "418c97ee", "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "Index(['data_id', 'region', 'detector', 'uri', 'center_coord', 'ut',\n", + "Index(['data_id', 'region', 'detector', 'uri', 'ut', 'center_coord',\n", " 'ut_datetime'],\n", " dtype='object')" ] }, - "execution_count": 596, + "execution_count": 67, "metadata": {}, "output_type": "execute_result" } @@ -2559,7 +2578,7 @@ }, { "cell_type": "code", - "execution_count": 597, + "execution_count": 68, "id": "d06ed515", "metadata": {}, "outputs": [ @@ -2576,7 +2595,7 @@ " datetime.date(2020, 10, 19)]" ] }, - "execution_count": 597, + "execution_count": 68, "metadata": {}, "output_type": "execute_result" } @@ -2597,7 +2616,7 @@ }, { "cell_type": "code", - "execution_count": 598, + "execution_count": 69, "id": "58158f47", "metadata": {}, "outputs": [ @@ -2608,13 +2627,13 @@ "region ConvexPolygon([UnitVector3d(0.9847372525065534...\n", "detector 1\n", "uri file:///epyc/users/smotherh/DEEP/PointingGroup...\n", - "center_coord (351.0694028401149, -4.336598368890197)\n", "ut 2019-09-27T00:20:22.932\n", + "center_coord (351.0694028401149, -4.336598368890197)\n", "ut_datetime 2019-09-27 00:20:22.932000\n", "Name: 0, dtype: object" ] }, - "execution_count": 598, + "execution_count": 69, "metadata": {}, "output_type": "execute_result" } @@ -2625,7 +2644,7 @@ }, { "cell_type": "code", - "execution_count": 599, + "execution_count": 70, "id": "2ff625e7", "metadata": {}, "outputs": [ @@ -2635,7 +2654,7 @@ "datetime.date(2019, 9, 27)" ] }, - "execution_count": 599, + "execution_count": 70, "metadata": 
{}, "output_type": "execute_result" } @@ -2646,7 +2665,7 @@ }, { "cell_type": "code", - "execution_count": 600, + "execution_count": 71, "id": "c3b48b13", "metadata": {}, "outputs": [ @@ -2656,7 +2675,7 @@ "(351.0694028401149, -4.336598368890197)" ] }, - "execution_count": 600, + "execution_count": 71, "metadata": {}, "output_type": "execute_result" } @@ -2667,7 +2686,7 @@ }, { "cell_type": "code", - "execution_count": 601, + "execution_count": 72, "id": "16506478", "metadata": {}, "outputs": [ @@ -2677,7 +2696,7 @@ "6267" ] }, - "execution_count": 601, + "execution_count": 72, "metadata": {}, "output_type": "execute_result" } @@ -2690,7 +2709,7 @@ }, { "cell_type": "code", - "execution_count": 603, + "execution_count": 73, "id": "166c9137", "metadata": {}, "outputs": [ @@ -2698,8 +2717,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 933 ms, sys: 33 ms, total: 966 ms\n", - "Wall time: 962 ms\n" + "CPU times: user 1.03 s, sys: 19 ms, total: 1.05 s\n", + "Wall time: 1.06 s\n" ] }, { @@ -2794,6 +2813,22 @@ "del tmpdf" ] }, + { + "cell_type": "code", + "execution_count": 77, + "id": "bfb23aef", + "metadata": {}, + "outputs": [], + "source": [ + "def ra_dec_search_overlapping_sets(df, overlapping_sets):\n", + " \"\"\"\n", + " 2/6/2024 COC\n", + " Implementing an extremely basic (RA, Dec) query functionality.\n", + " This will work within the overlapping_sets framework.\n", + " \"\"\"\n", + " pass" + ] + }, { "cell_type": "markdown", "id": "337ceedc", @@ -2807,7 +2842,7 @@ }, { "cell_type": "code", - "execution_count": 634, + "execution_count": 75, "id": "fccdee6b", "metadata": {}, "outputs": [], @@ -2823,6 +2858,7 @@ " import lsst\n", " import lsst.daf.butler as dafButler\n", " import os\n", + " import glob\n", " import time\n", " from matplotlib import pyplot as plt\n", " import progressbar\n", @@ -2869,7 +2905,7 @@ }, { "cell_type": "code", - "execution_count": 638, + "execution_count": 76, "id": "cf221f77", "metadata": {}, "outputs": [ @@ 
-2885,8 +2921,8 @@ "Overwrite is False, so we will read the timestamps from file now...\n", "Recycled 47383 from /astro/users/coc123/kbmod_tmp/vdr_timestamps.lst.\n", "Recycling /astro/users/coc123/kbmod_tmp/overlapping_sets.pickle as overwrite=False.\n", - "CPU times: user 3.91 s, sys: 413 ms, total: 4.32 s\n", - "Wall time: 5.54 s\n" + "CPU times: user 4.44 s, sys: 465 ms, total: 4.91 s\n", + "Wall time: 6.28 s\n" ] } ], From a2a2a030167649999322984260476670d17ae13f Mon Sep 17 00:00:00 2001 From: Jeremy Kubica <104161096+jeremykubica@users.noreply.github.com> Date: Thu, 8 Feb 2024 10:28:32 -0500 Subject: [PATCH 27/27] Add some basic checks --- src/kbmod/search/psf.cpp | 7 ++++++- src/kbmod/search/pydocs/psf_docs.h | 18 +++++++++++------- tests/test_psf.py | 8 ++++++++ 3 files changed, 25 insertions(+), 8 deletions(-) diff --git a/src/kbmod/search/psf.cpp b/src/kbmod/search/psf.cpp index 0ec947b8b..fa2735cbb 100644 --- a/src/kbmod/search/psf.cpp +++ b/src/kbmod/search/psf.cpp @@ -9,6 +9,10 @@ PSF::PSF() : kernel(1, 1.0) { } PSF::PSF(float stdev) { + if (stdev <= 0.0) { + throw std::runtime_error("PSF stdev must be > 0.0."); + } + width = stdev; float simple_gauss[MAX_KERNEL_RADIUS]; double psf_coverage = 0.0; @@ -28,7 +32,7 @@ PSF::PSF(float stdev) { i++; } - radius = i - 1; // This value is good for + radius = i - 1; dim = 2 * radius + 1; // Create 2D gaussain by multiplying with itself @@ -155,6 +159,7 @@ static void psf_bindings(py::module& m) { .def(py::init()) .def(py::init>()) .def(py::init()) + .def("__str__", &psf::print) .def("set_array", &psf::set_array, pydocs::DOC_PSF_set_array) .def("get_std", &psf::get_std, pydocs::DOC_PSF_get_std) .def("get_sum", &psf::get_sum, pydocs::DOC_PSF_get_sum) diff --git a/src/kbmod/search/pydocs/psf_docs.h b/src/kbmod/search/pydocs/psf_docs.h index 91ea88399..a58fb07f4 100644 --- a/src/kbmod/search/pydocs/psf_docs.h +++ b/src/kbmod/search/pydocs/psf_docs.h @@ -8,18 +8,22 @@ static const auto DOC_PSF = R"doc( Parameters 
---------- stdev : `float`, optional - Standard deviation of the Gaussian PSF. + Standard deviation of the Gaussian PSF. Must be > 0.0. psf : `PSF`, optional Another PSF object. arr : `numpy.array`, optional A realization of the PSF. - Notes - ----- - When instantiated with another `psf` object, returns its copy. - When instantiated with an array-like object, that array must be - a square matrix and have an odd number of dimensions. Only one - of the arguments is required. + Notes + ----- + When instantiated with another `psf` object, returns its copy. + When instantiated with an array-like object, that array must be + a square matrix and have an odd number of dimensions. Only one + of the arguments is required. + + Raises + ------ + Raises a ``RuntimeError`` when given an invalid stdev. )doc"; static const auto DOC_PSF_set_array = R"doc( diff --git a/tests/test_psf.py b/tests/test_psf.py index f8cecb58e..a7eba0ea9 100644 --- a/tests/test_psf.py +++ b/tests/test_psf.py @@ -19,6 +19,14 @@ def test_make_noop(self): self.assertEqual(len(kernel0), 1) self.assertEqual(kernel0[0], 1.0) + def test_make_invalud(self): + # Raise an error if creating a PSF with a negative stdev. + self.assertRaises(RuntimeError, PSF, -1.0) + + def test_to_string(self): + result = self.psf_list[0].__str__() + self.assertGreater(len(result), 1) + def test_make_and_copy(self): psf1 = PSF(1.0) self.assertEqual(psf1.get_size(), 25)