Skip to content

Commit

Permalink
Update
Browse files (browse the repository at this point in the history)
  • Loading branch information
TeachRaccooon committed Feb 7, 2025
1 parent 036f0cc commit e97393e
Show file tree
Hide file tree
Showing 3 changed files with 19 additions and 15 deletions.
6 changes: 3 additions & 3 deletions benchmark/bench_BQRRP/BQRRP_runtime_breakdown.cc
Original file line number Diff line number Diff line change
Expand Up @@ -120,8 +120,8 @@ int main(int argc, char *argv[]) {
int64_t m = std::stol(size);
int64_t n = std::stol(size);
double d_factor = 1.0;
std::vector<int64_t> b_sz = {25, 50, 125, 250, 500, 1000, 2000, 4000, 8000};
//std::vector<int64_t> b_sz = {32, 64, 128, 256, 512, 1024, 2048, 4096, 8192};
std::vector<int64_t> b_sz = {250, 500, 1000, 2000, 4000, 8000};
//std::vector<int64_t> b_sz = {256, 512, 1024, 2048, 4096, 8192};
auto state = RandBLAS::RNGState<r123::Philox4x32>();
auto state_constant = state;
// Timing results
Expand Down Expand Up @@ -154,7 +154,7 @@ int main(int argc, char *argv[]) {
file.flush();

int i = 0;
for (;i <= b_sz.size(); ++i) {
for (;i < b_sz.size(); ++i) {
call_all_algs(m_info, numruns, b_sz[i], qr_tall, all_data, state_constant, output_filename);
}
}
Expand Down
6 changes: 3 additions & 3 deletions benchmark/bench_BQRRP/BQRRP_speed_comparisons_block_size.cc
Original file line number Diff line number Diff line change
Expand Up @@ -198,8 +198,8 @@ int main(int argc, char *argv[]) {
int64_t m = std::stol(size);
int64_t n = std::stol(size);
double d_factor = 1.0;
std::vector<int64_t> b_sz = {25, 50, 125, 250, 500, 1000, 2000, 4000, 8000};
//std::vector<int64_t> b_sz = {32, 64, 128, 256, 512, 1024, 2048, 4096, 8192};
std::vector<int64_t> b_sz = {250, 500, 1000, 2000, 4000, 8000};
//std::vector<int64_t> b_sz = {256, 512, 1024, 2048, 4096, 8192};
auto state = RandBLAS::RNGState<r123::Philox4x32>();
auto state_constant = state;
// Timing results
Expand Down Expand Up @@ -231,7 +231,7 @@ int main(int argc, char *argv[]) {
file.flush();

int i = 0;
for (;i <= b_sz.size(); ++i) {
for (;i < b_sz.size(); ++i) {
call_all_algs(m_info, numruns, b_sz[i], all_data, state_constant, output_filename);
}
}
Expand Down
22 changes: 13 additions & 9 deletions benchmark/bench_BQRRP/BQRRP_subroutines_speed.cc
Original file line number Diff line number Diff line change
Expand Up @@ -308,7 +308,7 @@ static void call_apply_q(
std::string output_filename) {

auto m = all_data.row;
std::vector<int64_t> nb_gemqrt = {25, 50, 125, 250, 500, 1000, 2000, 4000, 8000};
std::vector<int64_t> nb_gemqrt = {250, 500, 1000, 2000, 4000, 8000};

// timing vars
long dur_ormqr = 0;
Expand All @@ -323,6 +323,10 @@ static void call_apply_q(
for(k = 0; k <= nb_gemqrt.size(); ++k) {
printf("Apply Q iteration %d; n==%d start.\n", i, n);
nb = nb_gemqrt[k];
printf("%d\n", nb);
printf("%d\n", m);
printf("%d\n", m - n);
printf("%d\n", n);
// Performing CholQR
blas::syrk(Layout::ColMajor, Uplo::Upper, Op::Trans, n, m, (T) 1.0, all_data.A.data(), m, (T) 0.0, all_data.R.data(), n);
lapack::potrf(Uplo::Upper, n, all_data.R.data(), n);
Expand Down Expand Up @@ -366,8 +370,8 @@ int main(int argc, char *argv[]) {
int64_t i = 0;
// Declare parameters
int64_t m = std::stol(size);
std::vector<int64_t> n = {25, 50, 125, 250, 500, 1000, 2000, 4000, 8000};
//std::vector<int64_t> b_sz = {32, 64, 128, 256, 512, 1024, 2048, 4096, 8192};
std::vector<int64_t> n = {250, 500, 1000, 2000, 4000, 8000};
//std::vector<int64_t> b_sz = {256, 512, 1024, 2048, 4096, 8192};

int64_t nb_start = 256;
auto state = RandBLAS::RNGState();
Expand Down Expand Up @@ -405,13 +409,13 @@ int main(int argc, char *argv[]) {
"\n";
file.flush();

for (i = n.front(); i <= n.back(); i *= 2)
call_wide_qrcp(m_info, numruns, i, all_data, state, output_filename);
for (i = 0; i <= n.size(); ++i)
call_wide_qrcp(m_info, numruns, n[i], all_data, state, output_filename);

for (i = n.front(); i <= n.back(); i *= 2)
call_tsqr(m_info, numruns, i, nb_start, all_data, state, output_filename);
for (i = 0; i <= n.size(); ++i)
call_tsqr(m_info, numruns, n[i], nb_start, all_data, state, output_filename);

for (i = n.front(); i <= n.back(); i *= 2)
call_apply_q(m_info, numruns, i, nb_start, all_data, state, state_B, output_filename);
for (i = 0; i <= n.size(); ++i)
call_apply_q(m_info, numruns, n[i], nb_start, all_data, state, state_B, output_filename);
}
#endif

0 comments on commit e97393e

Please sign in to comment.