7 | 7 |
8 | 8 | using namespace taco;
9 | 9 |
10 |    | -// applyBenchSizes is used to configure the benchmarks to run with the
11 |    | -// input arguments.
12 |    | -static void applyBenchSizes(benchmark::internal::Benchmark* b) {
13 |    | -  // Currently considering these size square tensors.
14 |    | -  b->ArgsProduct({{5000, 10000, 20000}});
15 |    | -}
   | 10 | +// The tensor sizes that we want to run each windowing benchmark with.
   | 11 | +std::vector<int64_t> tensorSizes({5000, 10000, 20000});
16 | 12 |
17 | 13 | // WindowConfig corresponds to what sort of window size should be used
18 | 14 | // when evaluating standard windowing benchmarks. This should stay in
@@ -86,32 +82,33 @@ static void bench_add_sparse_window(benchmark::State& state, const Format& f, Wi
86 | 82 | }
87 | 83 |
88 | 84 | #define DECLARE_ADD_SPARSE_WINDOW_BENCH(configName, config) \
89 |    | -  TACO_BENCH_ARGS(bench_add_sparse_window, csr/configName, CSR, config)->Apply(applyBenchSizes); \
90 |    | -  TACO_BENCH_ARGS(bench_add_sparse_window, csc/configName, CSC, config)->Apply(applyBenchSizes);
   | 85 | +  TACO_BENCH_ARGS(bench_add_sparse_window, csr/configName, CSR, config)->ArgsProduct({tensorSizes}); \
   | 86 | +  TACO_BENCH_ARGS(bench_add_sparse_window, csc/configName, CSC, config)->ArgsProduct({tensorSizes});
91 | 87 |
92 | 88 | FOREACH_WINDOW_CONFIG(DECLARE_ADD_SPARSE_WINDOW_BENCH)
93 | 89 |
94 | 90 | static void bench_add_sparse_strided_window(benchmark::State& state, const Format& f) {
95 | 91 |   int dim = state.range(0);
   | 92 | +  int strideWidth = state.range(1);
96 | 93 |   auto sparsity = 0.01;
97 | 94 |   Tensor<double> matrix = loadRandomTensor("A", {dim, dim}, sparsity, f);
98 | 95 |   matrix.pack();
99 | 96 |
100 | 97 |   for (auto _ : state) {
101 | 98 |     // Setup.
102 | 99 |     state.PauseTiming();
103 |     | -    Tensor<double> result("B", {(dim-2)/4, (dim-2)/4}, f);
    | 100 | +    Tensor<double> result("B", {dim/strideWidth, dim/strideWidth}, f);
104 | 101 |     IndexVar i, j;
105 |     | -    result(i, j) = matrix(i(1, dim-1, 4), j(1, dim-1, 4)) + matrix(i(1, dim-1, 4), j(1, dim-1, 4));
    | 102 | +    result(i, j) = matrix(i(0, dim, strideWidth), j(0, dim, strideWidth)) + matrix(i(0, dim, strideWidth), j(0, dim, strideWidth));
106 | 103 |     result.compile();
107 | 104 |     result.assemble();
108 | 105 |     state.ResumeTiming();
109 | 106 |     // The actual computation.
110 | 107 |     result.compute();
111 | 108 |   }
112 | 109 | }
113 |     | -
114 |     | -// Have benchmarking report milliseconds and run for 10 iterations.
115 |     | -// Run an instance with both CSR and CSC formats.
116 |     | -TACO_BENCH_ARG(bench_add_sparse_strided_window, csr, CSR)->Apply(applyBenchSizes);
117 |     | -TACO_BENCH_ARG(bench_add_sparse_strided_window, csc, CSC)->Apply(applyBenchSizes);
    | 110 | +std::vector<int64_t> strides({2, 4, 8});
    | 111 | +TACO_BENCH_ARG(bench_add_sparse_strided_window, csr, CSR)
    | 112 | +    ->ArgsProduct({tensorSizes, strides});
    | 113 | +TACO_BENCH_ARG(bench_add_sparse_strided_window, csc, CSC)
    | 114 | +    ->ArgsProduct({tensorSizes, strides});
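The strided accesses rely on the window syntax of the windowing-enabled taco build these benchmarks target: indexing an IndexVar as i(lo, hi, stride) restricts the access to every stride-th coordinate in [lo, hi), so the result has dim/strideWidth coordinates per mode (exact for these configurations, since 2, 4, and 8 all divide 5000, 10000, and 20000). A hedged, standalone sketch of the same pattern, with an illustrative CSR format and dimensions and an empty source tensor in place of the harness's loadRandomTensor:

#include "taco.h"
using namespace taco;

int main() {
  int dim = 5000;
  int strideWidth = 4;
  Format csr({Dense, Sparse});

  // Source matrix; the benchmark fills this via loadRandomTensor instead.
  Tensor<double> matrix("A", {dim, dim}, csr);
  matrix.pack();

  // One output coordinate per strided position in each mode.
  Tensor<double> result("B", {dim / strideWidth, dim / strideWidth}, csr);

  IndexVar i, j;
  // i(0, dim, strideWidth) windows the access to coordinates 0, strideWidth, 2*strideWidth, ...
  result(i, j) = matrix(i(0, dim, strideWidth), j(0, dim, strideWidth)) +
                 matrix(i(0, dim, strideWidth), j(0, dim, strideWidth));
  result.compile();
  result.assemble();
  result.compute();
  return 0;
}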