Skip to content

Commit

Permalink
[filter] support constexpr linear algebra
Browse files Browse the repository at this point in the history
  • Loading branch information
FrancoisCarouge committed Jul 8, 2023
1 parent 73f6007 commit 0ada127
Show file tree
Hide file tree
Showing 1,057 changed files with 183,018 additions and 21 deletions.
2 changes: 1 addition & 1 deletion benchmark/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -68,7 +68,7 @@ foreach(BENCHMARK "baseline.cpp" "predict_1x1x0.cpp" "predict_1x1x1.cpp"
"--benchmark_out=${NAME}.json")
endforeach()

foreach(BACKEND IN ITEMS "eigen")
foreach(BACKEND IN ITEMS "eigen" "naive")
foreach(STATE_SIZE RANGE 1 2)
foreach(INPUT_SIZE RANGE 1 2)
configure_file(predict_linalg_x1x.cpp
Expand Down
6,011 changes: 6,011 additions & 0 deletions benchmark/image/predict_naive.svg
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
171 changes: 171 additions & 0 deletions benchmark/result/predict_naive_10x1x1.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,171 @@
{
"context": {
"date": "2023-06-14T19:55:36-07:00",
"host_name": "FRANCOIS-DESK",
"executable": "F:/Drive/Projects/cpp/kalman/build/benchmark/Release/kalman_benchmark_predict_naive_10x1x1_driver.exe",
"num_cpus": 8,
"mhz_per_cpu": 4008,
"caches": [
{
"type": "Data",
"level": 1,
"size": 32768,
"num_sharing": 2
},
{
"type": "Instruction",
"level": 1,
"size": 32768,
"num_sharing": 2
},
{
"type": "Unified",
"level": 2,
"size": 262144,
"num_sharing": 2
},
{
"type": "Unified",
"level": 3,
"size": 8388608,
"num_sharing": 8
}
],
"load_avg": [],
"library_build_type": "release"
},
"benchmarks": [
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "iteration",
"repetitions": 3,
"repetition_index": 0,
"threads": 1,
"iterations": 807583,
"real_time": 8.3960633149454566e+02,
"cpu_time": 8.5130568622667886e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "iteration",
"repetitions": 3,
"repetition_index": 1,
"threads": 1,
"iterations": 807583,
"real_time": 8.4394309935585272e+02,
"cpu_time": 8.5130568622667886e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "iteration",
"repetitions": 3,
"repetition_index": 2,
"threads": 1,
"iterations": 807583,
"real_time": 8.4904375154876107e+02,
"cpu_time": 8.9000139923698248e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.4419772746638648e+02,
"cpu_time": 8.6420425723011340e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time_median",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.4394309935585272e+02,
"cpu_time": 8.5130568622667886e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 4.7238597487542968e+00,
"cpu_time": 2.2340980322986454e+01,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 3,
"real_time": 5.5956793000753336e-03,
"cpu_time": 2.5851504590583933e-02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time_min",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "min",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.3960633149454577e+02,
"cpu_time": 8.5130568622667886e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x1/repeats:3/manual_time_max",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x1/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "max",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.4904375154876107e+02,
"cpu_time": 8.9000139923698259e+02,
"time_unit": "ns"
}
]
}
171 changes: 171 additions & 0 deletions benchmark/result/predict_naive_10x1x10.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,171 @@
{
"context": {
"date": "2023-06-14T19:55:57-07:00",
"host_name": "FRANCOIS-DESK",
"executable": "F:/Drive/Projects/cpp/kalman/build/benchmark/Release/kalman_benchmark_predict_naive_10x1x10_driver.exe",
"num_cpus": 8,
"mhz_per_cpu": 4008,
"caches": [
{
"type": "Data",
"level": 1,
"size": 32768,
"num_sharing": 2
},
{
"type": "Instruction",
"level": 1,
"size": 32768,
"num_sharing": 2
},
{
"type": "Unified",
"level": 2,
"size": 262144,
"num_sharing": 2
},
{
"type": "Unified",
"level": 3,
"size": 8388608,
"num_sharing": 8
}
],
"load_avg": [],
"library_build_type": "release"
},
"benchmarks": [
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "iteration",
"repetitions": 3,
"repetition_index": 0,
"threads": 1,
"iterations": 791243,
"real_time": 8.9247235046909111e+02,
"cpu_time": 9.6762309429593688e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "iteration",
"repetitions": 3,
"repetition_index": 1,
"threads": 1,
"iterations": 791243,
"real_time": 8.8162877902591856e+02,
"cpu_time": 9.2812827412059255e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "iteration",
"repetitions": 3,
"repetition_index": 2,
"threads": 1,
"iterations": 791243,
"real_time": 8.8920180020817850e+02,
"cpu_time": 9.6762309429593688e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time_mean",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "mean",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.8776764323439613e+02,
"cpu_time": 9.5445815423748866e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time_median",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "median",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.8920180020817850e+02,
"cpu_time": 9.6762309429593688e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time_stddev",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "stddev",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 5.5622266296561653e+00,
"cpu_time": 2.2802345059834170e+01,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time_cv",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "cv",
"aggregate_unit": "percentage",
"iterations": 3,
"real_time": 6.2654081527361745e-03,
"cpu_time": 2.3890355966470669e-02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time_min",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "min",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.8162877902591856e+02,
"cpu_time": 9.2812827412059266e+02,
"time_unit": "ns"
},
{
"name": "predict_linalg_10x1x10/repeats:3/manual_time_max",
"family_index": 0,
"per_family_instance_index": 0,
"run_name": "predict_linalg_10x1x10/repeats:3/manual_time",
"run_type": "aggregate",
"repetitions": 3,
"threads": 1,
"aggregate_name": "max",
"aggregate_unit": "time",
"iterations": 3,
"real_time": 8.9247235046909100e+02,
"cpu_time": 9.6762309429593688e+02,
"time_unit": "ns"
}
]
}
Loading

0 comments on commit 0ada127

Please sign in to comment.