Skip to content

Commit

Permalink
cuda docs
Browse files Browse the repository at this point in the history
  • Loading branch information
sronilsson committed Sep 1, 2024
1 parent f8e41e2 commit 92e94ba
Show file tree
Hide file tree
Showing 28 changed files with 536 additions and 74 deletions.
7 changes: 7 additions & 0 deletions docs/conf.py
Original file line number Diff line number Diff line change
Expand Up @@ -22,14 +22,21 @@
extensions = ['sphinx.ext.napoleon',
'sphinx.ext.imgmath',
'sphinx.ext.mathjax',
'sphinx-mathjax-offline',
'sphinx.ext.autodoc',
'sphinx.ext.todo',
'sphinx.ext.viewcode',
'sphinxemoji.sphinxemoji',
#'sphinx_autodoc_typehints',
'sphinx_togglebutton',
'nbsphinx',
'sphinx.ext.intersphinx',
'sphinxcontrib.video']

#mathjax_path = "https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.7/MathJax.js?config=TeX-AMS-MML_HTMLorMML"



intersphinx_mapping = {
'python': ('https://docs.python.org/3', None),
}
Expand Down
1 change: 1 addition & 0 deletions docs/tables/.~lock.direction_two_bps.csv#
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
,simon,simon-Inspiron-15-3520,31.08.2024 19:05,file:///home/simon/.config/libreoffice/4;
1 change: 1 addition & 0 deletions docs/tables/.~lock.is_inside_rectangle.csv#
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
,simon,simon-Inspiron-15-3520,31.08.2024 19:02,file:///home/simon/.config/libreoffice/4;
9 changes: 9 additions & 0 deletions docs/tables/count_values_in_ranges.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
FRAMES (MILLIONS),TIME (S)
4,0.038
8,0.201
16,0.344
32,0.306
64,0.776
128,1.611
NVIDIA GeForce RTX 4070,
"(n, 11)",
10 changes: 10 additions & 0 deletions docs/tables/cuda_shap.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
FRAMES (THOUSANDS),TIME (S)
1,1.295
10,4.401
20,8.627
40,15.280
80,30.759
160,65.575
240,87.468
NVIDIA GeForce RTX 4070,
"RF: 100 estimators, 501 features",
10 changes: 10 additions & 0 deletions docs/tables/direction_two_bps.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
FRAMES (MILLIONS),CUDA JIT GPU (S)
2,0.0285
4,0.0404
8,0.069
16,0.1352
32,0.2711
64,0.5586
128,0.8525
256,1.6652
512,4.1223
8 changes: 8 additions & 0 deletions docs/tables/get_3pt_angle.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
FRAMES,TIME (S)
**4 million**,0.020
**8 million**,0.040
**16 million**,0.159
**32 million**,0.290
**64 million**,0.335
**128 million**,0.792
**256 million**,1.371
13 changes: 13 additions & 0 deletions docs/tables/get_euclidean_distance_cuda.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
OBSERVATION,TIME (S)
**110k**,0.007
**181k**,0.021
**327k**,0.032
**620k**,0.02
**1.2m**,0.082
**2.4m**,0.046
**4.7m**,0.106
**9.3m**,0.209
**18.6m**,0.238
**37.2m**,0.926
**74.5m**,1.136
**149m**,2.046
23 changes: 23 additions & 0 deletions docs/tables/img_stack_to_grayscale_cuda.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
FRAMES (k),GPU (s),STDEV (s)
1,0.16022,0.125786
2,0.14428,0.003726
3,0.19769,0.005645
4,0.2571,0.006002
5,0.33574,0.017868
6,0.39921,0.026858
7,0.45734,0.0333
8,0.53216,0.015075
9,0.50257,0.023186
10,0.54235,0.090055
11,0.69896,0.00999
12,0.57932,0.0010399
13,0.63791,0.017
14,0.99677,0.1073426
15,1.56103,0.5308574
16,1.08143,0.082
17,1.39189,0.3308389
18,1.23648,0.1386822
19,1.39554,0.161
20,1.962,0.576
NVIDIA GeForce RTX 4070,,
REPEATS= 3,,
12 changes: 12 additions & 0 deletions docs/tables/img_stack_to_grayscale_cupy.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
FRAMES (THOUSANDS),GPU (s)
0.5,0.3419
1,0.52333
1.5,0.81614
2,1.0632
2.5,1.32399
3,1.61488
3.5,1.87857
4,2.30137
4.5,2.54736
5,2.90824
5.5,3.09271
11 changes: 11 additions & 0 deletions docs/tables/is_inside_circle.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
FRAMES (MILLIONS),CUDA JIT GPU (S)
2,0.006
4,0.007
8,0.016
16,0.028
32,0.054
64,0.114
128,0.319
256,0.44
512,1.085
1000,2.966
11 changes: 11 additions & 0 deletions docs/tables/is_inside_polygon.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
FRAMES (MILLIONS),CUDA JIT GPU (S),NUMBA CPU TIME (S)
2,0.002,0.038
4,0.004,0.082
8,0.006,0.170
16,0.009,0.295
32,0.021,0.823
64,0.041,1.395
128,0.101,2.688
256,0.369,4.640
512,0.614,10.940
1000,1.293,19.947
23 changes: 11 additions & 12 deletions docs/tables/is_inside_rectangle.csv
Original file line number Diff line number Diff line change
@@ -1,12 +1,11 @@
FRAMES (MILLION),CUDA JIT GPU (S),NUMBA CPU TIME (S)
**2 million**,0.005,0.022
**4 million**,0.009,0.031
**8 million**,0.016,0.097
**16 million**,0.028,0.199
**32 million**,0.054,0.399
**64 million**,0.111,0.769
**128 million**,0.33,1.3
**256 million**,0.666,2.531
**512 million**,1.161,7.273
**1 billion**,3.828,13.342
NVIDIA GeForce RTX 4070,,
FRAMES (MILLIONS),CUDA JIT GPU (S),NUMBA CPU TIME (S)
2,0.005,0.022
4,0.009,0.031
8,0.016,0.097
16,0.028,0.199
32,0.054,0.399
64,0.111,0.769
128,0.33,1.300
256,0.666,2.531
512,1.161,7.273
1000,3.828,13.342
14 changes: 14 additions & 0 deletions docs/tables/sliding_circular_hotspots.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
FRAMES (MILLIONS),GPU (s),GPU (STDEV)
2,0.0219,0
4,0.0387,0.002
8,0.0809,0.015
16,0.1304,0.008
32,0.3135,0.043
64,0.593,0.054
128,1.2028,0.156
256,2.3236,0.101
512,4.9477,0.538
1024,10.266,1.351
NVIDIA GeForce RTX 4070,,
BATCH_SIZE: 3e+7,,
REPEATS 5,,
12 changes: 12 additions & 0 deletions docs/tables/sliding_circular_mean.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
FRAMES (MILLIONS),GPU (s),GPU (STDEV)
1,0.0755,0.07201
2,0.03908,0.00131
4,0.0726,0.00205
8,0.13196,0.00872
16,0.26056,0.01587
32,0.60962,0.07974
64,1.01012,0.02032
128,2.05793,0.15376
256,4.08802,0.14152
512,14.67234,3.66222
1000,27.43026,3.35774
14 changes: 14 additions & 0 deletions docs/tables/sliding_circular_range.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
FRAMES (MILLIONS),GPU (s),GPU (STDEV)
2,0.055,0.199
4,0.115,0.005
8,0.239,0.003
16,0.398,0.023
32,0.768,0.012
64,1.596,0.04
128,3.118,0.131
256,6.84703,0.73121
512,12.36,0.122
1024,25.17,0.075
NVIDIA GeForce RTX 4070,,
BATCH_SIZE: 3e+7,,
REPEATS 5,,
14 changes: 14 additions & 0 deletions docs/tables/sliding_circular_std.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
FRAMES (MILLIONS),GPU (s),GPU (STDEV)
2,0.027,0.0009
4,0.048,0.0028
8,0.117,0.0199
16,0.163,0.0052
32,0.362,0.0571
64,0.653,0.0134
128,1.439,0.1888
256,2.836,0.1929
512,6.107,0.232
1024,22.893,5.933
NVIDIA GeForce RTX 4070,,
BATCH_SIZE: 3e+7,,
REPEATS 5,,
12 changes: 12 additions & 0 deletions docs/tables/sliding_mean.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
FRAMES (MILLIONS),TIME (S)
2,0.005
4,0.025
8,0.015
16,0.028
32,0.059
64,0.182
128,0.237
256,0.507
512,1.022
NVIDIA GeForce RTX 4070,
time window = 1s / 10 FPS,
12 changes: 12 additions & 0 deletions docs/tables/sliding_min.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
FRAMES (MILLIONS),TIME (S)
2,0.003
4,0.016
8,0.012
16,0.049
32,0.053
64,0.099
128,0.211
256,0.495
512,1.031
NVIDIA GeForce RTX 4070,
time window = 1s / 10 FPS,
14 changes: 14 additions & 0 deletions docs/tables/sliding_rayleigh_z.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
FRAMES (MILLIONS),GPU (s),GPU (STDEV)
2,0.02531,0.00328
4,0.04003,0.00533
8,0.07184,0.01016
16,0.12379,0.01608
32,0.2542,0.03084
64,0.52848,0.05978
128,1.05474,0.16997
256,1.93246,0.07944
512,4.45524,0.07773
1000,8.46498,0.33432
NVIDIA GeForce RTX 4070,,
BATCH_SIZE: 3e+7,,
REPEATS 5,,
14 changes: 14 additions & 0 deletions docs/tables/sliding_resultant_vector_length.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
FRAMES (MILLIONS),GPU (s),GPU (STDEV)
2,0.04253,0.002
4,0.06979,0
8,0.14922,0.015
16,0.34029,0.062
32,0.48812,0.012
64,1.0269,0.059
128,2.16228,0.156
256,4.15671,0.027
512,11.4188,2.501
1000,28.76021,2.59123
NVIDIA GeForce RTX 4070,,
BATCH_SIZE: 3e+7,,
REPEATS 5,,
Loading

0 comments on commit 92e94ba

Please sign in to comment.