-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbenchmark_ryzen_nvidia.txt
80 lines (79 loc) · 6.25 KB
/
benchmark_ryzen_nvidia.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
TensorStream::Evaluator::OpenclEvaluator
TensorStream::Evaluator::RubyEvaluator
model name : AMD Ryzen 3 1300X Quad-Core Processor
OpenCL device NVIDIA CUDA GeForce GTX 1060 6GB
Rehearsal ------------------------------------------------------------------------
pure ruby argmin : 0.708414 0.007882 0.716296 ( 0.717201)
opencl argmin : 0.204186 0.222389 0.426575 ( 0.447862)
pure ruby bias_add_grad : 2.048097 0.005187 2.053284 ( 2.057617)
opencl bias_add_grad : 0.012482 0.000426 0.012908 ( 0.013225)
pure ruby bias_add : 2.406516 0.000087 2.406603 ( 2.406307)
opencl bias_add : 0.136466 0.008025 0.144491 ( 0.134989)
pure ruby conv2d_backprop : 3.685220 0.000155 3.685375 ( 3.685049)
opencl conv2d_backprop : 0.028940 0.008031 0.036971 ( 0.029904)
pure ruby conv2d : 0.788991 0.000041 0.789032 ( 0.788881)
opencl conv2d : 0.020150 0.000138 0.020288 ( 0.016917)
pure ruby arr index : 0.003036 0.000000 0.003036 ( 0.003044)
opencl arr index : 0.009626 0.000023 0.009649 ( 0.006703)
pure ruby min : 3.767836 0.007871 3.775707 ( 3.773523)
opencl min : 0.141541 0.008039 0.149580 ( 0.139246)
pure ruby sum : 3.219801 0.000076 3.219877 ( 3.218388)
opencl sum : 0.007480 0.004074 0.011554 ( 0.008261)
pure ruby sum axis 1 : 3.203423 0.000000 3.203423 ( 3.201832)
opencl sum axis 1 : 0.011710 0.000033 0.011743 ( 0.008379)
pure ruby split : 0.016504 0.000008 0.016512 ( 0.016529)
opencl split : 0.041059 0.012026 0.053085 ( 0.043289)
pure ruby add_n : 0.141810 0.000000 0.141810 ( 0.141721)
opencl add_n : 0.013751 0.000000 0.013751 ( 0.012208)
pure ruby ooo matmul : 1.395286 0.000000 1.395286 ( 1.394697)
opencl ooo matmul : 0.013448 0.000000 0.013448 ( 0.009873)
pure ruby softmax : 0.025362 0.000018 0.025380 ( 0.025382)
opencl softmax : 0.014999 0.000051 0.015050 ( 0.011977)
pure ruby matmul : 0.666863 0.000000 0.666863 ( 0.666499)
opencl matmul : 0.008572 0.003920 0.012492 ( 0.009246)
pure ruby : 2.429792 0.000005 2.429797 ( 2.428788)
opencl : 0.140862 0.004014 0.144876 ( 0.137264)
pure ruby single function: 0.340247 0.000000 0.340247 ( 0.340184)
opencl singlefunction: 0.084871 0.007956 0.092827 ( 0.087899)
pure ruby pow float: 0.083372 0.000000 0.083372 ( 0.083339)
opencl pow float: 0.013498 0.000014 0.013512 ( 0.010353)
pure ruby pow int: 0.018739 0.000000 0.018739 ( 0.018753)
opencl pow int: 0.007737 0.004041 0.011778 ( 0.008817)
-------------------------------------------------------------- total: 26.165217sec
user system total real
pure ruby argmin : 0.677097 0.000009 0.677106 ( 0.676828)
opencl argmin : 0.005919 0.003950 0.009869 ( 0.006618)
pure ruby bias_add_grad : 2.027326 0.000000 2.027326 ( 2.026399)
opencl bias_add_grad : 0.011544 0.000050 0.011594 ( 0.008380)
pure ruby bias_add : 2.378283 0.000000 2.378283 ( 2.377411)
opencl bias_add : 0.130993 0.011994 0.142987 ( 0.132772)
pure ruby conv2d_backprop : 3.738167 0.000000 3.738167 ( 3.737946)
opencl conv2d_backprop : 0.031267 0.003958 0.035225 ( 0.030381)
pure ruby conv2d : 0.794182 0.000000 0.794182 ( 0.794100)
opencl conv2d : 0.015865 0.004020 0.019885 ( 0.016878)
pure ruby arr index : 0.003112 0.000000 0.003112 ( 0.003109)
opencl arr index : 0.012100 0.000000 0.012100 ( 0.009728)
pure ruby min : 3.669509 0.003944 3.673453 ( 3.671906)
opencl min : 0.137071 0.004055 0.141126 ( 0.131802)
pure ruby sum : 3.210619 0.000000 3.210619 ( 3.210064)
opencl sum : 0.002431 0.008030 0.010461 ( 0.007522)
pure ruby sum axis 1 : 3.208789 0.000000 3.208789 ( 3.208125)
opencl sum axis 1 : 0.006075 0.003963 0.010038 ( 0.007679)
pure ruby split : 0.013985 0.000000 0.013985 ( 0.013990)
opencl split : 0.029464 0.011999 0.041463 ( 0.030797)
pure ruby add_n : 0.140984 0.000003 0.140987 ( 0.140959)
opencl add_n : 0.003146 0.007934 0.011080 ( 0.007778)
pure ruby ooo matmul : 1.416585 0.000000 1.416585 ( 1.416290)
opencl ooo matmul : 0.011156 0.000000 0.011156 ( 0.008723)
pure ruby softmax : 0.024724 0.000000 0.024724 ( 0.024731)
opencl softmax : 0.006237 0.003945 0.010182 ( 0.009005)
pure ruby matmul : 0.679538 0.000000 0.679538 ( 0.680048)
opencl matmul : 0.003456 0.007965 0.011421 ( 0.008568)
pure ruby : 2.437790 0.004031 2.441821 ( 2.443126)
opencl : 0.133039 0.003996 0.137035 ( 0.130579)
pure ruby single function: 0.332269 0.004003 0.336272 ( 0.336201)
opencl singlefunction: 0.078607 0.004009 0.082616 ( 0.078640)
pure ruby pow float: 0.081409 0.000000 0.081409 ( 0.081364)
opencl pow float: 0.011501 0.000000 0.011501 ( 0.008471)
pure ruby pow int: 0.016687 0.000000 0.016687 ( 0.016711)
opencl pow int: 0.007061 0.003950 0.011011 ( 0.007819)