Benchmark (ONNX) for Addition#

The experiment compares the execution time between numpy and onnxruntime for a series (or cascade) of additions.

$y = (((X + M_1) + M_2) + ...) + M_k$

k is the number of nodes; the corresponding ONNX graphs for k=2 and k=4 are cascades of Add operators. Both onnxruntime and numpy use BLAS functions.

k=2	k=4

Overview #

(Source code, png, hires.png, pdf)

Configuration #

<<<

# Loads the machine/package configuration CSV of the benchmark and prints it
# as an RST table.
from pyquickhelper.pandashelper import df2rst
import pandas
# NOTE(review): `os` and `__WD__` are not defined in this snippet; presumably
# both are injected by the documentation runner -- confirm.
name = os.path.join(
    __WD__, "../../onnx/results/bench_plot_onnxruntime_casc_add.time.csv")
df = pandas.read_csv(name)
# number_format=4 is forwarded to df2rst to control how numbers are rendered.
print(df2rst(df, number_format=4))

>>>

name	version	value
date	2019-12-11
python		3.7.2 (default, Mar 1 2019, 18:34:21) [GCC 6.3.0 20170516]
platform		linux
OS		Linux-4.9.0-8-amd64-x86_64-with-debian-9.6
machine		x86_64
processor
release		4.9.0-8-amd64
architecture		(‘64bit’, ‘’)
mlprodict	not-imported
numpy	1.17.4	openblas, language=c
onnx	1.6.34	opset=12
onnxruntime	1.1.992	CPU-MKL-ML
pandas	0.25.3
skl2onnx	1.6.992
sklearn	0.22

Raw results #

bench_plot_onnxruntime_casc_add.csv

<<<

# Loads the raw benchmark measurements, pivots them so each library gets its
# own column, and prints the result as an RST table.
from pyquickhelper.pandashelper import df2rst
from pymlbenchmark.benchmark.bench_helper import bench_pivot
import pandas
# NOTE(review): `os` and `__WD__` are not defined in this snippet; presumably
# both are injected by the documentation runner -- confirm.
name = os.path.join(
    __WD__, "../../onnx/results/bench_plot_onnxruntime_casc_add.perf.csv")
df = pandas.read_csv(name)
piv = bench_pivot(df).reset_index(drop=False)
# Ratio of the numpy column over the onnxruntime column; presumably both hold
# execution times, in which case a value above 1 means onnxruntime is faster.
piv['speedup'] = piv['npy'] / piv['ort']
print(df2rst(piv, number_format=4))

N	dim	nbnode	number	count	npy	ort	speedup
1	1	1	10	20	4.147e-05	0.0001363	0.3042
1	1	2	10	20	6.292e-05	0.0001547	0.4067
1	1	3	10	20	8.279e-05	0.0001573	0.5264
1	1	5	10	20	0.0001188	0.0001733	0.6855
1	1	10	10	20	0.0002147	0.0002089	1.028
1	1	50	10	20	0.0009485	0.0005034	1.884
1	1	100	10	20	0.001855	0.0009153	2.027
1	1	150	10	20	0.002796	0.001228	2.278
1	1	200	10	20	0.003694	0.00168	2.2
1	1	250	10	20	0.004646	0.002086	2.228
1	1	300	10	20	0.005511	0.002449	2.25
1	10	1	10	20	3.124e-05	0.0001417	0.2204
1	10	2	10	20	4.595e-05	0.0001744	0.2634
1	10	3	10	20	5.122e-05	0.0001645	0.3114
1	10	5	10	20	7.151e-05	0.0001827	0.3913
1	10	10	10	20	0.0001242	0.0002133	0.5822
1	10	50	10	20	0.0005177	0.0005033	1.028
1	10	100	10	20	0.0009871	0.000856	1.153
1	10	150	10	20	0.001489	0.001216	1.224
1	10	200	10	20	0.001972	0.00164	1.202
1	10	250	10	20	0.002446	0.001993	1.227
1	10	300	10	20	0.002918	0.002464	1.184
1	100	1	10	20	2.992e-05	0.0001435	0.2084
1	100	2	10	20	4.123e-05	0.0004185	0.09853
1	100	3	10	20	5.212e-05	0.0004394	0.1186
1	100	5	10	20	7.084e-05	0.0004691	0.151
1	100	10	10	20	0.0001248	0.000509	0.2452
1	100	50	10	20	0.0005238	0.0008076	0.6486
1	100	100	10	20	0.001025	0.001165	0.8798
1	100	150	10	20	0.001518	0.001575	0.9641
1	100	200	10	20	0.001996	0.001885	1.059
1	100	250	10	20	0.002472	0.002312	1.069
1	100	300	10	20	0.002998	0.002587	1.159
10	1	1	10	20	2.947e-05	0.0001359	0.2169
10	1	2	10	20	4.099e-05	0.0001511	0.2713
10	1	3	10	20	5.089e-05	0.0001561	0.3261
10	1	5	10	20	7.147e-05	0.0001696	0.4215
10	1	10	10	20	0.0001199	0.0002098	0.5714
10	1	50	10	20	0.0005125	0.0004969	1.031
10	1	100	10	20	0.0009885	0.0008379	1.18
10	1	150	10	20	0.001487	0.001209	1.231
10	1	200	10	20	0.001941	0.001555	1.248
10	1	250	10	20	0.002487	0.00192	1.296
10	1	300	10	20	0.002963	0.002255	1.314
10	10	1	10	20	3.435e-05	0.0001397	0.2458
10	10	2	10	20	5.228e-05	0.0001735	0.3014
10	10	3	10	20	6.115e-05	0.0001656	0.3692
10	10	5	10	20	8.779e-05	0.0001821	0.4821
10	10	10	10	20	0.0001551	0.0002321	0.6683
10	10	50	10	20	0.000668	0.0005767	1.158
10	10	100	10	20	0.001284	0.001007	1.276
10	10	150	10	20	0.00195	0.001441	1.353
10	10	200	10	20	0.00255	0.001859	1.372
10	10	250	10	20	0.003203	0.002327	1.377
10	10	300	10	20	0.003765	0.002727	1.381
10	100	1	10	20	4.008e-05	0.0001518	0.264
10	100	2	10	20	5.729e-05	0.000176	0.3256
10	100	3	10	20	7.325e-05	0.0001826	0.4011
10	100	5	10	20	0.0001061	0.0002073	0.512
10	100	10	10	20	0.000184	0.0002609	0.7055
10	100	50	10	20	0.0008139	0.0006695	1.216
10	100	100	10	20	0.001605	0.0013	1.234
10	100	150	10	20	0.002369	0.001798	1.318
10	100	200	10	20	0.003145	0.002338	1.345
10	100	250	10	20	0.003959	0.002894	1.368
10	100	300	10	20	0.004714	0.00343	1.374
100	1	1	10	20	3.038e-05	0.0001362	0.2231
100	1	2	10	20	4.26e-05	0.0001495	0.2849
100	1	3	10	20	5.146e-05	0.0001541	0.3339
100	1	5	10	20	7.257e-05	0.0001727	0.4201
100	1	10	10	20	0.0001222	0.0002046	0.5969
100	1	50	10	20	0.0005173	0.0004977	1.039
100	1	100	10	20	0.001013	0.0008521	1.189
100	1	150	10	20	0.001517	0.001212	1.251
100	1	200	10	20	0.002023	0.001575	1.285
100	1	250	10	20	0.002505	0.001952	1.283
100	1	300	10	20	0.002993	0.002291	1.306
100	10	1	10	20	4.055e-05	0.0001685	0.2406
100	10	2	10	20	6.169e-05	0.0002092	0.2949
100	10	3	10	20	7.448e-05	0.0002225	0.3348
100	10	5	10	20	0.0001069	0.0002676	0.3996
100	10	10	10	20	0.0001856	0.0003897	0.4764
100	10	50	10	20	0.0008158	0.001314	0.6208
100	10	100	10	20	0.001606	0.002503	0.6416
100	10	150	10	20	0.0024	0.003648	0.658
100	10	200	10	20	0.00317	0.004841	0.6548
100	10	250	10	20	0.003969	0.006026	0.6586
100	10	300	10	20	0.004744	0.00716	0.6626
100	100	1	10	20	7.942e-05	0.0002163	0.3672
100	100	2	10	20	0.0001154	0.0002698	0.4279
100	100	3	10	20	0.0001499	0.0003108	0.4823
100	100	5	10	20	0.0002161	0.0003925	0.5507
100	100	10	10	20	0.000381	0.0005844	0.6519
100	100	50	10	20	0.001693	0.002141	0.7907
100	100	100	10	20	0.003337	0.00399	0.8363
100	100	150	10	20	0.004959	0.00587	0.8448
100	100	200	10	20	0.006533	0.00774	0.844
100	100	250	10	20	0.008242	0.009614	0.8573
100	100	300	10	20	0.009794	0.01147	0.8542
1000	1	1	10	20	4.058e-05	0.0001506	0.2695
1000	1	2	10	20	5.153e-05	0.0001691	0.3048
1000	1	3	10	20	6.485e-05	0.0001737	0.3735
1000	1	5	10	20	9.152e-05	0.000196	0.467
1000	1	10	10	20	0.0001578	0.0002426	0.6506
1000	1	50	10	20	0.0006785	0.0006101	1.112
1000	1	100	10	20	0.001335	0.001064	1.256
1000	1	150	10	20	0.001985	0.001531	1.296
1000	1	200	10	20	0.002627	0.002005	1.31
1000	1	250	10	20	0.003282	0.002463	1.332
1000	1	300	10	20	0.003878	0.002918	1.329
1000	10	1	10	20	8.004e-05	0.0003437	0.2329
1000	10	2	10	20	0.0001194	0.0005427	0.2201
1000	10	3	10	20	0.0001479	0.0006981	0.2119
1000	10	5	10	20	0.0002175	0.00103	0.2111
1000	10	10	10	20	0.0003841	0.001847	0.208
1000	10	50	10	20	0.001692	0.008476	0.1996
1000	10	100	10	20	0.003306	0.01663	0.1988
1000	10	150	10	20	0.004956	0.02487	0.1993
1000	10	200	10	20	0.006497	0.0333	0.1951
1000	10	250	10	20	0.008223	0.04162	0.1976
1000	10	300	10	20	0.009726	0.04966	0.1959
1000	100	1	10	20	0.0005626	0.0007685	0.7321
1000	100	2	10	20	0.0008669	0.001115	0.7774
1000	100	3	10	20	0.001166	0.00149	0.7821
1000	100	5	10	20	0.001748	0.002174	0.804
1000	100	10	10	20	0.003241	0.003907	0.8295
1000	100	50	10	20	0.01502	0.01777	0.8453
1000	100	100	10	20	0.02949	0.03525	0.8368
1000	100	150	10	20	0.04391	0.0527	0.8332
1000	100	200	10	20	0.05849	0.06993	0.8365
1000	100	250	10	20	0.07272	0.08716	0.8343
1000	100	300	10	20	0.08726	0.1042	0.8376
10000	1	1	10	20	8.915e-05	0.0002148	0.4151
10000	1	2	10	20	0.000109	0.0002512	0.4341
10000	1	3	10	20	0.0001388	0.0002798	0.4961
10000	1	5	10	20	0.0002035	0.0003375	0.603
10000	1	10	10	20	0.000351	0.0004659	0.7534
10000	1	50	10	20	0.00153	0.00144	1.062
10000	1	100	10	20	0.003026	0.002611	1.159
10000	1	150	10	20	0.004499	0.003792	1.186
10000	1	200	10	20	0.005992	0.004982	1.203
10000	1	250	10	20	0.007515	0.006115	1.229
10000	1	300	10	20	0.008884	0.007331	1.212
10000	10	1	10	20	0.0006901	0.002107	0.3275
10000	10	2	10	20	0.0008889	0.003729	0.2384
10000	10	3	10	20	0.001185	0.005217	0.2272
10000	10	5	10	20	0.001813	0.008549	0.2121
10000	10	10	10	20	0.003208	0.01631	0.1967
10000	10	50	10	20	0.01493	0.07975	0.1872
10000	10	100	10	20	0.02959	0.1592	0.1859
10000	10	150	10	20	0.04401	0.238	0.1849
10000	10	200	10	20	0.05858	0.3181	0.1841
10000	10	250	10	20	0.07333	0.3959	0.1852
10000	10	300	10	20	0.08809	0.474	0.1858
10000	100	1	10	20	0.009114	0.008093	1.126
10000	100	2	10	20	0.01288	0.01466	0.8787
10000	100	3	10	20	0.01651	0.02192	0.7534
10000	100	5	10	20	0.02369	0.03054	0.7757
10000	100	10	10	20	0.04295	0.04799	0.8949
10000	100	50	10	20	0.1841	0.1989	0.9257
10000	100	100	10	20	0.3722	0.3907	0.9527
10000	100	150	10	20	0.5542	0.5807	0.9542
10000	100	200	10	20	0.7299	0.7707	0.9472
10000	100	250	10	20	0.9327	0.964	0.9676
10000	100	300	10	20	1.053	1.173	0.8975

Benchmark code #

bench_plot_onnxruntime_casc_add.py

# coding: utf-8
"""
Benchmark of :epkg:`onnxruntime` for a cascade of additions.
"""
# Authors: Xavier Dupré (benchmark)
# License: MIT
import matplotlib
matplotlib.use('Agg')

import os
import unittest
import warnings
import contextlib
from time import perf_counter as time
from io import StringIO
import numpy
import pandas
import matplotlib.pyplot as plt
import sklearn
from sklearn.utils._testing import ignore_warnings
from sklearn.utils.extmath import softmax
from pyquickhelper.loghelper import run_cmd, sys_path_append
from pymlbenchmark.benchmark import BenchPerfTest, BenchPerf
from pymlbenchmark.context import machine_information
from pymlbenchmark.datasets.artificial import random_binary_classification
from pymlbenchmark.plotting import plot_bench_results
from skl2onnx.common.data_types import FloatTensorType
from skl2onnx.algebra.onnx_ops import OnnxAdd
from onnxruntime import InferenceSession
from mlprodict import __max_supported_opset__, get_ir_version

################################
# Benchmark
# +++++++++


def generate_onnx_graph(dim, nbnode, input_name='X1'):
    """
    Builds an ONNX graph chaining *Add* nodes one after the other.

    :param dim: number of columns of the input, the output and every
        added constant
    :param nbnode: requested number of *Add* nodes; the last node is
        always created, so at least one node is produced
    :param input_name: name of the graph input
    :return: tuple ``(onnx model, list of added constants)``, the
        constants being listed in the order they are added
    """
    opset = __max_supported_opset__

    def draw_constant():
        # First item returned by random_binary_classification for one
        # sample of *dim* features, converted to float32.
        return random_binary_classification(1, dim)[0].astype(numpy.float32)

    matrices = []
    current = input_name

    # All nodes but the last one: each one consumes the previous result.
    for _ in range(nbnode - 1):
        constant = draw_constant()
        matrices.append(constant)
        current = OnnxAdd(current, constant, op_version=opset)

    # The last node is the only one with a named output ('Y').
    constant = draw_constant()
    matrices.append(constant)
    last = OnnxAdd(current, constant, output_names=['Y'], op_version=opset)

    inputs = [(input_name, FloatTensorType((None, dim)))]
    outputs = [('Y', FloatTensorType((None, dim)))]
    onx = last.to_onnx(inputs, outputs=outputs)
    onx.ir_version = get_ir_version(opset)
    return onx, matrices


class GraphORtBenchPerfTest(BenchPerfTest):
    """
    Benchmark case comparing :epkg:`onnxruntime` and :epkg:`numpy`
    on a cascade of additions.

    The constructor builds the ONNX graph with *generate_onnx_graph*,
    keeps the list of added constants and loads the serialized graph
    into an *InferenceSession*.

    :param dim: number of columns, forwarded to *generate_onnx_graph*
    :param nbnode: number of *Add* nodes, forwarded to
        *generate_onnx_graph*
    """

    def __init__(self, dim=4, nbnode=3):
        BenchPerfTest.__init__(self)
        self.input_name = 'X1'
        self.nbnode = nbnode
        self.onx, self.matrices = generate_onnx_graph(dim,
                                                      nbnode, self.input_name)
        as_string = self.onx.SerializeToString()
        self.ort = InferenceSession(as_string)

    def fcts(self, **kwargs):
        """
        Returns the functions to benchmark.

        :return: list of dictionaries with keys ``'lib'`` (``'ort'`` or
            ``'npy'``) and ``'fct'`` (a callable taking the input *X*)
        """
        input_name = self.input_name

        def predict_ort(X, model=self.ort):
            # Runs the whole cascade in a single onnxruntime call.
            return model.run(None, {input_name: X})[0]

        def predict_npy(X, model=self.matrices):
            # Works on a copy so the caller's array is left untouched.
            res = X.copy()
            for mat in model:
                # Adds the same constants as the ONNX graph (the original
                # code added X itself, which computed a different result).
                # assumes every constant broadcasts against X -- TODO confirm
                res += mat
            return res

        return [{'lib': 'ort', 'fct': predict_ort},
                {'lib': 'npy', 'fct': predict_npy}]

    def data(self, N=10, dim=4, **kwargs):  # pylint: disable=W0221
        """
        Generates the input of the benchmarked functions.

        :param N: forwarded to *random_binary_classification*
        :param dim: forwarded to *random_binary_classification*
        :return: tuple holding the first item returned by
            *random_binary_classification*, converted to float32
        """
        return tuple(o.astype(numpy.float32)
                     for o in random_binary_classification(N, dim)[:1])


@ignore_warnings(category=FutureWarning)
def run_bench(repeat=20, number=10, verbose=False):
    """
    Runs the benchmark over the grid of dimensions, number of nodes
    and number of rows.

    :param repeat: forwarded to ``BenchPerf.enumerate_run_benchs``
    :param number: forwarded to ``BenchPerf.enumerate_run_benchs``
    :param verbose: forwarded to ``BenchPerf.enumerate_run_benchs``
    :return: :epkg:`pandas` DataFrame built from the enumerated results
    """

    def make_test(dim=None, **opts):
        # Factory handed to BenchPerf to create one benchmark case.
        return GraphORtBenchPerfTest(dim=dim, **opts)

    # Parameters given to BenchPerf as its first grid.
    grid_before = {
        'dim': [1, 10, 100],
        'nbnode': [1, 2, 3, 5, 10, 50, 100, 150, 200, 250, 300],
    }
    # Parameters given to BenchPerf as its second grid.
    grid_after = {'N': [1, 10, 100, 1000, 10000]}

    bench = BenchPerf(grid_before, grid_after, make_test)

    with sklearn.config_context(assume_finite=True):
        begin = time()
        rows = list(bench.enumerate_run_benchs(
            repeat=repeat, verbose=verbose,
            number=number, stop_if_error=False))
        finish = time()

    results_df = pandas.DataFrame(rows)
    print("Total time = %0.3f sec\n" % (finish - begin))
    return results_df

#########################
# Runs the benchmark
# ++++++++++++++++++


# Base name of this script without its extension; it prefixes every file
# written below.
filename = os.path.splitext(os.path.basename(__file__))[0]

# Runs the whole benchmark and stores the raw measurements.
df = run_bench(verbose=True)
df.to_csv("%s.perf.csv" % filename, index=False)
print(df.head())

#########################
# Extracts information about the machine used
# +++++++++++++++++++++++++++++++++++++++++++

# Packages handed to machine_information.
pkgs = [
    'numpy', 'pandas', 'sklearn', 'skl2onnx',
    'onnxruntime', 'onnx', 'mlprodict',
]
dfi = pandas.DataFrame(machine_information(pkgs))
dfi.to_csv("%s.time.csv" % filename, index=False)
print(dfi)


#############################
# Plot the results by number of nodes
# +++++++++++++++++++++++++++++++++++

def label_fct(la):
    """
    Shortens a label by applying a fixed list of substitutions.

    :param la: label (string)
    :return: the label after every substitution was applied, in order
    """
    # Order matters: "onxpython_compiled" must be handled before its
    # prefix "onxpython".
    substitutions = (
        ("onxpython_compiled", "opy"),
        ("onxpython", "opy"),
        ("onxonnxruntime1", "ort"),
        ("fit_intercept", "fi"),
        ("True", "1"),
        ("False", "0"),
        ("max_depth", "mxd"),
    )
    for old, new in substitutions:
        la = la.replace(old, new)
    return la


from pymlbenchmark.plotting import plot_bench_results
# One row of plots per value of N, one column per value of dim, the number
# of nodes on the x axis. The title names the two libraries this benchmark
# actually compares (numpy and onnxruntime, not scikit-learn).
plot_bench_results(df, row_cols='N', col_cols='dim',
                   x_value='nbnode',
                   title="%s\nBenchmark numpy / onnxruntime" % "Cascade Add",
                   label_fct=label_fct)

plt.savefig("%s.node.png" % filename)


##################################
# Plot one ONNX graph
# +++++++++++++++++++

import sys
from onnx.tools.net_drawer import GetPydotGraph, GetOpNodeProducer

# Renders one picture per graph size. Reading, drawing and saving the image
# happen inside the loop so that every size gets its own file (the original
# code only saved the picture of the last graph).
for nbnode in (2, 4):
    onx = generate_onnx_graph(5, nbnode)[0]

    pydot_graph = GetPydotGraph(onx.graph, name=onx.graph.name, rankdir="TB",
                                node_producer=GetOpNodeProducer("docstring"))
    pydot_graph.write_dot("graph.%d.dot" % nbnode)
    # Requires the graphviz `dot` executable; it writes graph.<n>.dot.png.
    os.system('dot -O -Tpng graph.%d.dot' % nbnode)

    # A fresh figure per graph: the picture is not drawn over the previous
    # graph nor over the benchmark figure created earlier.
    plt.figure()
    image = plt.imread("graph.%d.dot.png" % nbnode)
    plt.imshow(image)
    plt.axis('off')
    plt.savefig("%s.%d.node.png" % (filename, nbnode))

# Figures are only displayed when the script is not run with --quiet.
if "--quiet" not in sys.argv:
    plt.show()

Benchmark (ONNX) for Addition#

Overview#

Configuration#

Raw results#

Benchmark code#

Overview #

Configuration #

Raw results #

Benchmark code #