Benchmark (ONNX) for Scaler#

The experiment compares the execution time of numpy and onnxruntime for a series (or cascade) of scaling operations.

$y = (((X + M_1) + M_2) + ...) + M_k$

k is the number of nodes; the corresponding ONNX graph for k=2 or 4 is a cascade of Scaler operators. numpy uses BLAS functions, onnxruntime does not.

k=2	k=4

Overview #

(Source code, png, hires.png, pdf)

../_images/onnxruntime_casc_scaler-1.png

Configuration #

<<<

from pyquickhelper.pandashelper import df2rst
import pandas
# NOTE(review): `os` and `__WD__` are not defined in this snippet; presumably
# the documentation runner injects them before execution - confirm.
name = os.path.join(
    __WD__, "../../onnx/results/bench_plot_onnxruntime_casc_scaler.time.csv")
# Load the ".time.csv" file and print it as an RST table.
df = pandas.read_csv(name)
print(df2rst(df, number_format=4))

>>>

name	version	value
date	2019-12-11
python		3.7.2 (default, Mar 1 2019, 18:34:21) [GCC 6.3.0 20170516]
platform		linux
OS		Linux-4.9.0-8-amd64-x86_64-with-debian-9.6
machine		x86_64
processor
release		4.9.0-8-amd64
architecture		(‘64bit’, ‘’)
mlprodict	not-imported
numpy	1.17.4	openblas, language=c
onnx	1.6.34	opset=12
onnxruntime	1.1.992	CPU-MKL-ML
pandas	0.25.3
skl2onnx	1.6.992
sklearn	0.22

Raw results #

bench_plot_onnxruntime_casc_scaler.csv

<<<

from pyquickhelper.pandashelper import df2rst
from pymlbenchmark.benchmark.bench_helper import bench_pivot
import pandas
# NOTE(review): `os` and `__WD__` are not defined in this snippet; presumably
# the documentation runner injects them before execution - confirm.
name = os.path.join(
    __WD__, "../../onnx/results/bench_plot_onnxruntime_casc_scaler.perf.csv")
df = pandas.read_csv(name)
# Pivot the raw measurements; the result exposes one column per library
# ('npy' and 'ort' are read on the next line).
piv = bench_pivot(df).reset_index(drop=False)
# Ratio of the numpy column to the onnxruntime column: a value above 1 means
# the 'ort' measurement is smaller than the 'npy' one.
piv['speedup'] = piv['npy'] / piv['ort']
print(df2rst(piv, number_format=4))

N	dim	nbnode	number	count	npy	ort	speedup
1	1	1	2	20	1.603e-05	2.766e-05	0.5795
1	1	2	2	20	2.465e-05	2.901e-05	0.8498
1	1	3	2	20	3.047e-05	2.725e-05	1.118
1	1	5	2	20	4.625e-05	2.995e-05	1.544
1	1	10	2	20	8.724e-05	3.165e-05	2.757
1	1	50	2	20	0.0004088	5.622e-05	7.271
1	1	100	2	20	0.0007946	8.771e-05	9.06
1	1	150	2	20	0.001182	0.0001185	9.975
1	1	200	2	20	0.00158	0.0001482	10.66
1	1	250	2	20	0.001986	0.0001819	10.92
1	1	300	2	20	0.00236	0.0002098	11.25
1	10	1	2	20	1.351e-05	2.709e-05	0.4987
1	10	2	2	20	2.027e-05	6.18e-05	0.3281
1	10	3	2	20	2.722e-05	6.286e-05	0.433
1	10	5	2	20	4.126e-05	6.341e-05	0.6507
1	10	10	2	20	7.849e-05	6.923e-05	1.134
1	10	50	2	20	0.0003579	0.0001008	3.552
1	10	100	2	20	0.0007039	0.000136	5.177
1	10	150	2	20	0.001053	0.0001737	6.06
1	10	200	2	20	0.001396	0.0002131	6.549
1	10	250	2	20	0.001734	0.0002497	6.943
1	10	300	2	20	0.002082	0.0002877	7.237
1	100	1	2	20	1.373e-05	6.719e-05	0.2043
1	100	2	2	20	2.102e-05	0.0003388	0.06206
1	100	3	2	20	2.922e-05	0.0003446	0.08481
1	100	5	2	20	4.245e-05	0.0003443	0.1233
1	100	10	2	20	7.982e-05	0.0003353	0.2381
1	100	50	2	20	0.0003655	0.0004543	0.8045
1	100	100	2	20	0.0007225	0.0005206	1.388
1	100	150	2	20	0.001081	0.0006117	1.767
1	100	200	2	20	0.001421	0.0007177	1.98
1	100	250	2	20	0.001787	0.0008506	2.1
1	100	300	2	20	0.002164	0.0009353	2.314
10	1	1	2	20	1.439e-05	2.777e-05	0.5184
10	1	2	2	20	2.201e-05	2.872e-05	0.7665
10	1	3	2	20	2.745e-05	2.836e-05	0.9679
10	1	5	2	20	4.09e-05	2.816e-05	1.452
10	1	10	2	20	7.62e-05	3.368e-05	2.263
10	1	50	2	20	0.0003594	6.205e-05	5.791
10	1	100	2	20	0.0007048	9.822e-05	7.175
10	1	150	2	20	0.001053	0.0001362	7.735
10	1	200	2	20	0.001384	0.0001723	8.031
10	1	250	2	20	0.001725	0.0002076	8.311
10	1	300	2	20	0.002072	0.0002435	8.508
10	10	1	2	20	1.498e-05	2.806e-05	0.5339
10	10	2	2	20	2.309e-05	2.987e-05	0.773
10	10	3	2	20	3.12e-05	3.197e-05	0.9758
10	10	5	2	20	4.743e-05	3.664e-05	1.294
10	10	10	2	20	8.973e-05	4.788e-05	1.874
10	10	50	2	20	0.0004143	0.000143	2.898
10	10	100	2	20	0.0008544	0.0002539	3.366
10	10	150	2	20	0.001244	0.0003628	3.428
10	10	200	2	20	0.001632	0.0004774	3.419
10	10	250	2	20	0.002055	0.0005892	3.488
10	10	300	2	20	0.002462	0.0007005	3.514
10	100	1	2	20	2.126e-05	4.402e-05	0.4829
10	100	2	2	20	3.578e-05	6.241e-05	0.5734
10	100	3	2	20	4.825e-05	7.992e-05	0.6037
10	100	5	2	20	7.351e-05	0.0001168	0.6296
10	100	10	2	20	0.0001391	0.0002042	0.6809
10	100	50	2	20	0.0006445	0.0009069	0.7107
10	100	100	2	20	0.001299	0.001786	0.727
10	100	150	2	20	0.001928	0.002658	0.7252
10	100	200	2	20	0.002572	0.003542	0.7261
10	100	250	2	20	0.003203	0.004414	0.7257
10	100	300	2	20	0.003842	0.005289	0.7265
100	1	1	2	20	1.335e-05	2.813e-05	0.4744
100	1	2	2	20	2.064e-05	3.104e-05	0.665
100	1	3	2	20	2.796e-05	3.19e-05	0.8765
100	1	5	2	20	4.169e-05	3.625e-05	1.15
100	1	10	2	20	7.742e-05	4.737e-05	1.634
100	1	50	2	20	0.0003617	0.0001435	2.52
100	1	100	2	20	0.000722	0.000253	2.854
100	1	150	2	20	0.001071	0.0003657	2.928
100	1	200	2	20	0.001428	0.0004783	2.986
100	1	250	2	20	0.001807	0.0005912	3.057
100	1	300	2	20	0.002126	0.0007064	3.009
100	10	1	2	20	2.33e-05	4.389e-05	0.5308
100	10	2	2	20	3.955e-05	6.282e-05	0.6296
100	10	3	2	20	5.501e-05	7.929e-05	0.6938
100	10	5	2	20	8.742e-05	0.000114	0.7668
100	10	10	2	20	0.0001643	0.0002032	0.8083
100	10	50	2	20	0.0007769	0.0009034	0.86
100	10	100	2	20	0.001543	0.001798	0.8584
100	10	150	2	20	0.002308	0.002648	0.8716
100	10	200	2	20	0.003104	0.003515	0.883
100	10	250	2	20	0.003859	0.004389	0.8792
100	10	300	2	20	0.004622	0.00526	0.8786
100	100	1	2	20	6.985e-05	0.0002039	0.3426
100	100	2	2	20	0.0001253	0.000371	0.3377
100	100	3	2	20	0.0001779	0.0005469	0.3253
100	100	5	2	20	0.0002855	0.0008846	0.3227
100	100	10	2	20	0.0005529	0.001732	0.3192
100	100	50	2	20	0.002692	0.008506	0.3165
100	100	100	2	20	0.00537	0.01696	0.3166
100	100	150	2	20	0.008042	0.02544	0.3161
100	100	200	2	20	0.01083	0.03395	0.3191
100	100	250	2	20	0.01351	0.0424	0.3186
100	100	300	2	20	0.01622	0.0508	0.3192
1000	1	1	2	20	2.337e-05	4.626e-05	0.5051
1000	1	2	2	20	3.018e-05	6.56e-05	0.4601
1000	1	3	2	20	4.189e-05	7.951e-05	0.5268
1000	1	5	2	20	6.488e-05	0.0001153	0.5629
1000	1	10	2	20	0.0001218	0.0002043	0.5961
1000	1	50	2	20	0.0005856	0.0009157	0.6395
1000	1	100	2	20	0.001123	0.001789	0.628
1000	1	150	2	20	0.001689	0.002672	0.6319
1000	1	200	2	20	0.002226	0.00355	0.6272
1000	1	250	2	20	0.002783	0.004427	0.6286
1000	1	300	2	20	0.003569	0.005334	0.669
1000	10	1	2	20	9.643e-05	0.0001982	0.4866
1000	10	2	2	20	0.0001761	0.0003755	0.469
1000	10	3	2	20	0.0002564	0.0005407	0.4743
1000	10	5	2	20	0.0004172	0.0008864	0.4707
1000	10	10	2	20	0.00082	0.00173	0.4739
1000	10	50	2	20	0.004029	0.008516	0.4731
1000	10	100	2	20	0.00806	0.01698	0.4748
1000	10	150	2	20	0.01206	0.02542	0.4744
1000	10	200	2	20	0.01604	0.03387	0.4735
1000	10	250	2	20	0.02009	0.0423	0.475
1000	10	300	2	20	0.02412	0.05075	0.4752
1000	100	1	2	20	0.0005876	0.001853	0.3171
1000	100	2	2	20	0.00101	0.003535	0.2858
1000	100	3	2	20	0.001426	0.005222	0.2731
1000	100	5	2	20	0.002261	0.008589	0.2632
1000	100	10	2	20	0.004263	0.01696	0.2513
1000	100	50	2	20	0.02108	0.08405	0.2508
1000	100	100	2	20	0.04183	0.1674	0.2499
1000	100	150	2	20	0.06292	0.2501	0.2516
1000	100	200	2	20	0.08496	0.3334	0.2548
1000	100	250	2	20	0.1053	0.4176	0.252
1000	100	300	2	20	0.125	0.5	0.2501
10000	1	1	2	20	7.066e-05	0.0002172	0.3254
10000	1	2	2	20	9.782e-05	0.0003771	0.2594
10000	1	3	2	20	0.000138	0.0005413	0.2549
10000	1	5	2	20	0.0002189	0.0008909	0.2457
10000	1	10	2	20	0.0004256	0.00176	0.2418
10000	1	50	2	20	0.002026	0.008639	0.2345
10000	1	100	2	20	0.00404	0.01718	0.2352
10000	1	150	2	20	0.006039	0.02569	0.235
10000	1	200	2	20	0.008043	0.03434	0.2343
10000	1	250	2	20	0.01006	0.04289	0.2345
10000	1	300	2	20	0.01205	0.05143	0.2342
10000	10	1	2	20	0.0008476	0.001873	0.4525
10000	10	2	2	20	0.001528	0.003535	0.4323
10000	10	3	2	20	0.00221	0.0052	0.4249
10000	10	5	2	20	0.003565	0.008617	0.4137
10000	10	10	2	20	0.006969	0.01706	0.4085
10000	10	50	2	20	0.03442	0.08498	0.4051
10000	10	100	2	20	0.06824	0.1678	0.4066
10000	10	150	2	20	0.1031	0.2533	0.4071
10000	10	200	2	20	0.1372	0.3348	0.4097
10000	10	250	2	20	0.1696	0.4191	0.4048
10000	10	300	2	20	0.2037	0.5008	0.4068
10000	100	1	2	20	0.006234	0.01833	0.34
10000	100	2	2	20	0.01045	0.03544	0.2949
10000	100	3	2	20	0.01446	0.05254	0.2753
10000	100	5	2	20	0.0231	0.08642	0.2673
10000	100	10	2	20	0.04383	0.1711	0.2561
10000	100	50	2	20	0.2109	0.8493	0.2483
10000	100	100	2	20	0.4204	1.696	0.2478
10000	100	150	2	20	0.6228	2.544	0.2448
10000	100	200	2	20	0.8446	3.393	0.2489
10000	100	250	2	20	1.047	4.242	0.2468
10000	100	300	2	20	1.244	5.089	0.2444

Benchmark code #

bench_plot_onnxruntime_casc_scaler.py

# coding: utf-8
"""
Benchmark of :epkg:`onnxruntime` for a cascade of scalers (additions).
"""
# Authors: Xavier Dupré (benchmark)
# License: MIT
import matplotlib
matplotlib.use('Agg')

import os
import unittest
import warnings
import contextlib
from time import perf_counter as time
from io import StringIO
import numpy
import pandas
import matplotlib.pyplot as plt
import sklearn
from sklearn.utils._testing import ignore_warnings
from sklearn.utils.extmath import softmax
from pyquickhelper.loghelper import run_cmd, sys_path_append
from pymlbenchmark.benchmark import BenchPerfTest, BenchPerf
from pymlbenchmark.context import machine_information
from pymlbenchmark.datasets.artificial import random_binary_classification
from pymlbenchmark.plotting import plot_bench_results
from skl2onnx.common.data_types import FloatTensorType
from skl2onnx.algebra.onnx_ops import OnnxScaler
from onnxruntime import InferenceSession
from mlprodict import get_ir_version, __max_supported_opset__

################################
# Benchmark
# +++++++++


def generate_onnx_graph(dim, nbnode, input_name='X1'):
    """
    Builds an ONNX graph made of consecutive Scaler operators.

    :param dim: number of features of the input tensor
    :param nbnode: number of Scaler nodes to chain, the graph
        always contains at least one node
    :param input_name: name of the graph input
    :return: tuple *(onx, matrices)* where *onx* is the ONNX model
        and *matrices* is the list of offsets given to the nodes,
        one per node, in graph order
    """
    # Every node uses the same scale made of ones.
    unit_scale = list(numpy.ones((1, dim)).ravel())

    def draw_offset():
        # Negated first row drawn from random_binary_classification(1, dim).
        return list(-random_binary_classification(1, dim)[0].ravel())

    offsets = []
    previous = input_name
    # All nodes but the last one: each takes the previous node as input.
    for _ in range(nbnode - 1):
        offset = draw_offset()
        offsets.append(offset)
        previous = OnnxScaler(previous, offset=offset, scale=unit_scale)

    # The last node is the only one with a named output ('Y').
    final_offset = draw_offset()
    offsets.append(final_offset)
    last_node = OnnxScaler(previous, offset=final_offset, scale=unit_scale,
                           output_names=['Y'])

    graph_inputs = [(input_name, FloatTensorType((None, dim)))]
    graph_outputs = [('Y', FloatTensorType((None, dim)))]
    onx = last_node.to_onnx(graph_inputs, outputs=graph_outputs)
    onx.ir_version = get_ir_version(__max_supported_opset__)
    return onx, offsets


class GraphORtBenchPerfTest(BenchPerfTest):
    """
    Benchmark case comparing :epkg:`onnxruntime` and :epkg:`numpy`
    on a cascade of *nbnode* Scaler operators.

    :param dim: number of features of the input
    :param nbnode: number of Scaler nodes in the cascade
    """

    def __init__(self, dim=4, nbnode=3):
        BenchPerfTest.__init__(self)
        self.input_name = 'X1'
        self.nbnode = nbnode
        self.scale = numpy.ones((1, dim))
        self.onx, self.matrices = generate_onnx_graph(
            dim, nbnode, self.input_name)
        as_string = self.onx.SerializeToString()
        try:
            self.ort = InferenceSession(as_string)
        except RuntimeError as e:
            # Adds the model to the message and keeps the original
            # exception as the cause.
            raise RuntimeError("Issue with {}\n{}".format(
                e, self.onx)) from e

    def fcts(self, **kwargs):
        """
        Returns the functions to benchmark, one dictionary per library
        with keys ``'lib'`` and ``'fct'``.
        """
        # The offsets are stored as Python lists; they are converted once
        # here so that the timed numpy function does not pay for a
        # list-to-array conversion at every node.
        offsets = [numpy.asarray(mat, dtype=numpy.float32)
                   for mat in self.matrices]

        def predict_ort(X, model=self.ort):
            return model.run(None, {self.input_name: X})[0]

        def predict_npy(X, model=offsets, scale=self.scale):
            # Same computation as the ONNX cascade: the Scaler operator
            # computes (X - offset) * scale at every node.
            res = X.copy()
            for offset in model:
                res -= offset
                res *= scale
            return res

        return [{'lib': 'ort', 'fct': predict_ort},
                {'lib': 'npy', 'fct': predict_npy}]

    def data(self, N=10, dim=4, **kwargs):  # pylint: disable=W0221
        """
        Returns the benchmark input as a one-element tuple: the first
        item returned by ``random_binary_classification(N, dim)``
        converted to float32.
        """
        return tuple(o.astype(numpy.float32)
                     for o in random_binary_classification(N, dim)[:1])


@ignore_warnings(category=FutureWarning)
def run_bench(repeat=20, number=2, verbose=False):
    """
    Runs the benchmark over the grid of dimensions, number of nodes
    and number of observations, prints the total elapsed time.

    :param repeat: forwarded to ``BenchPerf.enumerate_run_benchs``
    :param number: forwarded to ``BenchPerf.enumerate_run_benchs``
    :param verbose: forwarded to ``BenchPerf.enumerate_run_benchs``
    :return: the collected results as a :epkg:`pandas` DataFrame
    """
    # First grid: these values reach the test constructor through make_test.
    params_before = {
        'dim': [1, 10, 100],
        'nbnode': [1, 2, 3, 5, 10, 50, 100, 150, 200, 250, 300],
    }
    # Second grid: number of observations.
    params_after = {'N': [1, 10, 100, 1000, 10000]}

    def make_test(dim=None, **opts):
        return GraphORtBenchPerfTest(dim=dim, **opts)

    bench = BenchPerf(params_before, params_after, make_test)

    with sklearn.config_context(assume_finite=True):
        begin = time()
        rows = list(bench.enumerate_run_benchs(
            repeat=repeat, verbose=verbose,
            number=number, stop_if_error=False))
        finish = time()

    results_df = pandas.DataFrame(rows)
    print("Total time = %0.3f sec\n" % (finish - begin))
    return results_df

#########################
# Runs the benchmark
# ++++++++++++++++++


# Base name of this script (directory and extension stripped); it prefixes
# the names of the files written by this script.
filename = os.path.splitext(os.path.split(__file__)[-1])[0]
df = run_bench(verbose=True)
# Saves the benchmark results next to the current working directory files.
df.to_csv("%s.perf.csv" % filename, index=False)
print(df.head())

#########################
# Extracts information about the machine used
# +++++++++++++++++++++++++++++++++++++++++++

# Packages given to machine_information (presumably to report their
# versions - confirm against pymlbenchmark).
pkgs = ['numpy', 'pandas', 'sklearn', 'skl2onnx',
        'onnxruntime', 'onnx', 'mlprodict']
dfi = pandas.DataFrame(machine_information(pkgs))
dfi.to_csv("%s.time.csv" % filename, index=False)
print(dfi)


#############################
# Plot the results by number of nodes
# +++++++++++++++++++++++++++++++++++

def label_fct(la):
    """
    Shortens a label by applying a fixed list of substitutions.

    :param la: label to shorten
    :return: shortened label
    """
    # Applied in this order: 'onxpython_compiled' must be handled before
    # its prefix 'onxpython'.
    substitutions = (
        ("onxpython_compiled", "opy"),
        ("onxpython", "opy"),
        ("onxonnxruntime1", "ort"),
        ("fit_intercept", "fi"),
        ("True", "1"),
        ("False", "0"),
        ("max_depth", "mxd"),
    )
    for long_name, short_name in substitutions:
        la = la.replace(long_name, short_name)
    return la


from pymlbenchmark.plotting import plot_bench_results
# One row of plots per N, one column per dim, number of nodes on the x axis.
# The title names the two libraries actually compared by this benchmark
# (numpy and onnxruntime).
plot_bench_results(df, row_cols='N', col_cols='dim',
                   x_value='nbnode',
                   title="Cascade Scaler\nBenchmark numpy / onnxruntime",
                   label_fct=label_fct)

plt.savefig("%s.node.png" % filename)


##################################
# Plot one ONNX graph
# +++++++++++++++++++

# Imported once, before the loop.
from onnx.tools.net_drawer import GetPydotGraph, GetOpNodeProducer

for nbnode in (2, 4):
    onx = generate_onnx_graph(5, nbnode)[0]

    pydot_graph = GetPydotGraph(onx.graph, name=onx.graph.name, rankdir="TB",
                                node_producer=GetOpNodeProducer("docstring"))
    pydot_graph.write_dot("graph.%d.dot" % nbnode)
    # With -O, dot names its output after the input file: graph.<k>.dot.png
    os.system('dot -O -Tpng graph.%d.dot' % nbnode)

    # The image is rendered and saved inside the loop so that one file is
    # produced per graph, on a new figure so that it is not drawn over a
    # previous plot.
    plt.figure()
    image = plt.imread("graph.%d.dot.png" % nbnode)
    plt.imshow(image)
    plt.axis('off')
    plt.savefig("%s.%d.node.png" % (filename, nbnode))

import sys
# The figures are displayed unless the script is run with --quiet.
if "--quiet" not in sys.argv:
    plt.show()

Benchmark (ONNX) for Scaler#

Overview#

Configuration#

Raw results#

Benchmark code#

Overview #

Configuration #

Raw results #

Benchmark code #