.. DO NOT EDIT.
.. THIS FILE WAS AUTOMATICALLY GENERATED BY SPHINX-GALLERY.
.. TO MAKE CHANGES, EDIT THE SOURCE PYTHON FILE:
.. "gyexamples/plot_op_reducesum.py"
.. LINE NUMBERS ARE GIVEN BELOW.

.. only:: html

    .. note::
        :class: sphx-glr-download-link-note

        Click :ref:`here <sphx_glr_download_gyexamples_plot_op_reducesum.py>`
        to download the full example code

.. rst-class:: sphx-glr-example-title

.. _sphx_glr_gyexamples_plot_op_reducesum.py:


.. _l-b-reducesum:

Compares implementations of ReduceSum
=====================================

This example compares :epkg:`numpy:sum` from numpy
to the :epkg:`onnxruntime` implementation.
If available, :epkg:`tensorflow` and :epkg:`pytorch` are included as well.

.. contents::
    :local:

Available optimisation
++++++++++++++++++++++

The code shows which parallelisation optimisation can be used,
*AVX* or *SSE*, and the number of available processors.

.. GENERATED FROM PYTHON SOURCE LINES 20-32

.. code-block:: default

    import numpy
    import pandas
    import matplotlib.pyplot as plt
    from onnxruntime import InferenceSession
    from skl2onnx.common.data_types import FloatTensorType
    from skl2onnx.algebra.onnx_ops import OnnxReduceSumApi11
    from cpyquickhelper.numbers import measure_time
    from tqdm import tqdm
    from mlprodict.testing.experimental_c_impl.experimental_c import (
        code_optimisation, custom_reducesum_rk_float)
    print(code_optimisation())


.. rst-class:: sphx-glr-script-out

 .. code-block:: none

    AVX-omp=8


.. GENERATED FROM PYTHON SOURCE LINES 33-35

ReduceSum implementations
+++++++++++++++++++++++++

.. GENERATED FROM PYTHON SOURCE LINES 35-175

.. code-block:: default


    try:
        from tensorflow.math import reduce_sum as tf_reduce_sum
        from tensorflow import convert_to_tensor
    except ImportError:
        tf_reduce_sum = None
    try:
        from torch import sum as torch_sum, from_numpy
    except ImportError:
        torch_sum = None


    def build_ort_reducesum(axes, op_version=14):  # opset=13, 14, ...
        """
        Creates an ONNX graph holding a single ReduceSum node over *axes*
        and returns a callable running it with :epkg:`onnxruntime`.

        :param axes: axes to reduce
        :param op_version: opset used for the node and the converted model
        :return: function ``f(x, y)`` returning the outputs of the session
            for input *x*; *y* is accepted to share the signature of the
            other benchmarked functions but is not used
        """
        reduce_node = OnnxReduceSumApi11(
            'x', axes=axes, op_version=op_version, output_names=['z'])
        model = reduce_node.to_onnx(
            inputs=[('x', FloatTensorType())], target_opset=op_version)
        session = InferenceSession(model.SerializeToString())

        def run_ort(x, y):
            # The axes are stored in the graph, *y* is ignored.
            return session.run(None, {'x': x})

        return run_ort


    def loop_fct(fct, xs, ys):
        """
        Calls ``fct(x, y)`` on every pair taken from *xs* and *ys*
        (pairs are built with :func:`zip`, results are discarded).
        """
        for pair in zip(xs, ys):
            fct(*pair)


    def benchmark_op(axes, repeat=5, number=5, name="ReduceSum", shape_fct=None,
                     custom_impl=False):
        """
        Measures ReduceSum over *axes* for several input sizes with numpy,
        onnxruntime and, when they could be imported, tensorflow and pytorch,
        then plots the raw timings and the speedup against numpy.

        :param axes: tuple of axes to reduce
        :param repeat: forwarded to ``measure_time``
        :param number: forwarded to ``measure_time``
        :param name: operator name displayed in the graph titles
        :param shape_fct: function returning the input shape for a dimension
            *N*, defaults to ``lambda dim: (3, dim, 1, 128, 64)``
        :param custom_impl: if True, ``custom_reducesum_rk_float`` is measured
            as well, this is only supported for ``axes == (0, )``
        :return: tuple ``(df, rs, ax)``, *df* holds the raw measures,
            *rs* the speedups with numpy as a baseline (one column per
            implementation), *ax* the matplotlib axes of both graphs
        :raises RuntimeError: if *custom_impl* is True and *axes* is not
            ``(0, )``
        """
        if shape_fct is None:
            def shape_fct(dim):
                return (3, dim, 1, 128, 64)

        # Fails before any measure is done rather than in the middle
        # of the first iteration.
        if custom_impl and axes != (0, ):
            raise RuntimeError(
                f"Unexpected axes={axes!r}.")

        ort_fct = build_ort_reducesum(axes)

        torch_fct = None
        if torch_sum is not None:
            def torch_sum1(x, y):
                return torch_sum(x, y[0])

            def torch_sum2(x, y):
                # Reduces the second axis first, the first one afterwards.
                return torch_sum(torch_sum(x, y[1]), y[0])

            torch_fct = torch_sum1 if len(axes) == 1 else torch_sum2

        res = []

        def measure(label, fct, xs, ys, dim, info):
            # Runs *fct* on every pair (x, y) and stores the observation.
            ctx = dict(xs=xs, ys=ys, fct=fct, loop_fct=loop_fct)
            obs = measure_time(
                "loop_fct(fct, xs, ys)",
                div_by_number=True, context=ctx, repeat=repeat, number=number)
            obs['dim'] = dim
            obs['fct'] = label
            obs.update(info)
            res.append(obs)

        for dim in tqdm([8, 16, 32, 64, 100, 128, 200,
                         256, 400, 512, 1024]):
            shape = shape_fct(dim)
            # Fewer arrays are generated for the biggest dimensions.
            n_arrays = 10 if dim < 512 else 4
            xs = [numpy.random.rand(*shape).astype(numpy.float32)
                  for _ in range(n_arrays)]
            ys = [numpy.array(axes, dtype=numpy.int64)
                  for _ in range(n_arrays)]
            info = dict(axes=axes, shape=shape)

            # numpy: the axes must be given as a tuple through parameter
            # *axis*. Unpacking them as positional arguments would send the
            # second axis to parameter *dtype* of numpy.sum.
            measure('numpy',
                    lambda x, y: numpy.sum(x, axis=tuple(y.tolist())),
                    xs, ys, dim, info)

            # onnxruntime
            measure('ort', ort_fct, xs, ys, dim, info)

            if custom_impl:
                # The custom implementation receives a 2D contiguous copy.
                measure('custom',
                        lambda x, y: custom_reducesum_rk_float(x),
                        [x.reshape((x.shape[0], -1)).copy() for x in xs],
                        ys, dim, info)

            if tf_reduce_sum is not None:
                # tensorflow
                measure('tf', tf_reduce_sum,
                        [convert_to_tensor(x) for x in xs], ys, dim, info)

            if torch_fct is not None:
                # torch
                measure('torch', torch_fct,
                        [from_numpy(x) for x in xs], ys, dim, info)

        # Dataframes
        # *shape* and *dim* hold the values of the last iteration.
        shape_name = str(shape).replace(str(dim), "N")
        df = pandas.DataFrame(res)
        df.columns = [_.replace('dim', 'N') for _ in df.columns]
        # Keyword arguments: positional arguments are deprecated
        # in DataFrame.pivot.
        piv = df.pivot(index='N', columns='fct', values='average')

        # Speedup of every implementation (custom included) against numpy.
        rs = piv.copy()
        for c in rs.columns:
            if c != 'numpy':
                rs[c] = rs['numpy'] / rs[c]
        rs['numpy'] = 1.

        # Graphs.
        fig, ax = plt.subplots(1, 2, figsize=(12, 4))
        piv.plot(logx=True, logy=True, ax=ax[0],
                 title=f"{name} benchmark\n{shape_name!r} - {axes!r} lower better")
        ax[0].legend(prop={"size": 9})
        rs.plot(logx=True, logy=True, ax=ax[1],
                title="%s Speedup, baseline=numpy\n%r - %r"
                      " higher better" % (name, shape_name, axes))
        # Horizontal guides at speedups 0.5 and 2.
        ax[1].plot([min(rs.index), max(rs.index)], [0.5, 0.5], 'g--')
        ax[1].plot([min(rs.index), max(rs.index)], [2., 2.], 'g--')
        ax[1].legend(prop={"size": 9})
        return df, rs, ax


    # Gathers the dataframe returned by every benchmark run below.
    dfs = []


.. GENERATED FROM PYTHON SOURCE LINES 176-185

Reduction on a particular case KR
+++++++++++++++++++++++++++++++++

Consecutive axes which are not reduced and consecutive reduced
axes are merged.
KR means kept axis - reduced axis.

(8, 24, 48, N), axis=(3, )
^^^^^^^^^^^^^^^^^^^^^^^^^^

.. GENERATED FROM PYTHON SOURCE LINES 185-191

.. code-block:: default


    # KR case: only the last axis is reduced.
    axes = (3, )
    df, piv, ax = benchmark_op(axes, shape_fct=lambda dim: (8, 24, 48, dim))
    dfs.append(df)
    # Keyword arguments: positional arguments are deprecated in DataFrame.pivot.
    df.pivot(index="fct", columns="N", values="average")


.. image-sg:: /gyexamples/images/sphx_glr_plot_op_reducesum_001.png
   :alt: ReduceSum benchmark '(8, 24, 48, N)' - (3,) lower better, ReduceSum Speedup, baseline=numpy '(8, 24, 48, N)' - (3,) higher better
   :srcset: /gyexamples/images/sphx_glr_plot_op_reducesum_001.png
   :class: sphx-glr-single-img


.. rst-class:: sphx-glr-script-out

 .. code-block:: none


      0%|          | 0/11 [00:00<?, ?it/s]
      9%|9         | 1/11 [00:01<00:13,  1.37s/it]
     18%|#8        | 2/11 [00:03<00:13,  1.55s/it]
     27%|##7       | 3/11 [00:04<00:13,  1.66s/it]
     36%|###6      | 4/11 [00:06<00:11,  1.68s/it]
     45%|####5     | 5/11 [00:08<00:10,  1.71s/it]
     55%|#####4    | 6/11 [00:10<00:09,  1.97s/it]
     64%|######3   | 7/11 [00:13<00:09,  2.28s/it]
     73%|#######2  | 8/11 [00:17<00:07,  2.62s/it]
     82%|########1 | 9/11 [00:21<00:06,  3.04s/it]
     91%|######### | 10/11 [00:22<00:02,  2.66s/it]
    100%|##########| 11/11 [00:25<00:00,  2.77s/it]
    100%|##########| 11/11 [00:25<00:00,  2.35s/it]
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:151: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      piv = df.pivot('N', 'fct', 'average')
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:189: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      df.pivot("fct", "N", "average")


.. raw:: html

    <div class="output_subarea output_html rendered_html output_result">
    <div>
    <style scoped>
        .dataframe tbody tr th:only-of-type {
            vertical-align: middle;
        }

        .dataframe tbody tr th {
            vertical-align: top;
        }

        .dataframe thead th {
            text-align: right;
        }
    </style>
    <table border="1" class="dataframe">
      <thead>
        <tr style="text-align: right;">
          <th>N</th>
          <th>8</th>
          <th>16</th>
          <th>32</th>
          <th>64</th>
          <th>100</th>
          <th>128</th>
          <th>200</th>
          <th>256</th>
          <th>400</th>
          <th>512</th>
          <th>1024</th>
        </tr>
        <tr>
          <th>fct</th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
        </tr>
      </thead>
      <tbody>
        <tr>
          <th>numpy</th>
          <td>0.004108</td>
          <td>0.004851</td>
          <td>0.006410</td>
          <td>0.007902</td>
          <td>0.010157</td>
          <td>0.011906</td>
          <td>0.017698</td>
          <td>0.021819</td>
          <td>0.031517</td>
          <td>0.015750</td>
          <td>0.031232</td>
        </tr>
        <tr>
          <th>ort</th>
          <td>0.001496</td>
          <td>0.001562</td>
          <td>0.002094</td>
          <td>0.003191</td>
          <td>0.004674</td>
          <td>0.005394</td>
          <td>0.007278</td>
          <td>0.009411</td>
          <td>0.011706</td>
          <td>0.006069</td>
          <td>0.011118</td>
        </tr>
        <tr>
          <th>torch</th>
          <td>0.048272</td>
          <td>0.059100</td>
          <td>0.060178</td>
          <td>0.051081</td>
          <td>0.046577</td>
          <td>0.069638</td>
          <td>0.073717</td>
          <td>0.079963</td>
          <td>0.079712</td>
          <td>0.031400</td>
          <td>0.041889</td>
        </tr>
      </tbody>
    </table>
    </div>
    </div>
    <br />
    <br />

.. GENERATED FROM PYTHON SOURCE LINES 192-201

Reduction on a particular case RK
+++++++++++++++++++++++++++++++++

Consecutive axes which are not reduced and consecutive reduced
axes are merged.
RK means reduced axis - kept axis.

(8, 24, 48, N), axis=(0, )
^^^^^^^^^^^^^^^^^^^^^^^^^^

.. GENERATED FROM PYTHON SOURCE LINES 201-208

.. code-block:: default


    # RK case: only the first axis is reduced, the custom implementation
    # is measured as well.
    axes = (0, )
    df, piv, ax = benchmark_op(axes, shape_fct=lambda dim: (8, 24, 48, dim),
                               custom_impl=True)
    dfs.append(df)
    # Keyword arguments: positional arguments are deprecated in DataFrame.pivot.
    df.pivot(index="fct", columns="N", values="average")


.. image-sg:: /gyexamples/images/sphx_glr_plot_op_reducesum_002.png
   :alt: ReduceSum benchmark '(8, 24, 48, N)' - (0,) lower better, ReduceSum Speedup, baseline=numpy '(8, 24, 48, N)' - (0,) higher better
   :srcset: /gyexamples/images/sphx_glr_plot_op_reducesum_002.png
   :class: sphx-glr-single-img


.. rst-class:: sphx-glr-script-out

 .. code-block:: none


      0%|          | 0/11 [00:00<?, ?it/s]
      9%|9         | 1/11 [00:01<00:19,  2.00s/it]
     18%|#8        | 2/11 [00:03<00:15,  1.77s/it]
     27%|##7       | 3/11 [00:06<00:19,  2.45s/it]
     36%|###6      | 4/11 [00:11<00:23,  3.35s/it]
     45%|####5     | 5/11 [00:17<00:24,  4.11s/it]
     55%|#####4    | 6/11 [00:23<00:24,  4.86s/it]
     64%|######3   | 7/11 [00:29<00:20,  5.13s/it]
     73%|#######2  | 8/11 [00:36<00:17,  5.71s/it]
     82%|########1 | 9/11 [00:44<00:13,  6.51s/it]
     91%|######### | 10/11 [00:48<00:05,  5.68s/it]
    100%|##########| 11/11 [00:53<00:00,  5.67s/it]
    100%|##########| 11/11 [00:53<00:00,  4.89s/it]
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:151: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      piv = df.pivot('N', 'fct', 'average')
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:206: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      df.pivot("fct", "N", "average")


.. raw:: html

    <div class="output_subarea output_html rendered_html output_result">
    <div>
    <style scoped>
        .dataframe tbody tr th:only-of-type {
            vertical-align: middle;
        }

        .dataframe tbody tr th {
            vertical-align: top;
        }

        .dataframe thead th {
            text-align: right;
        }
    </style>
    <table border="1" class="dataframe">
      <thead>
        <tr style="text-align: right;">
          <th>N</th>
          <th>8</th>
          <th>16</th>
          <th>32</th>
          <th>64</th>
          <th>100</th>
          <th>128</th>
          <th>200</th>
          <th>256</th>
          <th>400</th>
          <th>512</th>
          <th>1024</th>
        </tr>
        <tr>
          <th>fct</th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
        </tr>
      </thead>
      <tbody>
        <tr>
          <th>custom</th>
          <td>0.025423</td>
          <td>0.025525</td>
          <td>0.060544</td>
          <td>0.054723</td>
          <td>0.044040</td>
          <td>0.064949</td>
          <td>0.062435</td>
          <td>0.066504</td>
          <td>0.069788</td>
          <td>0.029936</td>
          <td>0.036309</td>
        </tr>
        <tr>
          <th>numpy</th>
          <td>0.001122</td>
          <td>0.002217</td>
          <td>0.003698</td>
          <td>0.006776</td>
          <td>0.010306</td>
          <td>0.017296</td>
          <td>0.027376</td>
          <td>0.035357</td>
          <td>0.054845</td>
          <td>0.030619</td>
          <td>0.054749</td>
        </tr>
        <tr>
          <th>ort</th>
          <td>0.001106</td>
          <td>0.001787</td>
          <td>0.003138</td>
          <td>0.006356</td>
          <td>0.009423</td>
          <td>0.012132</td>
          <td>0.016790</td>
          <td>0.020318</td>
          <td>0.030337</td>
          <td>0.016819</td>
          <td>0.030457</td>
        </tr>
        <tr>
          <th>torch</th>
          <td>0.051417</td>
          <td>0.032783</td>
          <td>0.060105</td>
          <td>0.114873</td>
          <td>0.144508</td>
          <td>0.145739</td>
          <td>0.102461</td>
          <td>0.132251</td>
          <td>0.137654</td>
          <td>0.055817</td>
          <td>0.066265</td>
        </tr>
      </tbody>
    </table>
    </div>
    </div>
    <br />
    <br />

.. GENERATED FROM PYTHON SOURCE LINES 209-218

Reduction on a particular case KRK
++++++++++++++++++++++++++++++++++

Consecutive axes which are not reduced and consecutive reduced
axes are merged.
KRK means kept axis - reduced axis - kept axis.

(8, 24, 48, N), axis=(1, 2)
^^^^^^^^^^^^^^^^^^^^^^^^^^^

.. GENERATED FROM PYTHON SOURCE LINES 218-224

.. code-block:: default


    # KRK case: the two middle axes are reduced.
    axes = (1, 2)
    df, piv, ax = benchmark_op(axes, shape_fct=lambda dim: (8, 24, 48, dim))
    dfs.append(df)
    # Keyword arguments: positional arguments are deprecated in DataFrame.pivot.
    df.pivot(index="fct", columns="N", values="average")


.. image-sg:: /gyexamples/images/sphx_glr_plot_op_reducesum_003.png
   :alt: ReduceSum benchmark '(8, 24, 48, N)' - (1, 2) lower better, ReduceSum Speedup, baseline=numpy '(8, 24, 48, N)' - (1, 2) higher better
   :srcset: /gyexamples/images/sphx_glr_plot_op_reducesum_003.png
   :class: sphx-glr-single-img


.. rst-class:: sphx-glr-script-out

 .. code-block:: none


      0%|          | 0/11 [00:00<?, ?it/s]
      9%|9         | 1/11 [00:00<00:07,  1.36it/s]
     18%|#8        | 2/11 [00:02<00:11,  1.32s/it]
     27%|##7       | 3/11 [00:04<00:13,  1.69s/it]
     36%|###6      | 4/11 [00:06<00:13,  1.90s/it]
     45%|####5     | 5/11 [00:09<00:12,  2.10s/it]
     55%|#####4    | 6/11 [00:12<00:12,  2.41s/it]
     64%|######3   | 7/11 [00:18<00:14,  3.60s/it]
     73%|#######2  | 8/11 [00:25<00:14,  4.80s/it]
     82%|########1 | 9/11 [00:35<00:12,  6.24s/it]
     91%|######### | 10/11 [00:39<00:05,  5.73s/it]
    100%|##########| 11/11 [00:47<00:00,  6.32s/it]
    100%|##########| 11/11 [00:47<00:00,  4.31s/it]
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:151: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      piv = df.pivot('N', 'fct', 'average')
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:222: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      df.pivot("fct", "N", "average")


.. raw:: html

    <div class="output_subarea output_html rendered_html output_result">
    <div>
    <style scoped>
        .dataframe tbody tr th:only-of-type {
            vertical-align: middle;
        }

        .dataframe tbody tr th {
            vertical-align: top;
        }

        .dataframe thead th {
            text-align: right;
        }
    </style>
    <table border="1" class="dataframe">
      <thead>
        <tr style="text-align: right;">
          <th>N</th>
          <th>8</th>
          <th>16</th>
          <th>32</th>
          <th>64</th>
          <th>100</th>
          <th>128</th>
          <th>200</th>
          <th>256</th>
          <th>400</th>
          <th>512</th>
          <th>1024</th>
        </tr>
        <tr>
          <th>fct</th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
        </tr>
      </thead>
      <tbody>
        <tr>
          <th>numpy</th>
          <td>0.002650</td>
          <td>0.004995</td>
          <td>0.009114</td>
          <td>0.018171</td>
          <td>0.028635</td>
          <td>0.035755</td>
          <td>0.056285</td>
          <td>0.071005</td>
          <td>0.110573</td>
          <td>0.056279</td>
          <td>0.128533</td>
        </tr>
        <tr>
          <th>ort</th>
          <td>0.005669</td>
          <td>0.001289</td>
          <td>0.002282</td>
          <td>0.004219</td>
          <td>0.006878</td>
          <td>0.008088</td>
          <td>0.012652</td>
          <td>0.015264</td>
          <td>0.024189</td>
          <td>0.012552</td>
          <td>0.027233</td>
        </tr>
        <tr>
          <th>torch</th>
          <td>0.020311</td>
          <td>0.061180</td>
          <td>0.070951</td>
          <td>0.060121</td>
          <td>0.053398</td>
          <td>0.065635</td>
          <td>0.154997</td>
          <td>0.184678</td>
          <td>0.205907</td>
          <td>0.095580</td>
          <td>0.114066</td>
        </tr>
      </tbody>
    </table>
    </div>
    </div>
    <br />
    <br />

.. GENERATED FROM PYTHON SOURCE LINES 225-227

(8, 24 * 48, N), axis=1
^^^^^^^^^^^^^^^^^^^^^^^

.. GENERATED FROM PYTHON SOURCE LINES 227-233

.. code-block:: default


    # KRK case with a single reduced axis of size 24 * 48.
    axes = (1, )
    df, piv, ax = benchmark_op(axes, shape_fct=lambda dim: (8, 24 * 48, dim))
    dfs.append(df)
    # Keyword arguments: positional arguments are deprecated in DataFrame.pivot.
    df.pivot(index="fct", columns="N", values="average")


.. image-sg:: /gyexamples/images/sphx_glr_plot_op_reducesum_004.png
   :alt: ReduceSum benchmark '(8, 1152, N)' - (1,) lower better, ReduceSum Speedup, baseline=numpy '(8, 1152, N)' - (1,) higher better
   :srcset: /gyexamples/images/sphx_glr_plot_op_reducesum_004.png
   :class: sphx-glr-single-img


.. rst-class:: sphx-glr-script-out

 .. code-block:: none


      0%|          | 0/11 [00:00<?, ?it/s]
      9%|9         | 1/11 [00:00<00:09,  1.04it/s]
     18%|#8        | 2/11 [00:01<00:05,  1.52it/s]
     27%|##7       | 3/11 [00:03<00:10,  1.30s/it]
     36%|###6      | 4/11 [00:04<00:09,  1.39s/it]
     45%|####5     | 5/11 [00:07<00:10,  1.68s/it]
     55%|#####4    | 6/11 [00:09<00:09,  1.98s/it]
     64%|######3   | 7/11 [00:12<00:09,  2.33s/it]
     73%|#######2  | 8/11 [00:16<00:08,  2.75s/it]
     82%|########1 | 9/11 [00:20<00:06,  3.30s/it]
     91%|######### | 10/11 [00:23<00:03,  3.01s/it]
    100%|##########| 11/11 [00:27<00:00,  3.33s/it]
    100%|##########| 11/11 [00:27<00:00,  2.49s/it]
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:151: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      piv = df.pivot('N', 'fct', 'average')
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:231: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      df.pivot("fct", "N", "average")


.. raw:: html

    <div class="output_subarea output_html rendered_html output_result">
    <div>
    <style scoped>
        .dataframe tbody tr th:only-of-type {
            vertical-align: middle;
        }

        .dataframe tbody tr th {
            vertical-align: top;
        }

        .dataframe thead th {
            text-align: right;
        }
    </style>
    <table border="1" class="dataframe">
      <thead>
        <tr style="text-align: right;">
          <th>N</th>
          <th>8</th>
          <th>16</th>
          <th>32</th>
          <th>64</th>
          <th>100</th>
          <th>128</th>
          <th>200</th>
          <th>256</th>
          <th>400</th>
          <th>512</th>
          <th>1024</th>
        </tr>
        <tr>
          <th>fct</th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
        </tr>
      </thead>
      <tbody>
        <tr>
          <th>numpy</th>
          <td>0.004254</td>
          <td>0.004919</td>
          <td>0.006705</td>
          <td>0.009982</td>
          <td>0.011278</td>
          <td>0.013374</td>
          <td>0.017590</td>
          <td>0.021376</td>
          <td>0.031766</td>
          <td>0.015937</td>
          <td>0.030009</td>
        </tr>
        <tr>
          <th>ort</th>
          <td>0.005970</td>
          <td>0.001283</td>
          <td>0.002337</td>
          <td>0.004279</td>
          <td>0.006523</td>
          <td>0.008211</td>
          <td>0.012584</td>
          <td>0.015075</td>
          <td>0.023856</td>
          <td>0.012413</td>
          <td>0.027142</td>
        </tr>
        <tr>
          <th>torch</th>
          <td>0.027301</td>
          <td>0.009960</td>
          <td>0.070464</td>
          <td>0.040462</td>
          <td>0.060979</td>
          <td>0.068766</td>
          <td>0.073370</td>
          <td>0.086237</td>
          <td>0.089010</td>
          <td>0.047131</td>
          <td>0.068266</td>
        </tr>
      </tbody>
    </table>
    </div>
    </div>
    <br />
    <br />

.. GENERATED FROM PYTHON SOURCE LINES 234-236

(2, 8, 12, 24, 2, N), axis=(2, 3)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^

.. GENERATED FROM PYTHON SOURCE LINES 236-242

.. code-block:: default


    # KRK case on a 6D tensor: axes 2 and 3 are reduced.
    axes = (2, 3)
    df, piv, ax = benchmark_op(axes, shape_fct=lambda dim: (2, 8, 12, 24, 2, dim))
    dfs.append(df)
    # Keyword arguments: positional arguments are deprecated in DataFrame.pivot.
    df.pivot(index="fct", columns="N", values="average")


.. image-sg:: /gyexamples/images/sphx_glr_plot_op_reducesum_005.png
   :alt: ReduceSum benchmark '(2, 8, 12, 24, 2, N)' - (2, 3) lower better, ReduceSum Speedup, baseline=numpy '(2, 8, 12, 24, 2, N)' - (2, 3) higher better
   :srcset: /gyexamples/images/sphx_glr_plot_op_reducesum_005.png
   :class: sphx-glr-single-img


.. rst-class:: sphx-glr-script-out

 .. code-block:: none


      0%|          | 0/11 [00:00<?, ?it/s]
      9%|9         | 1/11 [00:01<00:10,  1.04s/it]
     18%|#8        | 2/11 [00:01<00:08,  1.11it/s]
     27%|##7       | 3/11 [00:03<00:11,  1.43s/it]
     36%|###6      | 4/11 [00:06<00:13,  1.88s/it]
     45%|####5     | 5/11 [00:13<00:21,  3.56s/it]
     55%|#####4    | 6/11 [00:19<00:23,  4.68s/it]
     64%|######3   | 7/11 [00:27<00:22,  5.68s/it]
     73%|#######2  | 8/11 [00:36<00:19,  6.55s/it]
     82%|########1 | 9/11 [00:45<00:14,  7.49s/it]
     91%|######### | 10/11 [00:49<00:06,  6.52s/it]
    100%|##########| 11/11 [00:57<00:00,  6.86s/it]
    100%|##########| 11/11 [00:57<00:00,  5.23s/it]
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:151: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      piv = df.pivot('N', 'fct', 'average')
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:240: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      df.pivot("fct", "N", "average")


.. raw:: html

    <div class="output_subarea output_html rendered_html output_result">
    <div>
    <style scoped>
        .dataframe tbody tr th:only-of-type {
            vertical-align: middle;
        }

        .dataframe tbody tr th {
            vertical-align: top;
        }

        .dataframe thead th {
            text-align: right;
        }
    </style>
    <table border="1" class="dataframe">
      <thead>
        <tr style="text-align: right;">
          <th>N</th>
          <th>8</th>
          <th>16</th>
          <th>32</th>
          <th>64</th>
          <th>100</th>
          <th>128</th>
          <th>200</th>
          <th>256</th>
          <th>400</th>
          <th>512</th>
          <th>1024</th>
        </tr>
        <tr>
          <th>fct</th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
        </tr>
      </thead>
      <tbody>
        <tr>
          <th>numpy</th>
          <td>0.002786</td>
          <td>0.005112</td>
          <td>0.009414</td>
          <td>0.019250</td>
          <td>0.029668</td>
          <td>0.036974</td>
          <td>0.057420</td>
          <td>0.073561</td>
          <td>0.113452</td>
          <td>0.058290</td>
          <td>0.124900</td>
        </tr>
        <tr>
          <th>ort</th>
          <td>0.001672</td>
          <td>0.001371</td>
          <td>0.002411</td>
          <td>0.004568</td>
          <td>0.007558</td>
          <td>0.008682</td>
          <td>0.012172</td>
          <td>0.015954</td>
          <td>0.022385</td>
          <td>0.014245</td>
          <td>0.036048</td>
        </tr>
        <tr>
          <th>torch</th>
          <td>0.036366</td>
          <td>0.023836</td>
          <td>0.067237</td>
          <td>0.073253</td>
          <td>0.214941</td>
          <td>0.216737</td>
          <td>0.222536</td>
          <td>0.223638</td>
          <td>0.210876</td>
          <td>0.082061</td>
          <td>0.107904</td>
        </tr>
      </tbody>
    </table>
    </div>
    </div>
    <br />
    <br />

.. GENERATED FROM PYTHON SOURCE LINES 243-248

Reduction on a particular case RKRK
+++++++++++++++++++++++++++++++++++

(8, 24, 48, N), axis=(0, 2)
^^^^^^^^^^^^^^^^^^^^^^^^^^^

.. GENERATED FROM PYTHON SOURCE LINES 248-254

.. code-block:: default


    # RKRK case: axes 0 and 2 are reduced, axes 1 and 3 are kept.
    axes = (0, 2)
    df, piv, ax = benchmark_op(axes, shape_fct=lambda dim: (8, 24, 48, dim))
    dfs.append(df)
    # Keyword arguments: positional arguments are deprecated in DataFrame.pivot.
    df.pivot(index="fct", columns="N", values="average")


.. image-sg:: /gyexamples/images/sphx_glr_plot_op_reducesum_006.png
   :alt: ReduceSum benchmark '(8, 24, 48, N)' - (0, 2) lower better, ReduceSum Speedup, baseline=numpy '(8, 24, 48, N)' - (0, 2) higher better
   :srcset: /gyexamples/images/sphx_glr_plot_op_reducesum_006.png
   :class: sphx-glr-single-img


.. rst-class:: sphx-glr-script-out

 .. code-block:: none


      0%|          | 0/11 [00:00<?, ?it/s]
      9%|9         | 1/11 [00:01<00:10,  1.05s/it]
     18%|#8        | 2/11 [00:02<00:13,  1.48s/it]
     27%|##7       | 3/11 [00:05<00:14,  1.80s/it]
     36%|###6      | 4/11 [00:07<00:15,  2.17s/it]
     45%|####5     | 5/11 [00:10<00:14,  2.46s/it]
     55%|#####4    | 6/11 [00:14<00:14,  2.86s/it]
     64%|######3   | 7/11 [00:22<00:17,  4.46s/it]
     73%|#######2  | 8/11 [00:29<00:16,  5.51s/it]
     82%|########1 | 9/11 [00:40<00:14,  7.17s/it]
     91%|######### | 10/11 [00:46<00:06,  6.66s/it]
    100%|##########| 11/11 [00:59<00:00,  8.66s/it]
    100%|##########| 11/11 [00:59<00:00,  5.40s/it]
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:151: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      piv = df.pivot('N', 'fct', 'average')
    somewhere/workspace/mlprodict/mlprodict_UT_39_std/_doc/examples/plot_op_reducesum.py:252: FutureWarning: In a future version of pandas all arguments of DataFrame.pivot will be keyword-only.
      df.pivot("fct", "N", "average")


.. raw:: html

    <div class="output_subarea output_html rendered_html output_result">
    <div>
    <style scoped>
        .dataframe tbody tr th:only-of-type {
            vertical-align: middle;
        }

        .dataframe tbody tr th {
            vertical-align: top;
        }

        .dataframe thead th {
            text-align: right;
        }
    </style>
    <table border="1" class="dataframe">
      <thead>
        <tr style="text-align: right;">
          <th>N</th>
          <th>8</th>
          <th>16</th>
          <th>32</th>
          <th>64</th>
          <th>100</th>
          <th>128</th>
          <th>200</th>
          <th>256</th>
          <th>400</th>
          <th>512</th>
          <th>1024</th>
        </tr>
        <tr>
          <th>fct</th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
          <th></th>
        </tr>
      </thead>
      <tbody>
        <tr>
          <th>numpy</th>
          <td>0.002737</td>
          <td>0.005142</td>
          <td>0.009669</td>
          <td>0.021690</td>
          <td>0.034115</td>
          <td>0.043409</td>
          <td>0.068213</td>
          <td>0.083322</td>
          <td>0.133460</td>
          <td>0.067885</td>
          <td>0.134256</td>
        </tr>
        <tr>
          <th>ort</th>
          <td>0.001075</td>
          <td>0.001807</td>
          <td>0.003684</td>
          <td>0.006777</td>
          <td>0.008837</td>
          <td>0.013446</td>
          <td>0.018525</td>
          <td>0.025275</td>
          <td>0.036985</td>
          <td>0.043171</td>
          <td>0.246788</td>
        </tr>
        <tr>
          <th>torch</th>
          <td>0.037370</td>
          <td>0.062487</td>
          <td>0.070774</td>
          <td>0.074768</td>
          <td>0.067579</td>
          <td>0.076031</td>
          <td>0.205576</td>
          <td>0.178567</td>
          <td>0.225860</td>
          <td>0.091197</td>
          <td>0.110022</td>
        </tr>
      </tbody>
    </table>
    </div>
    </div>
    <br />
    <br />

.. GENERATED FROM PYTHON SOURCE LINES 255-261

Conclusion
++++++++++

Some of the configurations should be investigated,
see :ref:`l-reducesum-problem1`. The reduction on tensorflow
in one dimension seems to be lazy.

.. GENERATED FROM PYTHON SOURCE LINES 261-269

.. code-block:: default


    # Concatenates the dataframes gathered in ``dfs`` by the benchmarks above.
    merged = pandas.concat(dfs)
    name = "reducesum"
    # Saves the merged measures as CSV and Excel files, without the index.
    merged.to_csv(f"plot_{name}.csv", index=False)
    merged.to_excel(f"plot_{name}.xlsx", index=False)
    # NOTE(review): savefig stores matplotlib's current figure,
    # confirm it is the intended one.
    plt.savefig(f"plot_{name}.png")

    plt.show()


.. image-sg:: /gyexamples/images/sphx_glr_plot_op_reducesum_007.png
   :alt: plot op reducesum
   :srcset: /gyexamples/images/sphx_glr_plot_op_reducesum_007.png
   :class: sphx-glr-single-img


.. rst-class:: sphx-glr-timing

   **Total running time of the script:** ( 4 minutes  43.395 seconds)


.. _sphx_glr_download_gyexamples_plot_op_reducesum.py:

.. only:: html

  .. container:: sphx-glr-footer sphx-glr-footer-example


    .. container:: sphx-glr-download sphx-glr-download-python

      :download:`Download Python source code: plot_op_reducesum.py <plot_op_reducesum.py>`

    .. container:: sphx-glr-download sphx-glr-download-jupyter

      :download:`Download Jupyter notebook: plot_op_reducesum.ipynb <plot_op_reducesum.ipynb>`


.. only:: html

 .. rst-class:: sphx-glr-signature

    `Gallery generated by Sphinx-Gallery <https://sphinx-gallery.github.io>`_