[tutorials][hist] Refactor histogram tutorials to return void instead of TCanvas*

siliataider · siliataider · commit 89d34713b9f0 · 2025-11-05T09:49:55.000+01:00
diff --git a/bindings/pyroot/cppyy/CPyCppyy/src/MyWrapper.h b/bindings/pyroot/cppyy/CPyCppyy/src/MyWrapper.h
@@ -0,0 +1,9 @@
+#pragma once
+
+#include <string>
+
+namespace CPyCppyy {
+namespace MyWrapper {
+    std::string CreateCallbackWrapper(std::string); // declaration only; no definition in this header
+} // namespace MyWrapper
+} // namespace CPyCppyy
diff --git a/bindings/pyroot/pythonizations/python/ROOT/repro_cppyy_mock_rdf.py b/bindings/pyroot/pythonizations/python/ROOT/repro_cppyy_mock_rdf.py
@@ -0,0 +1,25 @@
+import cppyy
+
+cppyy.cppdef(
+    r"""
+#include <utility>
+#include <iostream>
+#include <string>
+
+void foo() { std::cout << "foo!\n";}
+
+void bar(int a, float b) { std::cout << "bar(" << a << "," << b << ")\n"; }
+
+template <typename T, typename U>
+void baz(T a, U b, std::string c) { std::cout << "baz(" << a << "," << b << ",\"" << c << "\")\n"; }
+
+template<typename F, typename... Args>
+void dataframe_define_mock(F callable, Args&&... args) {
+    callable(std::forward<Args>(args)...);
+}
+"""
+)
+
+cppyy.gbl.dataframe_define_mock(cppyy.gbl.foo)
+cppyy.gbl.dataframe_define_mock(cppyy.gbl.bar, 42, 11.11)
+cppyy.gbl.dataframe_define_mock(cppyy.gbl.baz[int, float], 33, 101.101, "hello")
diff --git a/bindings/pyroot/pythonizations/test/repro_op_plus.py b/bindings/pyroot/pythonizations/test/repro_op_plus.py
@@ -0,0 +1,11 @@
+import ROOT
+
+a = ROOT.TH1D("", "", 5, 0., 1.)
+b = ROOT.TH1D("", "", 5, 0., 1.)
+ab = a + b
+print(ab)
+
+c = ROOT.TH2D("", "", 5, 0., 1., 5, 0., 1.)
+d = ROOT.TH2D("", "", 5, 0., 1., 5, 0., 1.)
+cd = c + d
+print(cd)
diff --git a/documentation/users-guide/repro_rdf_poster.py b/documentation/users-guide/repro_rdf_poster.py
@@ -0,0 +1,17 @@
+import ROOT
+import numpy as np
+
+
+def make_write_hist(entry: int) -> ROOT.TH1D:
+    hname = f"h_{entry}"  # used as histogram name, title, and as the key written to the file
+    h = ROOT.TH1D(hname, hname, entry, 0, entry)  # `entry` bins over the axis range 0..entry
+    h[...] = np.random.uniform(0, entry, entry)  # presumably sets all bin contents via ROOT's slicing pythonization — confirm
+    with ROOT.TFile.Open("bench_out/histos.root", "update") as f:  # NOTE(review): assumes bench_out/ already exists — confirm
+        f.WriteObject(h, hname)
+    return h
+
+rdf = ROOT.RDataFrame(10) \
+        .Define("x", "(int)rdfentry_ + 1") \
+        .Define("hist", make_write_hist, ["x"])
+
+rdf.Display().Print()
diff --git a/tutorials/CMakeLists.txt b/tutorials/CMakeLists.txt
@@ -550,13 +550,6 @@ set(returncode_1 math/fit/fit2a.C
                  visualisation/graphics/tmathtext.C visualisation/graphics/tmathtext2.C
                  visualisation/graphs/gr106_exclusiongraph.C
                  visualisation/graphs/gr016_struct.C
-                 hist/hist102_TH2_contour_list.C
-                 hist/hist006_TH1_bar_charts.C
-                 hist/hist037_TH2Poly_boxes.C
-                 hist/hist060_TH1_stats.C
-                 hist/hist014_TH1_cumulative.C
-                 hist/hist004_TH1_labels.C
-                 hist/hist036_TH2_labels.C
                  analysis/tree/h1analysis.C
                  math/chi2test.C
                  math/r/SimpleFitting.C)
diff --git a/tutorials/analysis/dataframe/bench_numba_cppyy.py b/tutorials/analysis/dataframe/bench_numba_cppyy.py
@@ -0,0 +1,112 @@
+import time
+
+import matplotlib.pyplot as plt
+import numpy as np
+import ROOT
+
+# ROOT.EnableImplicitMT()
+
+@ROOT.Numba.Declare(['double', 'int'], 'double')
+def pypow_numba(x, y):
+    return x**y
+
+def pypow_cppyy(x: float, y: int) -> float:
+    return x**y
+
+def benchmark(N):
+    """Time Mean() over N entries for a cppyy-callable Define and a Numba Define; return a dict of means and timings."""
+    rdf = ROOT.RDataFrame(N).Define("x", "(double)rdfentry_").Define("y", "2")
+    # cppyy version: the timed region covers both the Define() call and the Mean() evaluation
+    start_cppyy = time.perf_counter()
+    rdf_cppyy = rdf.Define("pow_cppyy", pypow_cppyy, ["x", "y"])
+    mean_cppyy = rdf_cppyy.Mean("pow_cppyy").GetValue()
+    end_cppyy = time.perf_counter()
+
+    # Numba version: same timed region, using the function registered through ROOT.Numba.Declare
+    start_numba = time.perf_counter()
+    rdf_numba = rdf.Define("pow_numba", "Numba::pypow_numba(x, y)")
+    mean_numba = rdf_numba.Mean("pow_numba").GetValue()
+    end_numba = time.perf_counter()
+
+    return {
+        "N": N,
+        "mean_numba": mean_numba,
+        "mean_cppyy": mean_cppyy,
+        "time_numba": end_numba - start_numba,
+        "time_cppyy": end_cppyy - start_cppyy,
+    }
+
+# Entry counts to benchmark; benchmark() is run once per value and the results are tabulated and plotted.
+N_values = [10_000, 100_000, 1_000_000, 5_000_000, 10_000_000, 50_000_000, 100_000_000]
+results = [benchmark(N) for N in N_values]
+print("Résultats :)")
+print(f"{'N':>10} | {'Numba time (s)':>15} | {'cppyy time (s)':>15} | {'cppyy speedup':>15} | {'Δ Mean':>10}")
+print("-" * 75)
+# NOTE(review): the first result is skipped in the table but still drawn in the plot below — confirm intent.
+for r in results[1:]:
+    mean_diff = abs(r["mean_numba"] - r["mean_cppyy"])
+    cppyy_speedup = r["time_numba"] / r["time_cppyy"] if r["time_cppyy"] > 0 else float('inf')
+    print(f"{r['N']:>10} | {r['time_numba']:>15.3f} | {r['time_cppyy']:>15.3f} | {cppyy_speedup:>15.2f} | {mean_diff:>10.5f}")
+
+plt.figure(figsize=(7,5))
+plt.plot(N_values, [r["time_numba"] for r in results], "-o", label="Numba")
+plt.plot(N_values, [r["time_cppyy"] for r in results], "-o", label="cppyy")
+plt.xlabel("Number of entries")
+plt.ylabel("Execution time (s)")
+plt.title("RDataFrame Define(): Numba vs cppyy")
+plt.legend()
+plt.grid(True)
+# Save relative to the working directory; a user-specific absolute path fails on every other machine.
+plt.savefig("benchmark_numba_vs_cppyy.png")
+plt.show()
+
+# N = 5_000_000
+# rdf = ROOT.RDataFrame(N).Define("x", "(double)rdfentry_").Define("y", "2.0")
+
+# # --- Numba version --------------------------------------------------------
+# @ROOT.Numba.Declare(['double', 'int'], 'double')
+# def pypow_numba(x, y):
+#     return x**y
+
+# start_numba = time.perf_counter()
+
+# rdf_numba = rdf.Define("pow_numba", "Numba::pypow_numba(x, y)")
+# mean_numba = rdf_numba.Mean("pow_numba").GetValue()
+
+# end_numba = time.perf_counter()
+
+# print(f"[Numba] Mean: {mean_numba:.5f}, time: {end_numba - start_numba:.3f} s")
+
+# # --- cppyy version --------------------------------------------------------
+# def pypow_cppyy(x: float, y: int) -> float:
+#     return x**y
+
+# start_cppyy = time.perf_counter()
+
+# rdf_cppyy = rdf.Define("pow_cppyy", pypow_cppyy, ["x", "y"])
+# mean_cppyy = rdf_cppyy.Mean("pow_cppyy").GetValue()
+
+# end_cppyy = time.perf_counter()
+
+# print(f"[cppyy] Mean: {mean_cppyy:.5f}, time: {end_cppyy - start_cppyy:.3f} s")
+
+
+
+import ROOT
+
+ROOT.gInterpreter.Declare("""
+#include <ROOT/RVec.hxx>
+
+// Functor returning xvec * xvec; RVec is fully qualified so no using-directive leaks into the global scope.
+template <typename T>
+struct SquareVecT {
+    ROOT::RVec<T> operator()(const ROOT::RVec<T>& xvec) const {
+        return xvec * xvec;
+    }
+};
+""")
+
+square_vec_int = ROOT.SquareVecT[int]()
+rdf = ROOT.RDataFrame(3) \
+    .Define("xvec", "ROOT::VecOps::RVec{(int)rdfentry_, (int)rdfentry_ + 1, (int)rdfentry_ + 2}") \
+    .Define("squared_xvec", square_vec_int, ["xvec"])
diff --git a/tutorials/hist/hist004_TH1_labels.C b/tutorials/hist/hist004_TH1_labels.C
@@ -11,7 +11,7 @@
 /// \date November 2024
 /// \author Rene Brun
 
-TCanvas *hist004_TH1_labels()
+void hist004_TH1_labels()
 {
    // Create the histogram
    const std::array people{"Jean",    "Pierre", "Marie",    "Odile",   "Sebastien", "Fons",  "Rene",
@@ -56,6 +56,4 @@ TCanvas *hist004_TH1_labels()
    pt->AddText(" \">\"   to sort by decreasing values");
    pt->AddText(" \"<\"   to sort by increasing values");
    pt->Draw();
-
-   return c1;
 }
diff --git a/tutorials/hist/hist006_TH1_bar_charts.C b/tutorials/hist/hist006_TH1_bar_charts.C
@@ -9,7 +9,7 @@
 /// \date November 2024
 /// \author Rene Brun
 
-TCanvas *hist006_TH1_bar_charts()
+void hist006_TH1_bar_charts()
 {
    // Try to open first the file cernstaff.root in tutorials/io/tree directory
    TString filedir = gROOT->GetTutorialDir();
@@ -88,6 +88,4 @@ TCanvas *hist006_TH1_bar_charts()
    legend->Draw();
 
    c1->cd();
-
-   return c1;
 }
diff --git a/tutorials/hist/hist014_TH1_cumulative.C b/tutorials/hist/hist014_TH1_cumulative.C
@@ -17,7 +17,7 @@
 #include "TCanvas.h"
 #include "TRandom.h"
 
-TCanvas *hist014_TH1_cumulative()
+void hist014_TH1_cumulative()
 {
    TH1 *h = new TH1D("h", "h", 100, -5., 5.);
    gRandom->SetSeed();
@@ -37,6 +37,4 @@ TCanvas *hist014_TH1_cumulative()
    c->cd(2);
    hc->Draw();
    c->Update();
-
-   return c;
 }
diff --git a/tutorials/hist/hist036_TH2_labels.C b/tutorials/hist/hist036_TH2_labels.C
@@ -9,7 +9,7 @@
 /// \date July 2016
 /// \author Rene Brun
 
-TCanvas *hist036_TH2_labels()
+void hist036_TH2_labels()
 {
    const Int_t nx = 12;
    const Int_t ny = 20;
@@ -44,5 +44,4 @@ TCanvas *hist036_TH2_labels()
    pt->AddText(" \">\"   to sort by decreasing values");
    pt->AddText(" \"<\"   to sort by increasing values");
    pt->Draw();
-   return c1;
 }
diff --git a/tutorials/hist/hist037_TH2Poly_boxes.C b/tutorials/hist/hist037_TH2Poly_boxes.C
@@ -10,7 +10,7 @@
 /// \date August 2016
 /// \author Olivier Couet
 
-TCanvas *hist037_TH2Poly_boxes()
+void hist037_TH2Poly_boxes()
 {
    TCanvas *ch2p2 = new TCanvas("ch2p2", "ch2p2", 600, 400);
    gStyle->SetPalette(57);
@@ -44,5 +44,4 @@ TCanvas *hist037_TH2Poly_boxes()
    }
 
    h2p->Draw("COLZ");
-   return ch2p2;
 }
diff --git a/tutorials/hist/hist060_TH1_stats.C b/tutorials/hist/hist060_TH1_stats.C
@@ -13,7 +13,7 @@
 /// \date August 2016
 /// \author  Olivier Couet
 
-TCanvas *hist060_TH1_stats()
+void hist060_TH1_stats()
 {
    // Create and plot a test histogram with stats
    TCanvas *se = new TCanvas;
@@ -44,5 +44,4 @@ TCanvas *hist060_TH1_stats()
    h->SetStats(0);
 
    se->Modified();
-   return se;
 }
diff --git a/tutorials/hist/hist102_TH2_contour_list.C b/tutorials/hist/hist102_TH2_contour_list.C
@@ -20,7 +20,7 @@
 
 Double_t SawTooth(Double_t x, Double_t WaveLen);
 
-TCanvas *hist102_TH2_contour_list()
+void hist102_TH2_contour_list()
 {
 
    const Double_t PI = TMath::Pi();
@@ -157,7 +157,6 @@ TCanvas *hist102_TH2_contour_list()
    printf("\n\n\tExtracted %d Contours and %d Graphs \n", TotalConts, nGraphs);
    gStyle->SetTitleW(0.);
    gStyle->SetTitleH(0.);
-   return c1;
 }
 
 Double_t SawTooth(Double_t x, Double_t WaveLen)
diff --git a/tutorials/hist/repro_pyhep.py b/tutorials/hist/repro_pyhep.py
@@ -0,0 +1,23 @@
+import ROOT
+import numpy as np
+
+# def make_array(x, y):
+#     val = np.sum(y)
+#     return np.full(x, val)
+
+# rdf = ROOT.RDataFrame(3) \
+#         .Define("x", "(int)rdfentry_ + 1") \
+#         .Define("y", "ROOT::VecOps::RVec{(int)rdfentry_, (int)rdfentry_ + 1, (int)rdfentry_ + 2}") \
+#         .Define("vec_x", make_array, ["x", "y"])
+
+
+def combine_vectors(a, b):
+   return np.sqrt(a**2 + b**2)
+
+rdf = (ROOT.RDataFrame(3)
+      .Define("a", "ROOT::RVec<float>{1, 2, 3}")
+      .Define("b", "std::vector<float>{0.1, 0.2, 0.3}")
+      .Define("c", combine_vectors))
+
+
+rdf.Display().Print()

Original file line number	Diff line number	Diff line change
`@@ -11,7 +11,7 @@`
`11`	`11`	`/// \date November 2024`
`12`	`12`	`/// \author Rene Brun`
`13`	`13`
`14`		`-TCanvas *hist004_TH1_labels()`
	`14`	`+void hist004_TH1_labels()`
`15`	`15`	`{`
`16`	`16`	`// Create the histogram`
`17`	`17`	`const std::array people{"Jean", "Pierre", "Marie", "Odile", "Sebastien", "Fons", "Rene",`
`@@ -56,6 +56,4 @@ TCanvas *hist004_TH1_labels()`
`56`	`56`	`pt->AddText(" \">\" to sort by decreasing values");`
`57`	`57`	`pt->AddText(" \"<\" to sort by increasing values");`
`58`	`58`	`pt->Draw();`
`59`		`-`
`60`		`- return c1;`
`61`	`59`	`}`
Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,7 @@`
`9`	`9`	`/// \date November 2024`
`10`	`10`	`/// \author Rene Brun`
`11`	`11`
`12`		`-TCanvas *hist006_TH1_bar_charts()`
	`12`	`+void hist006_TH1_bar_charts()`
`13`	`13`	`{`
`14`	`14`	`// Try to open first the file cernstaff.root in tutorials/io/tree directory`
`15`	`15`	`TString filedir = gROOT->GetTutorialDir();`
`@@ -88,6 +88,4 @@ TCanvas *hist006_TH1_bar_charts()`
`88`	`88`	`legend->Draw();`
`89`	`89`
`90`	`90`	`c1->cd();`
`91`		`-`
`92`		`- return c1;`
`93`	`91`	`}`
Original file line number	Diff line number	Diff line change
`@@ -17,7 +17,7 @@`
`17`	`17`	`#include "TCanvas.h"`
`18`	`18`	`#include "TRandom.h"`
`19`	`19`
`20`		`-TCanvas *hist014_TH1_cumulative()`
	`20`	`+void hist014_TH1_cumulative()`
`21`	`21`	`{`
`22`	`22`	`TH1 *h = new TH1D("h", "h", 100, -5., 5.);`
`23`	`23`	`gRandom->SetSeed();`
`@@ -37,6 +37,4 @@ TCanvas *hist014_TH1_cumulative()`
`37`	`37`	`c->cd(2);`
`38`	`38`	`hc->Draw();`
`39`	`39`	`c->Update();`
`40`		`-`
`41`		`- return c;`
`42`	`40`	`}`
Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,7 @@`
`9`	`9`	`/// \date July 2016`
`10`	`10`	`/// \author Rene Brun`
`11`	`11`
`12`		`-TCanvas *hist036_TH2_labels()`
	`12`	`+void hist036_TH2_labels()`
`13`	`13`	`{`
`14`	`14`	`const Int_t nx = 12;`
`15`	`15`	`const Int_t ny = 20;`
`@@ -44,5 +44,4 @@ TCanvas *hist036_TH2_labels()`
`44`	`44`	`pt->AddText(" \">\" to sort by decreasing values");`
`45`	`45`	`pt->AddText(" \"<\" to sort by increasing values");`
`46`	`46`	`pt->Draw();`
`47`		`- return c1;`
`48`	`47`	`}`