Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

make dsum, fill, and relu parametric in sizes #224

Merged
merged 6 commits into main from sasha/parametric-parallel
May 21, 2024

Conversation

superlopuh
Copy link
Collaborator

No description provided.

Copy link

kernels,baseline,linalg,linalg_xdsl,scf_xdsl,snitch_stream,snrt,min_llvm_mlir
conv2d_d1_s1_3x3 1x1x8x8xf64,1466,1732,,,1526,1501,1466
ddot 128xf64,961,957,,2243,205,569,957
dense 8x8xf64,3199,3518,,,2729,2737,3199
dsum 12x12xf64,,,229,,,,
dsum 12x16xf64,,,286,,,,
dsum 12x4xf64,,,122,,,,
dsum 12x8xf64,,,169,,,,
dsum 16x12xf64,,,286,,,,
dsum 16x16xf64,,,356,,,,
dsum 16x4xf64,,,138,,,,
dsum 16x8xf64,,,199,,,,
dsum 4x12xf64,,,143,,,,
dsum 4x16xf64,,,163,,,,
dsum 4x4xf64,,,94,,,,
dsum 4x8xf64,,,123,,,,
dsum 8x12xf64,,,169,,,,
dsum 8x16xf64,,,199,,,,
dsum 8x4xf64,,,106,,,,
dsum 8x8xf64,,,138,,,,
fill 12x12xf64,,,185,,,,
fill 12x16xf64,,,233,,,,
fill 12x4xf64,,,100,,,,
fill 12x8xf64,,,137,,,,
fill 16x12xf64,,,233,,,,
fill 16x16xf64,,,297,,,,
fill 16x4xf64,,,120,,,,
fill 16x8xf64,,,169,,,,
fill 4x12xf64,,,89,,,,
fill 4x16xf64,,,105,,,,
fill 4x4xf64,,,66,,,,
fill 4x8xf64,,,73,,,,
fill 8x12xf64,,,137,,,,
fill 8x16xf64,,,169,,,,
fill 8x4xf64,,,80,,,,
fill 8x8xf64,,,105,,,,
matmul 4x4x4xf64,,,,,207,,
matmul 4x4x8xf64,,,,,251,,
matmul 4x8x4xf64,,,,,255,,
matmul 4x8x8xf64,,,,,382,,
matmul 8x4x4xf64,,,,,265,,
matmul 8x4x8xf64,,,,,381,,
matmul 8x8x4xf64,,,,,386,,
matmul 8x8x8xf64,,,,,648,,
pooling_nchw_max_d1_s2_3x3 1x1x16x16xf64,1391,1435,,,1120,1121,1391
pooling_nchw_sum_d1_s2_3x3 1x1x16x16xf64,1710,2175,,,2003,1992,1710
relu 12x12xf64,,,213,,,,
relu 12x16xf64,,,262,,,,
relu 12x4xf64,,,127,,,,
relu 12x8xf64,,,159,,,,
relu 16x12xf64,,,262,,,,
relu 16x16xf64,,,352,,,,
relu 16x4xf64,,,147,,,,
relu 16x8xf64,,,190,,,,
relu 4x12xf64,,,106,,,,
relu 4x16xf64,,,122,,,,
relu 4x4xf64,,,106,,,,
relu 4x8xf64,,,89,,,,
relu 8x12xf64,,,159,,,,
relu 8x16xf64,,,190,,,,
relu 8x4xf64,,,106,,,,
relu 8x8xf64,,,122,,,,

Copy link

kernels,baseline,linalg,linalg_xdsl,scf_xdsl,snitch_stream,snrt
conv2d_d1_s1_3x3 1x1x8x8xf64,0.22,0.19,,,0.26,0.27
ddot 128xf64,0.13,0.14,,0.06,0.66,0.23
dense 8x8xf64,0.20,0.18,,,0.26,0.26
dsum 12x12xf64,,,0.63,,,
dsum 12x16xf64,,,0.67,,,
dsum 12x4xf64,,,0.40,,,
dsum 12x8xf64,,,0.57,,,
dsum 16x12xf64,,,0.67,,,
dsum 16x16xf64,,,0.72,,,
dsum 16x4xf64,,,0.47,,,
dsum 16x8xf64,,,0.65,,,
dsum 4x12xf64,,,0.34,,,
dsum 4x16xf64,,,0.40,,,
dsum 4x4xf64,,,0.18,,,
dsum 4x8xf64,,,0.27,,,
dsum 8x12xf64,,,0.57,,,
dsum 8x16xf64,,,0.65,,,
dsum 8x4xf64,,,0.31,,,
dsum 8x8xf64,,,0.47,,,
fill 12x12xf64,,,0.79,,,
fill 12x16xf64,,,0.83,,,
fill 12x4xf64,,,0.50,,,
fill 12x8xf64,,,0.72,,,
fill 16x12xf64,,,0.83,,,
fill 16x16xf64,,,0.87,,,
fill 16x4xf64,,,0.55,,,
fill 16x8xf64,,,0.77,,,
fill 4x12xf64,,,0.56,,,
fill 4x16xf64,,,0.63,,,
fill 4x4xf64,,,0.27,,,
fill 4x8xf64,,,0.47,,,
fill 8x12xf64,,,0.72,,,
fill 8x16xf64,,,0.77,,,
fill 8x4xf64,,,0.42,,,
fill 8x8xf64,,,0.63,,,
matmul 4x4x4xf64,,,,,0.31,
matmul 4x4x8xf64,,,,,0.51,
matmul 4x8x4xf64,,,,,0.51,
matmul 4x8x8xf64,,,,,0.67,
matmul 8x4x4xf64,,,,,0.49,
matmul 8x4x8xf64,,,,,0.67,
matmul 8x8x4xf64,,,,,0.67,
matmul 8x8x8xf64,,,,,0.79,
pooling_nchw_max_d1_s2_3x3 1x1x16x16xf64,0.32,0.31,,,0.48,0.48
pooling_nchw_sum_d1_s2_3x3 1x1x16x16xf64,0.23,0.20,,,0.27,0.27
relu 12x12xf64,,,0.69,,,
relu 12x16xf64,,,0.74,,,
relu 12x4xf64,,,0.39,,,
relu 12x8xf64,,,0.62,,,
relu 16x12xf64,,,0.74,,,
relu 16x16xf64,,,0.73,,,
relu 16x4xf64,,,0.45,,,
relu 16x8xf64,,,0.68,,,
relu 4x12xf64,,,0.47,,,
relu 4x16xf64,,,0.54,,,
relu 4x4xf64,,,0.17,,,
relu 4x8xf64,,,0.38,,,
relu 8x12xf64,,,0.62,,,
relu 8x16xf64,,,0.68,,,
relu 8x4xf64,,,0.32,,,
relu 8x8xf64,,,0.54,,,

Base automatically changed from sasha/linalg-xdsl-parallel to main May 21, 2024 12:17
@superlopuh superlopuh merged commit f428638 into main May 21, 2024
1 check passed
@superlopuh superlopuh deleted the sasha/parametric-parallel branch May 21, 2024 12:18
Copy link

kernels,baseline,linalg,linalg_xdsl,scf_xdsl,snitch_stream,snrt,min_llvm_mlir
conv2d_d1_s1_3x3 1x1x8x8xf64,1466,1732,,,1526,1501,1466
ddot 128xf64,961,957,,2243,205,569,957
dense 8x8xf64,3199,3518,,,2729,2737,3199
dsum 12x12xf64,,,229,,,,
dsum 12x16xf64,,,286,,,,
dsum 12x4xf64,,,122,,,,
dsum 12x8xf64,,,169,,,,
dsum 16x12xf64,,,286,,,,
dsum 16x16xf64,,,356,,,,
dsum 16x4xf64,,,138,,,,
dsum 16x8xf64,,,199,,,,
dsum 4x12xf64,,,143,,,,
dsum 4x16xf64,,,163,,,,
dsum 4x4xf64,,,94,,,,
dsum 4x8xf64,,,123,,,,
dsum 8x12xf64,,,169,,,,
dsum 8x16xf64,,,199,,,,
dsum 8x4xf64,,,106,,,,
dsum 8x8xf64,,,138,,,,
fill 12x12xf64,,,185,,,,
fill 12x16xf64,,,233,,,,
fill 12x4xf64,,,100,,,,
fill 12x8xf64,,,137,,,,
fill 16x12xf64,,,233,,,,
fill 16x16xf64,,,297,,,,
fill 16x4xf64,,,120,,,,
fill 16x8xf64,,,169,,,,
fill 4x12xf64,,,89,,,,
fill 4x16xf64,,,105,,,,
fill 4x4xf64,,,66,,,,
fill 4x8xf64,,,73,,,,
fill 8x12xf64,,,137,,,,
fill 8x16xf64,,,169,,,,
fill 8x4xf64,,,80,,,,
fill 8x8xf64,,,105,,,,
matmul 4x4x4xf64,,,,,207,,
matmul 4x4x8xf64,,,,,251,,
matmul 4x8x4xf64,,,,,255,,
matmul 4x8x8xf64,,,,,382,,
matmul 8x4x4xf64,,,,,265,,
matmul 8x4x8xf64,,,,,381,,
matmul 8x8x4xf64,,,,,386,,
matmul 8x8x8xf64,,,,,648,,
pooling_nchw_max_d1_s2_3x3 1x1x16x16xf64,1391,1435,,,1120,1121,1391
pooling_nchw_sum_d1_s2_3x3 1x1x16x16xf64,1710,2175,,,2003,1992,1710
relu 12x12xf64,,,213,,,,
relu 12x16xf64,,,262,,,,
relu 12x4xf64,,,127,,,,
relu 12x8xf64,,,159,,,,
relu 16x12xf64,,,262,,,,
relu 16x16xf64,,,352,,,,
relu 16x4xf64,,,147,,,,
relu 16x8xf64,,,190,,,,
relu 4x12xf64,,,106,,,,
relu 4x16xf64,,,122,,,,
relu 4x4xf64,,,106,,,,
relu 4x8xf64,,,89,,,,
relu 8x12xf64,,,159,,,,
relu 8x16xf64,,,190,,,,
relu 8x4xf64,,,106,,,,
relu 8x8xf64,,,122,,,,

Copy link

kernels,baseline,linalg,linalg_xdsl,scf_xdsl,snitch_stream,snrt
conv2d_d1_s1_3x3 1x1x8x8xf64,0.22,0.19,,,0.26,0.27
ddot 128xf64,0.13,0.14,,0.06,0.66,0.23
dense 8x8xf64,0.20,0.18,,,0.26,0.26
dsum 12x12xf64,,,0.63,,,
dsum 12x16xf64,,,0.67,,,
dsum 12x4xf64,,,0.40,,,
dsum 12x8xf64,,,0.57,,,
dsum 16x12xf64,,,0.67,,,
dsum 16x16xf64,,,0.72,,,
dsum 16x4xf64,,,0.47,,,
dsum 16x8xf64,,,0.65,,,
dsum 4x12xf64,,,0.34,,,
dsum 4x16xf64,,,0.40,,,
dsum 4x4xf64,,,0.18,,,
dsum 4x8xf64,,,0.27,,,
dsum 8x12xf64,,,0.57,,,
dsum 8x16xf64,,,0.65,,,
dsum 8x4xf64,,,0.31,,,
dsum 8x8xf64,,,0.47,,,
fill 12x12xf64,,,0.79,,,
fill 12x16xf64,,,0.83,,,
fill 12x4xf64,,,0.50,,,
fill 12x8xf64,,,0.72,,,
fill 16x12xf64,,,0.83,,,
fill 16x16xf64,,,0.87,,,
fill 16x4xf64,,,0.55,,,
fill 16x8xf64,,,0.77,,,
fill 4x12xf64,,,0.56,,,
fill 4x16xf64,,,0.63,,,
fill 4x4xf64,,,0.27,,,
fill 4x8xf64,,,0.47,,,
fill 8x12xf64,,,0.72,,,
fill 8x16xf64,,,0.77,,,
fill 8x4xf64,,,0.42,,,
fill 8x8xf64,,,0.63,,,
matmul 4x4x4xf64,,,,,0.31,
matmul 4x4x8xf64,,,,,0.51,
matmul 4x8x4xf64,,,,,0.51,
matmul 4x8x8xf64,,,,,0.67,
matmul 8x4x4xf64,,,,,0.49,
matmul 8x4x8xf64,,,,,0.67,
matmul 8x8x4xf64,,,,,0.67,
matmul 8x8x8xf64,,,,,0.79,
pooling_nchw_max_d1_s2_3x3 1x1x16x16xf64,0.32,0.31,,,0.48,0.48
pooling_nchw_sum_d1_s2_3x3 1x1x16x16xf64,0.23,0.20,,,0.27,0.27
relu 12x12xf64,,,0.69,,,
relu 12x16xf64,,,0.74,,,
relu 12x4xf64,,,0.39,,,
relu 12x8xf64,,,0.62,,,
relu 16x12xf64,,,0.74,,,
relu 16x16xf64,,,0.73,,,
relu 16x4xf64,,,0.45,,,
relu 16x8xf64,,,0.68,,,
relu 4x12xf64,,,0.47,,,
relu 4x16xf64,,,0.54,,,
relu 4x4xf64,,,0.17,,,
relu 4x8xf64,,,0.38,,,
relu 8x12xf64,,,0.62,,,
relu 8x16xf64,,,0.68,,,
relu 8x4xf64,,,0.32,,,
relu 8x8xf64,,,0.54,,,

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment
Projects
None yet
Development

Successfully merging this pull request may close these issues.

2 participants