diff --git a/tuning/autotune.py b/tuning/autotune.py index ff8891f..a7ef63a 100644 --- a/tuning/autotune.py +++ b/tuning/autotune.py @@ -543,7 +543,7 @@ def compile_unet_candidates( f"Hash value '{hash_val}' collided at candidate {indices}." ) unique_unet_candidates.append( - candidate_trackers[indices[0]].unet_candidate_path + candidate_trackers[indices[0]].unet_candidate_path # If collision occurs, use the first candidate index in the list ) return unique_unet_candidates if collision_detected else unet_candidates @@ -626,7 +626,7 @@ def main(): best_log = benchmark_top_candidates( args, base_dir, candidates_dir, compiled_files, candidate_trackers ) - print(f"Top candidates results are stored in {best_log}\n") + print(f"Top20 candidates results are stored in {best_log}\n") print("Compiling unet candidates...") unet_candidates = compile_unet_candidates( @@ -634,7 +634,7 @@ def main(): ) print(f"Unet candidates compiled in {base_dir}\n") - print("Bnechmarking unet candidates...") + print(f"Bnechmarking [{len(unet_candidates)}] unet candidates...") unet_result_log = benchmark_unet( args, base_dir, unet_candidates, candidate_trackers ) diff --git a/tuning/tune.py b/tuning/tune.py index 6517a6f..7756542 100755 --- a/tuning/tune.py +++ b/tuning/tune.py @@ -557,7 +557,9 @@ def generate_constraints( constraints += [k == intrinsic_mn * z3.FreshInt()] constraints += [k * n % (wg_x * wg_y * wg_z) == 0] constraints += [k * m % (wg_x * wg_y * wg_z) == 0] - constraints += [subgroup_m_count * subgroup_n_count == 4] + # constraints += [subgroup_m_count * subgroup_n_count == 4] # splat + # constraints += [subgroup_m_count * subgroup_n_count == 2] # real_weights + constraints += [subgroup_m_count * subgroup_n_count == 5] # conv constraints += [z3.Or(waves_per_eu == 1, waves_per_eu == 2, waves_per_eu == 4)]