Skip to content
Snippets Groups Projects
Commit ce8f3cc4 authored by Dominic Kempf's avatar Dominic Kempf
Browse files

Small adjustments to prevent stupid stuff

parent c97ec72a
No related branches found
No related tags found
No related merge requests found
......@@ -57,13 +57,17 @@ def costmodel(sf):
# Penalize vertical vectorization
vertical_penalty = 1 + math.log(sf.vertical_width)
memory_penalty = 1.0
if isinstance(sf, VectorizedSumfactKernel):
memory_penalty = 1.0 + math.log(len(set(k.interface for k in sf.kernels)), 2)
# Penalize scalar sum factorization kernels
scalar_penalty = 1
if isinstance(sf, SumfactKernel):
scalar_penalty = get_vcl_type_size(dtype_floatingpoint())
# Return total operations
return sf.operations * vertical_penalty * scalar_penalty
return sf.operations * vertical_penalty * memory_penalty * scalar_penalty
def explicit_costfunction(sf):
......@@ -367,7 +371,7 @@ def _level2_optimal_vectorization_strategy_generator(sumfacts, width, qp, alread
def get_vectorization_dict(sumfacts, vertical, horizontal, qp):
# Discard opportunities that do not contain enough horizontal kernels
if len(sumfacts) not in (horizontal, horizontal - 1):
if len(sumfacts) not in (horizontal, horizontal * vertical - 1):
return None
# Enhance the list of sumfact nodes by adding vertical splittings
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment