Skip to content
Open
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions dace/codegen/targets/cuda.py
Original file line number Diff line number Diff line change
Expand Up @@ -2139,8 +2139,8 @@ def get_kernel_dimensions(self, dfg_scope):

# Check block size against configured maximum values, if those can be determined
total_bsize = prod(block_size)
total_limit = Config.get('compiler', 'cuda', 'block_size_limit')
lastdim_limit = Config.get('compiler', 'cuda', 'block_size_lastdim_limit')
total_limit = int(Config.get('compiler', 'cuda', 'block_size_limit'))
lastdim_limit = int(Config.get('compiler', 'cuda', 'block_size_lastdim_limit'))
if (total_bsize > total_limit) == True:
raise ValueError(f'Block size for kernel "{kernelmap_entry.map.label}" ({block_size}) '
f'is larger than the possible number of threads per block ({total_limit}). '
Expand Down
4 changes: 2 additions & 2 deletions dace/transformation/dataflow/add_threadblock_map.py
Original file line number Diff line number Diff line change
Expand Up @@ -76,8 +76,8 @@ def validate_block_size_limits(kernel_map_entry: nodes.MapEntry, block_size: Lis
kernel_map_label = kernel_map_entry.map.label

total_block_size = product(block_size)
limit = Config.get('compiler', 'cuda', 'block_size_limit')
lastdim_limit = Config.get('compiler', 'cuda', 'block_size_lastdim_limit')
limit = int(Config.get('compiler', 'cuda', 'block_size_limit'))
lastdim_limit = int(Config.get('compiler', 'cuda', 'block_size_lastdim_limit'))

if (total_block_size > limit) == True:
raise ValueError(f'Block size for kernel "{kernel_map_label}" ({block_size}) '
Expand Down