# Ceiling of exec_size[1] / workgroup_size[1], stored as an int. Presumably the
# number of workgroups needed along the second (y) dimension, rounded up so a
# non-zero remainder still gets a group -- confirm against the dispatch call.
# NOTE(review): the rounding relies on `/` being true division (Python 3, or
# `from __future__ import division`); with Python 2 integer operands the
# quotient would already be floored before math.ceil sees it.
extent_y, group_y = exec_size[1], workgroup_size[1]
nty = int(math.ceil(extent_y / group_y))