Fix a bug to increment stride tile correctly (#503)
* Fix a bug to increment stride tile correctly
* Update regular_tile_access_iterator_tensor_op.h

Co-authored-by: peisun1115 <peis@google.com>
Co-authored-by: Haicheng Wu <57973641+hwu36@users.noreply.github.com>
This commit is contained in:
parent
0abaac84ea
commit
a29dfb1c63
@ -614,7 +614,7 @@ class RegularTileAccessIterator<Shape_, Element_,
|
|||||||
add_pointer_offset(coord.contiguous() * sections_per_stage_ * stride_ *
|
add_pointer_offset(coord.contiguous() * sections_per_stage_ * stride_ *
|
||||||
ThreadMap::kElementsPerAccess / sections_ +
|
ThreadMap::kElementsPerAccess / sections_ +
|
||||||
coord.strided() * Shape::kStrided * stride_ *
|
coord.strided() * Shape::kStrided * stride_ *
|
||||||
Layout::kElementsPerAccess);
|
Layout::kElementsPerAccess / Layout::kFactor);
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user