Revert a change in attention

This commit is contained in:
Changming Sun 2020-04-23 19:18:05 -07:00 committed by Changming Sun
parent 2ab78c5da1
commit d97cb7338c

View file

@@ -319,7 +319,7 @@ Status Attention<T>::Compute(OpKernelContext* context) const {
for (std::ptrdiff_t i = begin; i != end; ++i) {
T* current_tmp_data = reinterpret_cast<T*>(out_tmp_data) + sequence_length_mul_head_size * i;
math::MatMul<T>(sequence_length, head_size, sequence_length,
reinterpret_cast<T*>(scratch_data) + sequence_length_mul_head_size * i,
reinterpret_cast<T*>(scratch_data) + sequence_length * sequence_length * i,
V + sequence_length_mul_head_size * i, current_tmp_data, nullptr);
// transpose: out(B, S, N, H) = transpose out_tmp(B, N, S, H)