import sys from numpy import ones from numpy import triu, transpose, sqrt, exp, max, sum, zeros def attention(n,m,h): X = ones((n,m)) W1 = triu(ones((m,h))) W2 = triu(ones((m,h))) W3 = triu(ones((m,h))) Q = X@W1 # 矩阵相乘,请用@,千万别用*!!! K = X@W2 V = X@W3 S = (Q @ transpose(K)) / sqrt(h) def softmax(X): a...