Add File
@@ -0,0 +1,250 @@
package org.dromara.easyai.transFormer.seflAttention;

import org.dromara.easyai.i.OutBack;
import org.dromara.easyai.matrixTools.Matrix;
import org.dromara.easyai.matrixTools.MatrixList;
import org.dromara.easyai.matrixTools.MatrixOperation;
import org.dromara.easyai.transFormer.CodecBlock;
import org.dromara.easyai.transFormer.FirstDecoderBlock;
import org.dromara.easyai.transFormer.model.LayNormModel;
import org.dromara.easyai.transFormer.nerve.HiddenNerve;

import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Random;

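/**
 * Residual connection plus layer normalization ("Add & Norm") for the transFormer blocks.
 * As read from the code below: each row of the residual sum is standardized in norm(Matrix) and
 * then passed through a learned affine map, a featureDimension x featureDimension matrix (power)
 * plus a bias row (bTa), rather than the per-element gamma/beta of textbook LayerNorm.
 * Layers with type == 1 sit behind the attention sub-layer and feed the FNN (or, in the first
 * decoder layer, the block output); layers with type == 2 sit behind the FNN and emit the block
 * output. Hypothetical wiring sketch, for illustration only (in the library this wiring is
 * presumably done by CodecBlock / FirstDecoderBlock rather than by user code; all variable
 * names below are placeholders):
 * <pre>
 *     LayNorm addNorm1 = new LayNorm(1, featureDimension, encoderBlock, null, study, coreNumber, true, depth);
 *     addNorm1.setMultiSelfAttention(attention); // backward path of a type 1 layer
 *     addNorm1.setHiddenNerves(hiddenNerves);    // forward path into the FNN
 *     addNorm1.addNorm(attentionOut, blockInput, eventID, isStudy, outBack, E, encoderFeature, outAllPro);
 * </pre>
 */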
public class LayNorm {//residual connection and layer normalization
    private MultiSelfAttention multiSelfAttention;//multi-head attention
    private final CodecBlock myEncoderBlock;
    private final int featureDimension;//feature dimension
    private List<HiddenNerve> hiddenNerves;//first hidden layer
    private final int type;//layer type, needs to be saved with the model
    private final Map<Long, MatrixList> reMatrixMap = new HashMap<>();
    private final FirstDecoderBlock firstDecoderBlock;
    private Matrix bTa;//needs to be saved with the model
    private Matrix power;//needs to be saved with the model
    private Matrix myNormData;//data after the first normalization step
    private final float study;//learning rate
    private Matrix myFinalError;//total error passed back from the FNN
    private int number;//counts how many error matrices the FNN has passed back
    private final MatrixOperation matrixOperation;
    private final boolean encoder;
    private final int depth;

    public LayNormModel getModel() throws Exception {
        LayNormModel layNormModel = new LayNormModel();
        layNormModel.setbTa(bTa.getMatrix());
        layNormModel.setPower(power.getMatrix());
        return layNormModel;
    }

    public void insertModel(LayNormModel layNormModel) throws Exception {
        insertPower(layNormModel.getPower(), power);
        insertPower(layNormModel.getbTa(), bTa);
    }

    private void insertPower(float[][] modelPower, Matrix power) throws Exception {
        for (int i = 0; i < power.getX(); i++) {
            for (int j = 0; j < power.getY(); j++) {
                power.setNub(i, j, modelPower[i][j]);
            }
        }
    }

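    // Note on initialization (reading of the code, not documented in the source): weights are
    // drawn uniformly from [0, 1/sh). For the first decoder layer (encoder == false && depth == 1)
    // sh is featureDimension^2, which keeps that layer's initial affine output much smaller than
    // elsewhere; treat this as an observed detail rather than a stated contract.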
    public LayNorm(int type, int featureDimension, CodecBlock myEncoderBlock, FirstDecoderBlock firstDecoderBlock
            , float study, int coreNumber, boolean encoder, int depth) throws Exception {
        this.study = study;
        this.myEncoderBlock = myEncoderBlock;
        this.encoder = encoder;
        this.depth = depth;
        this.type = type;
        this.featureDimension = featureDimension;
        this.firstDecoderBlock = firstDecoderBlock;
        matrixOperation = new MatrixOperation(coreNumber);
        bTa = new Matrix(1, featureDimension);
        power = new Matrix(featureDimension, featureDimension);
        Random random = new Random();
        float sh = 1;
        if (!encoder && depth == 1) {
            sh = featureDimension * featureDimension;
        }
        for (int i = 0; i < featureDimension; i++) {
            float value = random.nextFloat() / sh;
            bTa.setNub(0, i, value);
        }
        for (int i = 0; i < featureDimension; i++) {
            for (int j = 0; j < featureDimension; j++) {
                float value = random.nextFloat() / sh;
                power.setNub(i, j, value);
            }
        }
    }

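    // Backward pass for one normalized row (a reading of the code; not documented in the source):
    // matrixMulPd(error, input, power, false) appears to yield the update for power, while the
    // call with true yields the gradient with respect to the normalized input. The loop then
    // spreads each learning-rate-scaled component across the row, weighting its own position by
    // n = sqrt(row length) and every other position by -n/(n - 1), which looks like a hand-rolled
    // approximation of the normalization Jacobian (each input also shifts the row mean/variance).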
    private Matrix back(Matrix errorMatrix, Matrix myData) throws Exception {
        Matrix subPower = matrixOperation.matrixMulPd(errorMatrix, myData, power, false);
        Matrix sub = matrixOperation.matrixMulPd(errorMatrix, myData, power, true);
        power = matrixOperation.add(subPower, power);
        float n = (float) Math.sqrt(sub.getY());
        float nt = -n / (n - 1);
        Matrix subMatrix = new Matrix(1, sub.getY());
        for (int i = 0; i < sub.getY(); i++) {
            float subValue = sub.getNumber(0, i) * study;
            float value = subValue * n + subMatrix.getNumber(0, i);
            subMatrix.setNub(0, i, value);
            for (int j = 0; j < sub.getY(); j++) {
                if (i != j) {
                    float otherValue = subValue * nt + subMatrix.getNumber(0, j);
                    subMatrix.setNub(0, j, otherValue);
                }
            }
        }
        return subMatrix;
    }

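    // Error entry point for type 1 layers: each hidden nerve of the FNN reports its error
    // separately, so the contributions are summed until featureDimension of them have arrived.
    // The last column of the accumulated error is then dropped (the source does not say why;
    // possibly a bias column) before the residual error is added and propagation continues.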
    public void backErrorFromFNN(Matrix errorMatrix, long eventID, Matrix allError) throws Exception {//error passed down from the FNN (type 1)
        number++;
        if (myFinalError == null) {
            myFinalError = errorMatrix;
        } else {
            myFinalError = matrixOperation.add(myFinalError, errorMatrix);
        }
        if (number == featureDimension) {
            number = 0;
            Matrix error = myFinalError.getSonOfMatrix(0, 0, myFinalError.getX(), myFinalError.getY() - 1);
            myFinalError = null;
            Matrix myError = matrixOperation.add(error, allError);//add the residual error to the error returned by the FNN
            backErrorFromLine(myError, eventID);
        }
    }

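    // Used when this block is the encoder's last layer: incoming error matrices are summed in
    // backLastError, and encoderBackStart() later flushes the accumulated error into the
    // regular backward path.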
    public void backLastError(Matrix errorMatrix) throws Exception {//receives the error as the last layer of the encoder
        if (myFinalError == null) {
            myFinalError = errorMatrix;
        } else {
            myFinalError = matrixOperation.add(myFinalError, errorMatrix);
        }
    }

    public void encoderBackStart(long eventID) throws Exception {
        Matrix error = myFinalError.copy();
        myFinalError = null;
        backErrorFromLine(error, eventID);
    }

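    // Core backward routine: the incoming error is first scaled by the learning rate (mathMul
    // appears to modify errorMatrix in place, since its result is unused), then handled row by
    // row. For each row bTa is nudged by the scaled error and back() updates power while
    // converting the error through the normalization; the reassembled matrix is finally routed
    // either to the FNN's hidden nerves (type 2) or back to the multi-head attention (type 1).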
    public void backErrorFromLine(Matrix errorMatrix, long eventID) throws Exception {//error passed back from the linear layer (type 2)
        matrixOperation.mathMul(errorMatrix, study);
        int x = errorMatrix.getX();
        MatrixList errorMatrixList = null;
        for (int i = 0; i < x; i++) {
            Matrix error = errorMatrix.getRow(i);
            Matrix myData = myNormData.getRow(i);
            bTa = matrixOperation.add(error, bTa);//update bTa
            Matrix myRowError = back(error, myData);
            if (i == 0) {
                errorMatrixList = new MatrixList(myRowError, true);
            } else {
                errorMatrixList.add(myRowError);
            }
        }
        Matrix myError = errorMatrixList.getMatrix();
        //this module is done with its error, keep propagating backward: type 2 returns to the FNN, type 1 returns to the attention layer
        if (type == 2) {//return to the FNN
            int size = hiddenNerves.size();
            for (int i = 0; i < size; i++) {
                hiddenNerves.get(i).receiveErrorMatrix(myError.getColumn(i), eventID, myError);
            }
        } else {//error returns to the attention layer
            multiSelfAttention.backError(myError, eventID);
        }
    }

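    // Forward "Add & Norm": sums the two feature matrices (the residual connection), normalizes
    // the result, and routes the output. For type 1 it is sent to the FNN's first linear layer,
    // or, in the first decoder layer, straight to that block's output; otherwise (type 2) the
    // owning encoder block emits it as the block output.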
    public void addNorm(Matrix feature, Matrix outMatrix, long eventID, boolean isStudy
            , OutBack outBack, List<Integer> E, Matrix encoderFeature, boolean outAllPro) throws Exception {//residual connection and normalization
        Matrix myMatrix = matrixOperation.add(feature, outMatrix);//residual addition
        Matrix out = layNorm(myMatrix, isStudy);
//        if (!encoder && depth > 1 && type == 1) {
//            System.out.println(feature);
//            System.out.println(outMatrix);
//        }
        if (type == 1) {
            if (myEncoderBlock != null) {
                sendHiddenParameter(out, eventID, isStudy, outBack, E, encoderFeature, outAllPro);//send to the first linear layer
            } else if (firstDecoderBlock != null) {//first decoder layer: emit the output
                firstDecoderBlock.sendOutputMatrix(eventID, out, isStudy, outBack, E, outAllPro);
            }
        } else {//emit the output matrix
            myEncoderBlock.sendOutputMatrix(eventID, out, isStudy, outBack, E, encoderFeature, outAllPro);
        }
    }

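    // Collects the per-nerve outputs for one event (keyed by eventID) until featureDimension
    // columns have arrived, then performs the residual add-and-norm on the assembled matrix;
    // allFeature appears to be the other operand of the residual addition.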
    public void addNormFromNerve(long eventID, boolean isStudy, Matrix parameter, Matrix allFeature,
                                 OutBack outBack, List<Integer> E, Matrix encoderFeature, boolean outAllPro) throws Exception {
        MatrixList matrixFeature;
        if (reMatrixMap.containsKey(eventID)) {
            matrixFeature = reMatrixMap.get(eventID);
            matrixFeature.add(parameter);
        } else {
            matrixFeature = new MatrixList(parameter, false);
            reMatrixMap.put(eventID, matrixFeature);
        }
        if (matrixFeature.getY() == featureDimension) {//perform the residual step
            reMatrixMap.remove(eventID);
            addNorm(matrixFeature.getMatrix(), allFeature, eventID, isStudy, outBack, E, encoderFeature, outAllPro);
        }
    }

    private void sendHiddenParameter(Matrix feature, long eventId, boolean isStudy
            , OutBack outBack, List<Integer> E, Matrix encoderFeature, boolean outAllPro) throws Exception {//fan the output out to the hidden nerves
        for (HiddenNerve hiddenNerve : hiddenNerves) {
            hiddenNerve.receive(feature, eventId, isStudy, outBack, E, encoderFeature, outAllPro);
        }
    }

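    // Standardizes a single row: subtract the row mean and divide by the row's standard
    // deviation (getSdByMatrix is given a small epsilon, 1e-7, presumably to guard against
    // division by zero).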
    private Matrix norm(Matrix row) throws Exception {
        Matrix result = new Matrix(1, row.getY());
        float avg = row.getAVG();//mean
        float sd = matrixOperation.getSdByMatrix(row, avg, 0.0000001f);//standard deviation
        for (int i = 0; i < row.getY(); i++) {
            float value = (row.getNumber(0, i) - avg) / sd;
            result.setNub(0, i, value);
        }
        return result;
    }

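    // Row-wise layer normalization followed by the learned affine map: each row is standardized
    // by norm(), then multiplied by power and shifted by bTa. During training the standardized
    // rows are cached in myNormData, because back() needs them to compute the weight update.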
    private Matrix layNorm(Matrix feature, boolean isStudy) throws Exception {//perform the normalization
        int x = feature.getX();
        MatrixList normMatrixList = null;
        MatrixList outMatrixList = null;
        for (int i = 0; i < x; i++) {
            Matrix normData = norm(feature.getRow(i));//needed later by back()
            if (isStudy) {
                if (i == 0) {
                    normMatrixList = new MatrixList(normData, true);
                } else {
                    normMatrixList.add(normData);
                }
            }
            Matrix want = matrixOperation.add(matrixOperation.mulMatrix(normData, power), bTa);
            if (i == 0) {
                outMatrixList = new MatrixList(want, true);
            } else {
                outMatrixList.add(want);
            }
        }
        if (isStudy) {
            myNormData = normMatrixList.getMatrix();
        }
        return outMatrixList.getMatrix();
    }

    public void setHiddenNerves(List<HiddenNerve> hiddenNerves) {
        this.hiddenNerves = hiddenNerves;
    }

    public void setMultiSelfAttention(MultiSelfAttention multiSelfAttention) {
        this.multiSelfAttention = multiSelfAttention;
    }
}