android/renderscript/ScriptIntrinsicBLAS.java

25207df658d6a8a3e885c7017fcc25702363583cTim Murray/*
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * Copyright (C) 2015 The Android Open Source Project
25207df658d6a8a3e885c7017fcc25702363583cTim Murray *
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * Licensed under the Apache License, Version 2.0 (the "License");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * you may not use this file except in compliance with the License.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * You may obtain a copy of the License at
25207df658d6a8a3e885c7017fcc25702363583cTim Murray *
25207df658d6a8a3e885c7017fcc25702363583cTim Murray *      http://www.apache.org/licenses/LICENSE-2.0
25207df658d6a8a3e885c7017fcc25702363583cTim Murray *
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * Unless required by applicable law or agreed to in writing, software
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * distributed under the License is distributed on an "AS IS" BASIS,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * See the License for the specific language governing permissions and
25207df658d6a8a3e885c7017fcc25702363583cTim Murray * limitations under the License.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murraypackage android.renderscript;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murrayimport android.annotation.IntDef;
25207df658d6a8a3e885c7017fcc25702363583cTim Murrayimport java.lang.annotation.Retention;
25207df658d6a8a3e885c7017fcc25702363583cTim Murrayimport java.lang.annotation.RetentionPolicy;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray/**
25207df658d6a8a3e885c7017fcc25702363583cTim Murray *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang * ScriptIntrinsicBLAS class provides high performance RenderScript APIs to BLAS.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang * The BLAS (Basic Linear Algebra Subprograms) are routines that provide standard
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang * building blocks for performing basic vector and matrix operations.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang * For detailed description of BLAS, please refer to http://www.netlib.org/blas/
25207df658d6a8a3e885c7017fcc25702363583cTim Murray *
25207df658d6a8a3e885c7017fcc25702363583cTim Murray **/
25207df658d6a8a3e885c7017fcc25702363583cTim Murraypublic final class ScriptIntrinsicBLAS extends ScriptIntrinsic {
// NOTE(review): mLUT is not referenced anywhere in the visible part of this class —
// confirm whether it is still needed.
private Allocation mLUT;

/**
 * Wraps an already-created native intrinsic; instances are obtained through
 * {@link #create(RenderScript)}.
 *
 * @param id identifier forwarded unchanged to the superclass constructor
 * @param rs the RenderScript context forwarded unchanged to the superclass constructor
 */
private ScriptIntrinsicBLAS(long id, RenderScript rs) {
    super(id, rs);
}
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
// Routine selectors. Each public BLAS entry point hands one of these values to the
// matching mRS.nScriptIntrinsicBLAS_* call as its second argument (for example
// RsBlas_sgemv in SGEMV) to pick the routine to run.
// NOTE(review): the numbering presumably mirrors an enum on the native side —
// confirm before adding, removing or renumbering entries.
private static final int RsBlas_sdsdot = 1;
private static final int RsBlas_dsdot = 2;
private static final int RsBlas_sdot = 3;
private static final int RsBlas_ddot = 4;
private static final int RsBlas_cdotu_sub = 5;
private static final int RsBlas_cdotc_sub = 6;
private static final int RsBlas_zdotu_sub = 7;
private static final int RsBlas_zdotc_sub = 8;
private static final int RsBlas_snrm2 = 9;
private static final int RsBlas_sasum = 10;
private static final int RsBlas_dnrm2 = 11;
private static final int RsBlas_dasum = 12;
private static final int RsBlas_scnrm2 = 13;
private static final int RsBlas_scasum = 14;
private static final int RsBlas_dznrm2 = 15;
private static final int RsBlas_dzasum = 16;
private static final int RsBlas_isamax = 17;
private static final int RsBlas_idamax = 18;
private static final int RsBlas_icamax = 19;
private static final int RsBlas_izamax = 20;
private static final int RsBlas_sswap = 21;
private static final int RsBlas_scopy = 22;
private static final int RsBlas_saxpy = 23;
private static final int RsBlas_dswap = 24;
private static final int RsBlas_dcopy = 25;
private static final int RsBlas_daxpy = 26;
private static final int RsBlas_cswap = 27;
private static final int RsBlas_ccopy = 28;
private static final int RsBlas_caxpy = 29;
private static final int RsBlas_zswap = 30;
private static final int RsBlas_zcopy = 31;
private static final int RsBlas_zaxpy = 32;
private static final int RsBlas_srotg = 33;
private static final int RsBlas_srotmg = 34;
private static final int RsBlas_srot = 35;
private static final int RsBlas_srotm = 36;
private static final int RsBlas_drotg = 37;
private static final int RsBlas_drotmg = 38;
private static final int RsBlas_drot = 39;
private static final int RsBlas_drotm = 40;
private static final int RsBlas_sscal = 41;
private static final int RsBlas_dscal = 42;
private static final int RsBlas_cscal = 43;
private static final int RsBlas_zscal = 44;
private static final int RsBlas_csscal = 45;
private static final int RsBlas_zdscal = 46;
private static final int RsBlas_sgemv = 47;
private static final int RsBlas_sgbmv = 48;
private static final int RsBlas_strmv = 49;
private static final int RsBlas_stbmv = 50;
private static final int RsBlas_stpmv = 51;
private static final int RsBlas_strsv = 52;
private static final int RsBlas_stbsv = 53;
private static final int RsBlas_stpsv = 54;
private static final int RsBlas_dgemv = 55;
private static final int RsBlas_dgbmv = 56;
private static final int RsBlas_dtrmv = 57;
private static final int RsBlas_dtbmv = 58;
private static final int RsBlas_dtpmv = 59;
private static final int RsBlas_dtrsv = 60;
private static final int RsBlas_dtbsv = 61;
private static final int RsBlas_dtpsv = 62;
private static final int RsBlas_cgemv = 63;
private static final int RsBlas_cgbmv = 64;
private static final int RsBlas_ctrmv = 65;
private static final int RsBlas_ctbmv = 66;
private static final int RsBlas_ctpmv = 67;
private static final int RsBlas_ctrsv = 68;
private static final int RsBlas_ctbsv = 69;
private static final int RsBlas_ctpsv = 70;
private static final int RsBlas_zgemv = 71;
private static final int RsBlas_zgbmv = 72;
private static final int RsBlas_ztrmv = 73;
private static final int RsBlas_ztbmv = 74;
private static final int RsBlas_ztpmv = 75;
private static final int RsBlas_ztrsv = 76;
private static final int RsBlas_ztbsv = 77;
private static final int RsBlas_ztpsv = 78;
private static final int RsBlas_ssymv = 79;
private static final int RsBlas_ssbmv = 80;
private static final int RsBlas_sspmv = 81;
private static final int RsBlas_sger = 82;
private static final int RsBlas_ssyr = 83;
private static final int RsBlas_sspr = 84;
private static final int RsBlas_ssyr2 = 85;
private static final int RsBlas_sspr2 = 86;
private static final int RsBlas_dsymv = 87;
private static final int RsBlas_dsbmv = 88;
private static final int RsBlas_dspmv = 89;
private static final int RsBlas_dger = 90;
private static final int RsBlas_dsyr = 91;
private static final int RsBlas_dspr = 92;
private static final int RsBlas_dsyr2 = 93;
private static final int RsBlas_dspr2 = 94;
private static final int RsBlas_chemv = 95;
private static final int RsBlas_chbmv = 96;
private static final int RsBlas_chpmv = 97;
private static final int RsBlas_cgeru = 98;
private static final int RsBlas_cgerc = 99;
private static final int RsBlas_cher = 100;
private static final int RsBlas_chpr = 101;
private static final int RsBlas_cher2 = 102;
private static final int RsBlas_chpr2 = 103;
private static final int RsBlas_zhemv = 104;
private static final int RsBlas_zhbmv = 105;
private static final int RsBlas_zhpmv = 106;
private static final int RsBlas_zgeru = 107;
private static final int RsBlas_zgerc = 108;
private static final int RsBlas_zher = 109;
private static final int RsBlas_zhpr = 110;
private static final int RsBlas_zher2 = 111;
private static final int RsBlas_zhpr2 = 112;
private static final int RsBlas_sgemm = 113;
private static final int RsBlas_ssymm = 114;
private static final int RsBlas_ssyrk = 115;
private static final int RsBlas_ssyr2k = 116;
private static final int RsBlas_strmm = 117;
private static final int RsBlas_strsm = 118;
private static final int RsBlas_dgemm = 119;
private static final int RsBlas_dsymm = 120;
private static final int RsBlas_dsyrk = 121;
private static final int RsBlas_dsyr2k = 122;
private static final int RsBlas_dtrmm = 123;
private static final int RsBlas_dtrsm = 124;
private static final int RsBlas_cgemm = 125;
private static final int RsBlas_csymm = 126;
private static final int RsBlas_csyrk = 127;
private static final int RsBlas_csyr2k = 128;
private static final int RsBlas_ctrmm = 129;
private static final int RsBlas_ctrsm = 130;
private static final int RsBlas_zgemm = 131;
private static final int RsBlas_zsymm = 132;
private static final int RsBlas_zsyrk = 133;
private static final int RsBlas_zsyr2k = 134;
private static final int RsBlas_ztrmm = 135;
private static final int RsBlas_ztrsm = 136;
private static final int RsBlas_chemm = 137;
private static final int RsBlas_cherk = 138;
private static final int RsBlas_cher2k = 139;
private static final int RsBlas_zhemm = 140;
private static final int RsBlas_zherk = 141;
private static final int RsBlas_zher2k = 142;

// BLAS extensions start here; their selectors are numbered from 1000, leaving a
// gap after the sequential block above.
private static final int RsBlas_bnnm = 1000;
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Create an intrinsic to access BLAS subroutines.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param rs The RenderScript context
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @return ScriptIntrinsicBLAS
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public static ScriptIntrinsicBLAS create(RenderScript rs) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        long id = rs.nScriptIntrinsicCreate(13, Element.U32(rs).getID(rs));
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return new ScriptIntrinsicBLAS(id, rs);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
/**
 * Marks an int that must be one of {@link #NO_TRANSPOSE}, {@link #TRANSPOSE} or
 * {@link #CONJ_TRANSPOSE}. Source-retention only, so it has no runtime effect.
 *
 * @hide
 */
@IntDef({NO_TRANSPOSE, TRANSPOSE, CONJ_TRANSPOSE})
@Retention(RetentionPolicy.SOURCE)
public @interface Transpose {}

/**
 * Marks an int that must be either {@link #UPPER} or {@link #LOWER}.
 * Source-retention only, so it has no runtime effect.
 *
 * @hide
 */
@IntDef({UPPER, LOWER})
@Retention(RetentionPolicy.SOURCE)
public @interface Uplo {}

/**
 * Marks an int that must be either {@link #NON_UNIT} or {@link #UNIT}.
 * Source-retention only, so it has no runtime effect.
 *
 * @hide
 */
@IntDef({NON_UNIT, UNIT})
@Retention(RetentionPolicy.SOURCE)
public @interface Diag {}

/**
 * Marks an int that must be either {@link #LEFT} or {@link #RIGHT}.
 * Source-retention only, so it has no runtime effect.
 *
 * @hide
 */
@IntDef({LEFT, RIGHT})
@Retention(RetentionPolicy.SOURCE)
public @interface Side {}
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
// Values accepted for a @Transpose argument.
// NOTE(review): 111-113, 121-122, 131-132 and 141-142 presumably mirror the
// CBLAS_TRANSPOSE / CBLAS_UPLO / CBLAS_DIAG / CBLAS_SIDE enum values from cblas.h —
// confirm before changing any of them.
public static final int NO_TRANSPOSE = 111;
public static final int TRANSPOSE = 112;
public static final int CONJ_TRANSPOSE = 113;

// Values accepted for a @Uplo argument.
public static final int UPPER = 121;
public static final int LOWER = 122;

// Values accepted for a @Diag argument.
public static final int NON_UNIT = 131;
public static final int UNIT = 132;

// Values accepted for a @Side argument.
public static final int LEFT = 141;
public static final int RIGHT = 142;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateSide(@Side int Side) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Side != LEFT && Side != RIGHT) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid side passed to BLAS");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateTranspose(@Transpose int Trans) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Trans != NO_TRANSPOSE && Trans != TRANSPOSE &&
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            Trans != CONJ_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid transpose passed to BLAS");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateConjTranspose(@Transpose int Trans) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Trans != NO_TRANSPOSE &&
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            Trans != CONJ_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid transpose passed to BLAS");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateDiag(@Diag int Diag) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Diag != NON_UNIT && Diag != UNIT) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid diag passed to BLAS");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateUplo(@Uplo int Uplo) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (Uplo != UPPER && Uplo != LOWER) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid uplo passed to BLAS");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    /**
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     * Level 2 BLAS
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateGEMV(Element e, int TransA, Allocation A, Allocation X, int incX, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !Y.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1 || Y.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (incX <= 0 || incY <= 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Vector increments must be greater than 0");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = -1, expectedYDim = -1;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (TransA == NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            expectedYDim = 1 + (M - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            expectedXDim = 1 + (M - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            expectedYDim = 1 + (N - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim ||
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            Y.getType().getX() != expectedYDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for GEMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SGEMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d58/sgemv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SGEMV(@Transpose int TransA, float alpha, Allocation A, Allocation X, int incX, float beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F32(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_sgemv, TransA, 0, 0, 0, 0, M, N, 0, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DGEMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dc/da8/dgemv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DGEMV(@Transpose int TransA, double alpha, Allocation A, Allocation X, int incX, double beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F64(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dgemv, TransA, 0, 0, 0, 0, M, N, 0, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CGEMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y   or   y := alpha*A**H*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/d8a/cgemv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CGEMV(@Transpose int TransA, Float2 alpha, Allocation A, Allocation X, int incX, Float2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F32_2(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cgemv, TransA, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZGEMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y   or   y := alpha*A**H*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d40/zgemv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZGEMV(@Transpose int TransA, Double2 alpha, Allocation A, Allocation X, int incX, Double2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F64_2(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zgemv, TransA, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SGBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d6/d46/sgbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a M*N matrix, the input Allocation should also be of size M*N (dimY = M, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region M*(KL+KU+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert the original matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, m):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(max(0, i-kl), min(i+ku+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i+kl] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KL The number of sub-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KU The number of super-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains the band matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SGBMV(@Transpose int TransA, int KL, int KU, float alpha, Allocation A, Allocation X, int incX, float beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // GBMV has the same validation requirements as GEMV + KL and KU >= 0
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F32(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (KL < 0 || KU < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("KL and KU must be greater than or equal to 0");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_sgbmv, TransA, 0, 0, 0, 0, M, N, 0, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, KL, KU);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DGBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d2/d3f/dgbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a M*N matrix, the input Allocation should also be of size M*N (dimY = M, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region M*(KL+KU+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert the original matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, m):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(max(0, i-kl), min(i+ku+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i+kl] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KL The number of sub-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KU The number of super-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains the band matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DGBMV(@Transpose int TransA, int KL, int KU, double alpha, Allocation A, Allocation X, int incX, double beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // GBMV has the same validation requirements as GEMV + KL and KU >= 0
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F64(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (KL < 0 || KU < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("KL and KU must be greater than or equal to 0");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dgbmv, TransA, 0, 0, 0, 0, M, N, 0, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, KL, KU);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CGBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y   or   y := alpha*A**H*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/d75/cgbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a M*N matrix, the input Allocation should also be of size M*N (dimY = M, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region M*(KL+KU+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert the original matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, m):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(max(0, i-kl), min(i+ku+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i+kl] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KL The number of sub-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KU The number of super-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains the band matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CGBMV(@Transpose int TransA, int KL, int KU, Float2 alpha, Allocation A, Allocation X, int incX, Float2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // GBMV has the same validation requirements as GEMV + KL and KU >= 0
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F32_2(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (KL < 0 || KU < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("KL and KU must be greater than or equal to 0");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cgbmv, TransA, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, KL, KU);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZGBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y   or   y := alpha*A**T*x + beta*y   or   y := alpha*A**H*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d9/d46/zgbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a M*N matrix, the input Allocation should also be of size M*N (dimY = M, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region M*(KL+KU+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert the original matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, m):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(max(0, i-kl), min(i+ku+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i+kl] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KL The number of sub-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param KU The number of super-diagonals of the matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains the band matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZGBMV(@Transpose int TransA, int KL, int KU, Double2 alpha, Allocation A, Allocation X, int incX, Double2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // GBMV has the same validation requirements as GEMV + KL and KU >= 0
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGEMV(Element.F64_2(mRS), TransA, A, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (KL < 0 || KU < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("KL and KU must be greater than or equal to 0");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zgbmv, TransA, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, KL, KU);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang    static void validateTRMV(Element e, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Allocation A, Allocation X, int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateUplo(Uplo);
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (A.getType().getX() != N) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("A must be a square matrix for TRMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (incX <= 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Vector increments must be greater than 0");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for TRMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static int validateTPMV(Element e, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Allocation Ap, Allocation X, int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!Ap.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Ap must have a Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = (int)Math.sqrt((double)Ap.getType().getX() * 2);
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        //is it really doing anything?
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getX() != ((N * (N+1)) / 2)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid dimension for Ap");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Incorrect vector dimensions for TPMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return N;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STRMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/d45/strmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void STRMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Allocation A, Allocation X, int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_strmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTRMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dc/d7e/dtrmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DTRMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Allocation A, Allocation X, int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtrmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTRMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x   or   x := A**H*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/df/d78/ctrmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CTRMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Allocation A, Allocation X, int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32_2(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctrmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTRMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x   or   x := A**H*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/dd1/ztrmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZTRMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Allocation A, Allocation X, int incX) {
        // validateTRMV (defined outside this block) receives Element.F64_2(mRS) plus the caller arguments.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64_2(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_ztrmv via mRS.nScriptIntrinsicBLAS_Z. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztrmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d6/d7d/stbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void STBMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBMV has the same requirements as TRMV + K >= 0
        // A negative K is rejected here, before validateTRMV is consulted.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (K < 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("K must be greater than or equal to 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
        // validateTRMV (defined outside this block) receives Element.F32(mRS) plus the caller arguments.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_stbmv via mRS.nScriptIntrinsicBLAS_Single. K is forwarded in the slot
        // right after N; apart from getID(mRS), the function constant, TransA, Uplo, Diag, N, K,
        // the two allocation IDs and incX, every positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_stbmv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/df/d29/dtbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DTBMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBMV has the same requirements as TRMV + K >= 0
        // A negative K is rejected here, before validateTRMV is consulted.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (K < 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("K must be greater than or equal to 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
        // validateTRMV (defined outside this block) receives Element.F64(mRS) plus the caller arguments.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_dtbmv via mRS.nScriptIntrinsicBLAS_Double. K is forwarded in the slot
        // right after N; apart from getID(mRS), the function constant, TransA, Uplo, Diag, N, K,
        // the two allocation IDs and incX, every positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtbmv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x   or   x := A**H*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/dcd/ctbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CTBMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBMV has the same requirements as TRMV + K >= 0
        // A negative K is rejected here, before validateTRMV is consulted.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (K < 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("K must be greater than or equal to 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
        // validateTRMV (defined outside this block) receives Element.F32_2(mRS) plus the caller arguments.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32_2(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_ctbmv via mRS.nScriptIntrinsicBLAS_Complex. K is forwarded in the slot
        // right after N; apart from getID(mRS), the function constant, TransA, Uplo, Diag, N, K,
        // the two allocation IDs and incX, every positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctbmv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTBMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x   or   x := A**H*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/d39/ztbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZTBMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBMV has the same requirements as TRMV + K >= 0
        // A negative K is rejected here, before validateTRMV is consulted.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (K < 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("K must be greater than or equal to 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
        // validateTRMV (defined outside this block) receives Element.F64_2(mRS) plus the caller arguments.
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64_2(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_ztbmv via mRS.nScriptIntrinsicBLAS_Z. K is forwarded in the slot
        // right after N; apart from getID(mRS), the function constant, TransA, Uplo, Diag, N, K,
        // the two allocation IDs and incX, every positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztbmv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STPMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/db1/stpmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void STPMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
        // validateTPMV (defined outside this block) receives Element.F32(mRS) plus the caller
        // arguments; its int return value is what gets forwarded as N below.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F32(mRS), Uplo, TransA, Diag, Ap, X, incX);
        // Dispatch RsBlas_stpmv via mRS.nScriptIntrinsicBLAS_Single. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_stpmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTPMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dc/dcd/dtpmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DTPMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
        // validateTPMV (defined outside this block) receives Element.F64(mRS) plus the caller
        // arguments; its int return value is what gets forwarded as N below.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F64(mRS), Uplo, TransA, Diag, Ap, X, incX);
        // Dispatch RsBlas_dtpmv via mRS.nScriptIntrinsicBLAS_Double. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtpmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTPMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x   or   x := A**H*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/dbb/ctpmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CTPMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
        // validateTPMV (defined outside this block) receives Element.F32_2(mRS) plus the caller
        // arguments; its int return value is what gets forwarded as N below.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F32_2(mRS), Uplo, TransA, Diag, Ap, X, incX);
        // Dispatch RsBlas_ctpmv via mRS.nScriptIntrinsicBLAS_Complex. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctpmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTPMV performs one of the matrix-vector operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * x := A*x   or   x := A**T*x   or   x := A**H*x
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d2/d9e/ztpmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZTPMV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
        // validateTPMV (defined outside this block) receives Element.F64_2(mRS) plus the caller
        // arguments; its int return value is what gets forwarded as N below.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F64_2(mRS), Uplo, TransA, Diag, Ap, X, incX);
        // Dispatch RsBlas_ztpmv via mRS.nScriptIntrinsicBLAS_Z. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztpmv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STRSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/d2a/strsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void STRSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation A,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TRSV is the same as TRMV
        // Hence the TRMV validator (defined outside this block) is reused, here with Element.F32(mRS).
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_strsv via mRS.nScriptIntrinsicBLAS_Single. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_strsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTRSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d6/d96/dtrsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DTRSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation A,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TRSV is the same as TRMV
        // Hence the TRMV validator (defined outside this block) is reused, here with Element.F64(mRS).
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_dtrsv via mRS.nScriptIntrinsicBLAS_Double. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtrsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTRSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b   or   A**H*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/dc8/ctrsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CTRSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation A,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TRSV is the same as TRMV
        // Hence the TRMV validator (defined outside this block) is reused, here with Element.F32_2(mRS).
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32_2(mRS), Uplo, TransA, Diag, A, X, incX);
        // N is read from the Y dimension of the type of A.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
        // Dispatch RsBlas_ctrsv via mRS.nScriptIntrinsicBLAS_Complex. Apart from getID(mRS), the
        // function constant, TransA, Uplo, Diag, N, the two allocation IDs and incX, every
        // positional argument is passed as 0.
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctrsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTRSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b   or   A**H*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d1/d2f/ztrsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZTRSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation A,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TRSV is the same as TRMV
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64_2(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztrsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STBSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/d1f/stbsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void STBSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBSV is the same as TRMV + K >= 0
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (K < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Number of diagonals must be positive");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_stbsv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTBSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/dcf/dtbsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DTBSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBSV is the same as TRMV + K >= 0
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (K < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Number of diagonals must be positive");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtbsv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, A.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTBSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b   or   A**H*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d9/d5f/ctbsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CTBSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBSV is the same as TRMV + K >= 0
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F32_2(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (K < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Number of diagonals must be positive");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctbsv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTBSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b   or   A**H*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/d5a/ztbsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZTBSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  int K, Allocation A,  Allocation X,  int incX) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // TBSV is the same as TRMV + K >= 0
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateTRMV(Element.F64_2(mRS), Uplo, TransA, Diag, A, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (K < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Number of diagonals must be positive");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztbsv, TransA, 0, 0, Uplo, Diag, 0, N, K, 0, 0, A.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STPSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/d7c/stpsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void STPSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TPSV is same as TPMV
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F32(mRS), Uplo, TransA, Diag, Ap, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_stpsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTPSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d9/d84/dtpsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DTPSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TPSV is same as TPMV
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F64(mRS), Uplo, TransA, Diag, Ap, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtpsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTPSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b   or   A**H*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d8/d56/ctpsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CTPSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TPSV is same as TPMV
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F32_2(mRS), Uplo, TransA, Diag, Ap, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctpsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTPSV solves one of the systems of equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A*x = b   or   A**T*x = b   or   A**H*x = b
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/da/d57/ztpsv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For an N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the matrix is an upper or lower triangular matrix.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains packed matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZTPSV(@Uplo int Uplo, @Transpose int TransA, @Diag int Diag,  Allocation Ap,  Allocation X,  int incX) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // TPSV is same as TPMV
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateTPMV(Element.F64_2(mRS), Uplo, TransA, Diag, Ap, X, incX);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztpsv, TransA, 0, 0, Uplo, Diag, 0, N, 0, 0, 0, Ap.getID(mRS), X.getID(mRS), 0, 0, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    /**
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     * Level 2, S and D only
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static int validateSYMV(Element e, @Uplo int Uplo, Allocation A, Allocation X, Allocation Y, int incX, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (A.getType().getX() != N) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("A must be a square matrix for SYMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !Y.getType().getElement().isCompatible(e) ) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1 || Y.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (incX <= 0 || incY <= 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Vector increments must be greater than 0");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for SYMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedYDim = 1 + (N - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Y.getType().getX() != expectedYDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for SYMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return N;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static int validateSPMV(Element e, @Uplo int Uplo, Allocation Ap, Allocation X, int incX, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!Ap.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !Y.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1 || Y.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Ap must have a Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = (int)Math.sqrt((double)Ap.getType().getX() * 2);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getX() != ((N * (N+1)) / 2)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid dimension for Ap");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0 || incY <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for SPMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedYDim = 1 + (N - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Y.getType().getX() != expectedYDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for SPMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return N;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateGER(Element e, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !Y.getType().getElement().isCompatible(e) ) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1 || Y.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (N < 1 || M < 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("M and N must be 1 or greater for GER");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0 || incY <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        int expectedXDim = 1 + (M - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for GER");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedYDim = 1 + (N - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Y.getType().getX() != expectedYDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for GER");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static int validateSYR(Element e, @Uplo int Uplo, Allocation X, int incX, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (N != A.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("A must be a symmetric matrix");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for SYR");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return N;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static int validateSPR(Element e, @Uplo int Uplo, Allocation X, int incX, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!Ap.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Ap must have a Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = (int)Math.sqrt((double)Ap.getType().getX() * 2);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getX() != ((N * (N+1)) / 2)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid dimension for Ap");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Incorrect vector dimensions for SPR");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return N;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static int validateSYR2(Element e, @Uplo int Uplo, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !Y.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1 || Y.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (N != A.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("A must be a symmetric matrix");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0 || incY <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedYDim = 1 + (N - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim || Y.getType().getX() != expectedYDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for SYR");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return N;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static int validateSPR2(Element e, @Uplo int Uplo, Allocation X, int incX, Allocation Y, int incY, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!Ap.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !Y.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1 || Y.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Ap must have a Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = (int)Math.sqrt((double)Ap.getType().getX() * 2);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Ap.getType().getX() != ((N * (N+1)) / 2)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid dimension for Ap");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0 || incY <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedXDim = 1 + (N - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedYDim = 1 + (N - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim || Y.getType().getX() != expectedYDim) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Incorrect vector dimensions for SPR2");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        return N;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSYMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d2/d94/ssymv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SSYMV(@Uplo int Uplo, float alpha, Allocation A, Allocation X, int incX, float beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYMV(Element.F32(mRS), Uplo, A, X, Y, incX, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_ssymv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSBMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/da1/ssbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine can is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert a UPPER trianglar matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the band matrix A is being supplied.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SSBMV(@Uplo int Uplo, int K, float alpha, Allocation A, Allocation X, int incX, float beta, Allocation Y, int incY) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // SBMV is the same as SYMV + K >= 0
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (K < 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("K must be greater than or equal to 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYMV(Element.F32(mRS), Uplo, A, X, Y, incX, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_ssbmv, 0, 0, 0, Uplo, 0, 0, N, K, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSPMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d8/d68/sspmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine can is an example showing how to convert a UPPER trianglar matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the matrix A is supplied in packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SSPMV(@Uplo int Uplo, float alpha, Allocation Ap, Allocation X, int incX, float beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPMV(Element.F32(mRS), Uplo, Ap, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_sspmv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, Ap.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SGER performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d5c/sger_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SGER(float alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateGER(Element.F32(mRS), X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_sger, 0, 0, 0, 0, 0, M, N, 0, alpha, X.getID(mRS), Y.getID(mRS), 0.f, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSYR performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d6/dac/ssyr_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SSYR(@Uplo int Uplo, float alpha, Allocation X, int incX, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR(Element.F32(mRS), Uplo, X, incX, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_ssyr, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), A.getID(mRS), 0.f, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSPR performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d2/d9b/sspr_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine can is an example showing how to convert a UPPER trianglar matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SSPR(@Uplo int Uplo, float alpha, Allocation X, int incX, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR(Element.F32(mRS), Uplo, X, incX, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_sspr, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), Ap.getID(mRS), 0.f, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSYR2 performs the symmetric rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + alpha*y*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d99/ssyr2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SSYR2(@Uplo int Uplo, float alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F32(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_ssyr2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), Y.getID(mRS), 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSPR2 performs the symmetric rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + alpha*y*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d3e/sspr2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void SSPR2(@Uplo int Uplo, float alpha, Allocation X, int incX, Allocation Y, int incY, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR2(Element.F32(mRS), Uplo, X, incX, Y, incY, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_sspr2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), Y.getID(mRS), 0, Ap.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSYMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d8/dbe/dsymv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DSYMV(@Uplo int Uplo, double alpha, Allocation A, Allocation X, int incX, double beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYMV(Element.F64(mRS), Uplo, A, X, Y, incX, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dsymv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSBMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d8/d1e/dsbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine can is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert a UPPER trianglar matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the band matrix A is being supplied.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DSBMV(@Uplo int Uplo, int K, double alpha, Allocation A, Allocation X, int incX, double beta, Allocation Y, int incY) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        // SBMV is the same as SYMV + K >= 0
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (K < 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("K must be greater than or equal to 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYMV(Element.F64(mRS), Uplo, A, X, Y, incX, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dsbmv, 0, 0, 0, Uplo, 0, 0, N, K, alpha, A.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSPMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/d85/dspmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine can is an example showing how to convert a UPPER trianglar matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the matrix A is supplied in packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DSPMV(@Uplo int Uplo, double alpha, Allocation Ap, Allocation X, int incX, double beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPMV(Element.F64(mRS), Uplo, Ap, X, incX, Y, incY);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dspmv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, Ap.getID(mRS), X.getID(mRS), beta, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DGER performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dc/da8/dger_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DGER(double alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        validateGER(Element.F64(mRS), X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dger, 0, 0, 0, 0, 0, M, N, 0, alpha, X.getID(mRS), Y.getID(mRS), 0.f, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSYR performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/d60/dsyr_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    public void DSYR(@Uplo int Uplo, double alpha, Allocation X, int incX, Allocation A) {
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang        int N = validateSYR(Element.F64(mRS), Uplo, X, incX, A);
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dsyr, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), A.getID(mRS), 0.f, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSPR performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dd/dba/dspr_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine can is an example showing how to convert a UPPER trianglar matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DSPR(@Uplo int Uplo, double alpha, Allocation X, int incX, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR(Element.F64(mRS), Uplo, X, incX, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dspr, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), Ap.getID(mRS), 0.f, 0, incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSYR2 performs the symmetric rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + alpha*y*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/d41/dsyr2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DSYR2(@Uplo int Uplo, double alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F64(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dsyr2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), Y.getID(mRS), 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSPR2 performs the symmetric rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + alpha*y*x**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dd/d9e/dspr2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine can is an example showing how to convert a UPPER trianglar matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void DSPR2(@Uplo int Uplo, double alpha, Allocation X, int incX, Allocation Y, int incY, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR2(Element.F64(mRS), Uplo, X, incX, Y, incY, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dspr2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, X.getID(mRS), Y.getID(mRS), 0, Ap.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    /**
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     * Level 2, C and Z only
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateGERU(Element e, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !X.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !Y.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getY() > 1 || Y.getType().getY() > 1) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("BLAS vectors must have Y dimension of 0 or 1");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        if (incX <= 0 || incY <= 0) {
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang            throw new RSRuntimeException("Vector increments must be greater than 0");
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        }
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        int expectedXDim = 1 + (M - 1) * incX;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (X.getType().getX() != expectedXDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for GERU");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int expectedYDim = 1 + (N - 1) * incY;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Y.getType().getX() != expectedYDim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Incorrect vector dimensions for GERU");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHEMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d7/d51/chemv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CHEMV(@Uplo int Uplo, Float2 alpha, Allocation A, Allocation X, int incX, Float2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // HEMV is the same as SYR2 validation-wise
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F32_2(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_chemv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHBMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/dc2/chbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine can is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert a UPPER trianglar matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the band matrix A is being supplied.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CHBMV(@Uplo int Uplo, int K, Float2 alpha, Allocation A, Allocation X, int incX, Float2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // HBMV is the same as SYR2 validation-wise
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F32_2(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (K < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("K must be 0 or greater for HBMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_chbmv, 0, 0, 0, Uplo, 0, 0, N, K, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHPMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d2/d06/chpmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine can is an example showing how to convert a UPPER trianglar matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the matrix A is supplied in packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CHPMV(@Uplo int Uplo, Float2 alpha, Allocation Ap, Allocation X, int incX, Float2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // HPMV is the same as SPR2
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR2(Element.F32_2(mRS), Uplo, X, incX, Y, incY, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_chpmv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, Ap.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CGERU performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d5f/cgeru_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CGERU(Float2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGERU(Element.F32_2(mRS), X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cgeru, 0, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CGERC performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dd/d84/cgerc_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CGERC(Float2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as GERU
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGERU(Element.F32_2(mRS), X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cgerc, 0, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHER performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/d6d/cher_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CHER(@Uplo int Uplo, float alpha, Allocation X, int incX, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as SYR
68ca43ebe6e162ff13fc4f96d5aacd494980f6b6Miao Wang        int N = validateSYR(Element.F32_2(mRS), Uplo, X, incX, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cher, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, 0, X.getID(mRS), 0, 0, 0, A.getID(mRS), incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHPR performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/dcd/chpr_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CHPR(@Uplo int Uplo, float alpha, Allocation X, int incX, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // equivalent to SPR for validation
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR(Element.F32_2(mRS), Uplo, X, incX, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_chpr, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, 0, X.getID(mRS), 0, 0, 0, Ap.getID(mRS), incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHER2 performs the hermitian rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**H + conjg( alpha )*y*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d87/cher2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CHER2(@Uplo int Uplo, Float2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as SYR2
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F32_2(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cher2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHPR2 performs the hermitian rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**H + conjg( alpha )*y*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d6/d44/chpr2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void CHPR2(@Uplo int Uplo, Float2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as SPR2
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR2(Element.F32_2(mRS), Uplo, X, incX, Y, incY, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_chpr2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, Ap.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHEMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/ddd/zhemv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZHEMV(@Uplo int Uplo, Double2 alpha, Allocation A, Allocation X, int incX, Double2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // HEMV is the same as SYR2 validation-wise
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F64_2(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zhemv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHBMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/d1a/zhbmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should also be of size N*N (dimY = N, dimX = N),
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       but only the region N*(K+1) will be referenced. The following subroutine is an
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       example showing how to convert an UPPER triangular matrix 'a' to row-based band matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, min(i+k+1, n)):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[i, j-i] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the band matrix A is being supplied.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param K The number of off-diagonals of the matrix A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZHBMV(@Uplo int Uplo, int K, Double2 alpha, Allocation A, Allocation X, int incX, Double2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // HBMV is the same as SYR2 validation-wise
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F64_2(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (K < 0) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("K must be 0 or greater for HBMV");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zhbmv, 0, 0, 0, Uplo, 0, 0, N, K, alpha.x, alpha.y, A.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHPMV performs the matrix-vector operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * y := alpha*A*x + beta*y
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/d60/zhpmv_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of the matrix A is supplied in packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZHPMV(@Uplo int Uplo, Double2 alpha, Allocation Ap, Allocation X, int incX, Double2 beta, Allocation Y, int incY) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // HPMV is the same as SPR2
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR2(Element.F64_2(mRS), Uplo, X, incX, Y, incY, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zhpmv, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, Ap.getID(mRS), X.getID(mRS), beta.x, beta.y, Y.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZGERU performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**T + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d7/d12/zgeru_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZGERU(Double2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGERU(Element.F64_2(mRS), X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zgeru, 0, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZGERC performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/dad/zgerc_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZGERC(Double2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as GERU
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateGERU(Element.F64_2(mRS), X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zgerc, 0, 0, 0, 0, 0, M, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHER performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/d0e/zher_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZHER(@Uplo int Uplo, double alpha, Allocation X, int incX, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as SYR
cecc00aba1012d4f19bc78fcd12ddcbccdd49182Miao Wang        int N = validateSYR(Element.F64_2(mRS), Uplo, X, incX, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zher, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, 0, X.getID(mRS), 0, 0, 0, A.getID(mRS), incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHPR performs the rank 1 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/de1/zhpr_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine is an example showing how to convert an UPPER triangular matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZHPR(@Uplo int Uplo, double alpha, Allocation X, int incX, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // equivalent to SPR for validation
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR(Element.F64_2(mRS), Uplo, X, incX, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zhpr, 0, 0, 0, Uplo, 0, 0, N, 0, alpha, 0, X.getID(mRS), 0, 0, 0, Ap.getID(mRS), incX, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHER2 performs the symmetric rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**H + alpha*y*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/da/d8a/zher2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZHER2(@Uplo int Uplo, Double2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation A) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as SYR2
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSYR2(Element.F64_2(mRS), Uplo, X, incX, Y, incY, A);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zher2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, A.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHPR2 performs the symmetric rank 2 operation
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * A := alpha*x*y**H + alpha*y*x**H + A
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d5/d52/zhpr2_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Note: For a N*N matrix, the input Allocation should be a 1D allocation of size dimX = N*(N+1)/2,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       The following subroutine can is an example showing how to convert a UPPER trianglar matrix
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *       'a' to packed matrix 'b'.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           k = 0
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *           for i in range(0, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *              for j in range(i, n):
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *                  b[k++] = a[i, j]
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be supplied in the packed form.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param X The input allocation contains vector x, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incX The increment for the elements of vector x, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Y The input allocation contains vector y, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param incY The increment for the elements of vector y, must be larger than zero.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Ap The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
89c3a5f8c5fd96016e7e277fc49e1f4be10c617bMiao Wang    public void ZHPR2(@Uplo int Uplo, Double2 alpha, Allocation X, int incX, Allocation Y, int incY, Allocation Ap) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // same as SPR2
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int N = validateSPR2(Element.F64_2(mRS), Uplo, X, incX, Y, incY, Ap);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zhpr2, 0, 0, 0, Uplo, 0, 0, N, 0, alpha.x, alpha.y, X.getID(mRS), Y.getID(mRS), 0, 0, Ap.getID(mRS), incX, incY, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    /**
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     * Level 3 BLAS
25207df658d6a8a3e885c7017fcc25702363583cTim Murray     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateL3(Element e, int TransA, int TransB, int Side, Allocation A, Allocation B, Allocation C) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        int aM = -1, aN = -1, bM = -1, bN = -1, cM = -1, cN = -1;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if ((A != null && !A.getType().getElement().isCompatible(e)) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            (B != null && !B.getType().getElement().isCompatible(e)) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            (C != null && !C.getType().getElement().isCompatible(e))) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (C == null) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            //since matrix C is used to store the result, it cannot be null.
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            throw new RSRuntimeException("Allocation C cannot be null");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        cM = C.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        cN = C.getType().getX();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Side == RIGHT) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if ((A == null && B != null) || (A != null && B == null)) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                throw new RSRuntimeException("Provided Matrix A without Matrix B, or vice versa");
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            if (B != null) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                bM = A.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                bN = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            if (A != null) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                aM = B.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                aN = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            if (A != null) {
1e940d87c46edc672964c7674cff8da6441e9559Miao Wang                if (TransA == TRANSPOSE || TransA == CONJ_TRANSPOSE) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    aN = A.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    aM = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                } else {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    aM = A.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    aN = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            if (B != null) {
1e940d87c46edc672964c7674cff8da6441e9559Miao Wang                if (TransB == TRANSPOSE || TransB == CONJ_TRANSPOSE) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    bN = B.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    bM = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                } else {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    bM = B.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                    bN = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (A != null && B != null && C != null) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (aN != bM || aM != cM || bN != cN) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called BLAS with invalid dimensions");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else if (A != null && C != null) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            // A and C only, for SYRK
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (cM != cN) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                throw new RSRuntimeException("Matrix C is not symmetric");
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            }
50a8ff108f40fe912690ebb34340783bb4f052aeMiao Wang            if (aM != cM) {
50a8ff108f40fe912690ebb34340783bb4f052aeMiao Wang                throw new RSRuntimeException("Called BLAS with invalid dimensions");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else if (A != null && B != null) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // A and B only
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (aN != bM) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang                throw new RSRuntimeException("Called BLAS with invalid dimensions");
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SGEMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*op(A)*op(B) + beta*C   where op(X) is one of op(X) = X  or  op(X) = X**T
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/de2/sgemm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransB The type of transpose applied to matrix B.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void SGEMM(@Transpose int TransA, @Transpose int TransB, float alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, float beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransB);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F32(mRS), TransA, TransB, 0, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = -1, N = -1, K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransA != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransB != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_sgemm, TransA, TransB, 0, 0, 0, M, N, K,  alpha, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                        beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DGEMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*op(A)*op(B) + beta*C   where op(X) is one of op(X) = X  or  op(X) = X**T
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d7/d2b/dgemm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransB The type of transpose applied to matrix B.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void DGEMM(@Transpose int TransA, @Transpose int TransB, double alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, double beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransB);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F64(mRS), TransA, TransB, 0, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = -1, N = -1, K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransA != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransB != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dgemm, TransA, TransB, 0, 0, 0, M, N, K,  alpha, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                        beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CGEMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*op(A)*op(B) + beta*C   where op(X) is one of op(X) = X  or  op(X) = X**T  or  op(X) = X**H
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d6/d5b/cgemm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransB The type of transpose applied to matrix B.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void CGEMM(@Transpose int TransA, @Transpose int TransB, Float2 alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, Float2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransB);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F32_2(mRS), TransA, TransB, 0, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = -1, N = -1, K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransA != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransB != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cgemm, TransA, TransB, 0, 0, 0, M, N, K,  alpha.x, alpha.y, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                         beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZGEMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*op(A)*op(B) + beta*C   where op(X) is one of op(X) = X  or  op(X) = X**T  or  op(X) = X**H
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d7/d76/zgemm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransB The type of transpose applied to matrix B.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
54de77470de4f605eef7f4b4e01718b301fe275eElliot Waite     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
54de77470de4f605eef7f4b4e01718b301fe275eElliot Waite     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
54de77470de4f605eef7f4b4e01718b301fe275eElliot Waite     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void ZGEMM(@Transpose int TransA, @Transpose int TransB, Double2 alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, Double2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransB);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F64_2(mRS), TransA, TransB, 0, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int M = -1, N = -1, K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransA != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            M = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (TransB != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            N = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zgemm, TransA, TransB, 0, 0, 0, M, N, K,  alpha.x, alpha.y, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                   beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSYMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B + beta*C   or   C := alpha*B*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d7/d42/ssymm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void SSYMM(@Side int Side, @Uplo int Uplo, float alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, float beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSide(Side);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        //For SYMM, Matrix A should be symmetric
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (A.getType().getX() != A.getType().getY()) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            throw new RSRuntimeException("Matrix A is not symmetric");
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F32(mRS), 0, 0, Side, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_ssymm, 0, 0, Side, Uplo, 0, C.getType().getY(), C.getType().getX(), 0, alpha, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                        beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSYMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B + beta*C   or   C := alpha*B*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d8/db0/dsymm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void DSYMM(@Side int Side, @Uplo int Uplo, double alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, double beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSide(Side);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (A.getType().getX() != A.getType().getY()) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            throw new RSRuntimeException("Matrix A is not symmetric");
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F64(mRS), 0, 0, Side, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dsymm, 0, 0, Side, Uplo, 0, C.getType().getY(), C.getType().getX(), 0, alpha, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                        beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CSYMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B + beta*C   or   C := alpha*B*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/db/d59/csymm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void CSYMM(@Side int Side, @Uplo int Uplo, Float2 alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, Float2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSide(Side);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (A.getType().getX() != A.getType().getY()) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            throw new RSRuntimeException("Matrix A is not symmetric");
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F32_2(mRS), 0, 0, Side, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_csymm, 0, 0, Side, Uplo, 0, C.getType().getY(), C.getType().getX(), 0, alpha.x, alpha.y, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                         beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZSYMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B + beta*C   or   C := alpha*B*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/df/d51/zsymm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void ZSYMM(@Side int Side, @Uplo int Uplo, Double2 alpha, Allocation A,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                      Allocation B, Double2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSide(Side);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (A.getType().getX() != A.getType().getY()) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            throw new RSRuntimeException("Matrix A is not symmetric");
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F64_2(mRS), 0, 0, Side, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zsymm, 0, 0, Side, Uplo, 0, C.getType().getY(), C.getType().getX(), 0, alpha.x, alpha.y, A.getID(mRS), B.getID(mRS),
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                   beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSYRK performs one of the symmetric rank k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*A**T + beta*C   or   C := alpha*A**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d0/d40/ssyrk_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void SSYRK(@Uplo int Uplo, @Transpose int Trans, float alpha, Allocation A, float beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(Trans);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F32(mRS), Trans, 0, 0, A, null, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_ssyrk, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha, A.getID(mRS), 0, beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSYRK performs one of the symmetric rank k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*A**T + beta*C   or   C := alpha*A**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dc/d05/dsyrk_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void DSYRK(@Uplo int Uplo, @Transpose int Trans, double alpha, Allocation A, double beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(Trans);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F64(mRS), Trans, 0, 0, A, null, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dsyrk, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha, A.getID(mRS), 0, beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CSYRK performs one of the symmetric rank k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*A**T + beta*C   or   C := alpha*A**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/d6a/csyrk_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang    public void CSYRK(@Uplo int Uplo, @Transpose int Trans, Float2 alpha, Allocation A, Float2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(Trans);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F32_2(mRS), Trans, 0, 0, A, null, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_csyrk, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha.x, alpha.y, A.getID(mRS), 0, beta.x, beta.y,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                         C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZSYRK performs one of the symmetric rank k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*A**T + beta*C   or   C := alpha*A**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/d54/zsyrk_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang    public void ZSYRK(@Uplo int Uplo, @Transpose int Trans, Double2 alpha, Allocation A, Double2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(Trans);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateL3(Element.F64_2(mRS), Trans, 0, 0, A, null, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zsyrk, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha.x, alpha.y, A.getID(mRS), 0, beta.x, beta.y,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                   C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateSYR2K(Element e, @Transpose int Trans, Allocation A, Allocation B, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(Trans);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !B.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !C.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int Cdim = -1;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // A is n x k if no transpose, k x n if transpose
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // C is n x n
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Trans == TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // check columns versus C
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            Cdim = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // check rows versus C
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            Cdim = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (C.getType().getX() != Cdim || C.getType().getY() != Cdim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid symmetric matrix in SYR2K");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // A dims == B dims
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (A.getType().getX() != B.getType().getX() || A.getType().getY() != B.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Invalid A and B in SYR2K");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * SSYR2K performs one of the symmetric rank 2k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B**T + alpha*B*A**T + beta*C   or   C := alpha*A**T*B + alpha*B**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/df/d3d/ssyr2k_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void SSYR2K(@Uplo int Uplo, @Transpose int Trans, float alpha, Allocation A, Allocation B, float beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSYR2K(Element.F32(mRS), Trans, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
1e940d87c46edc672964c7674cff8da6441e9559Miao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_ssyr2k, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha, A.getID(mRS), B.getID(mRS), beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DSYR2K performs one of the symmetric rank 2k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B**T + alpha*B*A**T + beta*C   or   C := alpha*A**T*B + alpha*B**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d1/dec/dsyr2k_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void DSYR2K(@Uplo int Uplo, @Transpose int Trans, double alpha, Allocation A, Allocation B, double beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSYR2K(Element.F64(mRS), Trans, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
1e940d87c46edc672964c7674cff8da6441e9559Miao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dsyr2k, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha, A.getID(mRS), B.getID(mRS), beta, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CSYR2K performs one of the symmetric rank 2k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B**T + alpha*B*A**T + beta*C   or   C := alpha*A**T*B + alpha*B**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/d7e/csyr2k_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void CSYR2K(@Uplo int Uplo, @Transpose int Trans, Float2 alpha, Allocation A, Allocation B, Float2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSYR2K(Element.F32_2(mRS), Trans, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
1e940d87c46edc672964c7674cff8da6441e9559Miao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_csyr2k, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZSYR2K performs one of the symmetric rank 2k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B**T + alpha*B*A**T + beta*C   or   C := alpha*A**T*B + alpha*B**T*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/df/d20/zsyr2k_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void ZSYR2K(@Uplo int Uplo, @Transpose int Trans, Double2 alpha, Allocation A, Allocation B, Double2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSYR2K(Element.F64_2(mRS), Trans, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int K = -1;
1e940d87c46edc672964c7674cff8da6441e9559Miao Wang        if (Trans != NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            K = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zsyr2k, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), K, alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateTRMM(Element e, @Side int Side, @Transpose int TransA, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSide(Side);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        int aM = -1, aN = -1, bM = -1, bN = -1;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !B.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        aM = A.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        aN = A.getType().getX();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (aM != aN) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            throw new RSRuntimeException("Called TRMM with a non-symmetric matrix A");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        bM = B.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        bN = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Side == LEFT) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (aN != bM) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called TRMM with invalid matrices");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (bN != aM) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called TRMM with invalid matrices");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STRMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * B := alpha*op(A)*B   or   B := alpha*B*op(A)
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/df/d01/strmm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void STRMM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, float alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRMM(Element.F32(mRS), Side, TransA, A, B);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_strmm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                        alpha, A.getID(mRS), B.getID(mRS), 0.f, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTRMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * B := alpha*op(A)*B   or   B := alpha*B*op(A)
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/dd/d19/dtrmm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void DTRMM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, double alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRMM(Element.F64(mRS), Side, TransA, A, B);
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtrmm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang                                        alpha, A.getID(mRS), B.getID(mRS), 0, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTRMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * B := alpha*op(A)*B   or   B := alpha*B*op(A)
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T  or  op(A) = A**H
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d4/d9b/ctrmm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void CTRMM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Float2 alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRMM(Element.F32_2(mRS), Side, TransA, A, B);
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctrmm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                         alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), 0, 0, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTRMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * B := alpha*op(A)*B   or   B := alpha*B*op(A)
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T  or  op(A) = A**H
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d8/de1/ztrmm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void ZTRMM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Double2 alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRMM(Element.F64_2(mRS), Side, TransA, A, B);
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztrmm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                   alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), 0, 0, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateTRSM(Element e, @Side int Side, @Transpose int TransA, Allocation A, Allocation B) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        int adim = -1, bM = -1, bN = -1;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSide(Side);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTranspose(TransA);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !B.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        adim = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (adim != A.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // this may be unnecessary, the restriction could potentially be relaxed
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // A needs to contain at least that symmetric matrix but could theoretically be larger
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // for now we assume adapters are sufficient, will reevaluate in the future
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called TRSM with a non-symmetric matrix A");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        bM = B.getType().getY();
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        bN = B.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Side == LEFT) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // A is M*M
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (adim != bM) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called TRSM with invalid matrix dimensions");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            // A is N*N
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (adim != bN) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called TRSM with invalid matrix dimensions");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * STRSM solves one of the matrix equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A)*X := alpha*B   or   X*op(A) := alpha*B
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d2/d8b/strsm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void STRSM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, float alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRSM(Element.F32(mRS), Side, TransA, A, B);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Single(getID(mRS), RsBlas_strsm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                        alpha, A.getID(mRS), B.getID(mRS), 0, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * DTRSM solves one of the matrix equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A)*X := alpha*B   or   X*op(A) := alpha*B
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/da7/dtrsm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void DTRSM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, double alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRSM(Element.F64(mRS), Side, TransA, A, B);
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Double(getID(mRS), RsBlas_dtrsm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                        alpha, A.getID(mRS), B.getID(mRS), 0, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CTRSM solves one of the matrix equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A)*X := alpha*B   or   X*op(A) := alpha*B
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T  or  op(A) = A**H
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/de/d30/ctrsm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void CTRSM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Float2 alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRSM(Element.F32_2(mRS), Side, TransA, A, B);
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_ctrsm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                         alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), 0, 0, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZTRSM solves one of the matrix equations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A)*X := alpha*B   or   X*op(A) := alpha*B
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * op(A) is one of  op(A) = A  or  op(A) = A**T  or  op(A) = A**H
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d1/d39/ztrsm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether matrix A is upper or lower triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param TransA The type of transpose applied to matrix A.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Diag Specifies whether or not A is unit triangular.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void ZTRSM(@Side int Side, @Uplo int Uplo, @Transpose int TransA, @Diag int Diag, Double2 alpha, Allocation A, Allocation B) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateDiag(Diag);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateTRSM(Element.F64_2(mRS), Side, TransA, A, B);
194679ed952b8205283ce71cab6d7250a47e946eMiao Wang        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_ztrsm, TransA, 0, Side, Uplo, Diag, B.getType().getY(), B.getType().getX(), 0,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                   alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), 0, 0, 0, 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateHEMM(Element e, @Side int Side, Allocation A, Allocation B, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateSide(Side);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !B.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !C.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        // A must be square; can potentially be relaxed similar to TRSM
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int adim = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (adim != A.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called HEMM with non-square A");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if ((Side == LEFT && adim != B.getType().getY()) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            (Side == RIGHT && adim != B.getType().getX())) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called HEMM with invalid B");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (B.getType().getX() != C.getType().getX() ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            B.getType().getY() != C.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called HEMM with mismatched B and C");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHEMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B + beta*C   or   C := alpha*B*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d3/d66/chemm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang    public void CHEMM(@Side int Side, @Uplo int Uplo, Float2 alpha, Allocation A, Allocation B, Float2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateHEMM(Element.F32_2(mRS), Side, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_chemm, 0, 0, Side, Uplo, 0, C.getType().getY(), C.getType().getX(), 0,
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang                                         alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHEMM performs one of the matrix-matrix operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B + beta*C   or   C := alpha*B*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d6/d3e/zhemm_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Side Specifies whether the symmetric matrix A appears on the left or right.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang    public void ZHEMM(@Side int Side, @Uplo int Uplo, Double2 alpha, Allocation A, Allocation B, Double2 beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        validateHEMM(Element.F64_2(mRS), Side, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zhemm, 0, 0, Side, Uplo, 0, C.getType().getY(), C.getType().getX(), 0,
4c472745221f724b01819fd1667b12f9d300f8cbMiao Wang                                   alpha.x, alpha.y, A.getID(mRS), B.getID(mRS), beta.x, beta.y, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateHERK(Element e, @Transpose int Trans, Allocation A, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !C.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateConjTranspose(Trans);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int cdim = C.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (cdim != C.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called HERK with non-square C");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Trans == NO_TRANSPOSE) {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (cdim != A.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called HERK with invalid A");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang            if (cdim != A.getType().getX()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called HERK with invalid A");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHERK performs one of the hermitian rank k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*A**H + beta*C   or   C := alpha*A**H*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d8/d52/cherk_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void CHERK(@Uplo int Uplo, @Transpose int Trans, float alpha, Allocation A, float beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateHERK(Element.F32_2(mRS), Trans, A, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int k = 0;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (Trans == CONJ_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cherk, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), k,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                         alpha, 0, A.getID(mRS), 0, beta, 0, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHERK performs one of the hermitian rank k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*A**H + beta*C   or   C := alpha*A**H*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d1/db1/zherk_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void ZHERK(@Uplo int Uplo, @Transpose int Trans, double alpha, Allocation A, double beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateHERK(Element.F64_2(mRS), Trans, A, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int k = 0;
37ae07c6435380e20ec0e6eaf6295800bdf9f24cMiao Wang        if (Trans == CONJ_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zherk, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), k,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                   alpha, 0, A.getID(mRS), 0, beta, 0, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    static void validateHER2K(Element e, @Transpose int Trans, Allocation A, Allocation B, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (!A.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !B.getType().getElement().isCompatible(e) ||
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            !C.getType().getElement().isCompatible(e)) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called BLAS with wrong Element type");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateConjTranspose(Trans);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int cdim = C.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (cdim != C.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called HER2K with non-square C");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Trans == NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            if (A.getType().getY() != cdim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called HER2K with invalid matrices");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            if (A.getType().getX() != cdim) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                throw new RSRuntimeException("Called HER2K with invalid matrices");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (A.getType().getX() != B.getType().getX() || A.getType().getY() != B.getType().getY()) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            throw new RSRuntimeException("Called HER2K with invalid A and B matrices");
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * CHER2K performs one of the hermitian rank 2k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B**H + conjg( alpha )*B*A**H + beta*C   or   C := alpha*A**H*B + conjg( alpha )*B**H*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d1/d82/cher2k_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F32_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void CHER2K(@Uplo int Uplo, @Transpose int Trans, Float2 alpha, Allocation A, Allocation B, float beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateHER2K(Element.F32_2(mRS), Trans, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int k = 0;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Trans == NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Complex(getID(mRS), RsBlas_cher2k, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), k, alpha.x, alpha.y,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                         A.getID(mRS), B.getID(mRS), beta, 0, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang    /**
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * ZHER2K performs one of the hermitian rank 2k operations
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * C := alpha*A*B**H + conjg( alpha )*B*A**H + beta*C   or   C := alpha*A**H*B + conjg( alpha )*B**H*A + beta*C
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Details: http://www.netlib.org/lapack/explore-html/d7/dfa/zher2k_8f.html
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Uplo Specifies whether the upper or lower triangular part of C is to be referenced.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param Trans The type of transpose applied to the operation.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param alpha The scalar alpha.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param beta The scalar beta.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#F64_2}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     */
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    public void ZHER2K(@Uplo int Uplo, @Transpose int Trans, Double2 alpha, Allocation A, Allocation B, double beta, Allocation C) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateUplo(Uplo);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        validateHER2K(Element.F64_2(mRS), Trans, A, B, C);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        int k = 0;
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        if (Trans == NO_TRANSPOSE) {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getX();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        } else {
25207df658d6a8a3e885c7017fcc25702363583cTim Murray            k = A.getType().getY();
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray        mRS.nScriptIntrinsicBLAS_Z(getID(mRS), RsBlas_zher2k, Trans, 0, 0, Uplo, 0, 0, C.getType().getX(), k, alpha.x, alpha.y,
25207df658d6a8a3e885c7017fcc25702363583cTim Murray                                   A.getID(mRS), B.getID(mRS), beta, 0, C.getID(mRS), 0, 0, 0, 0);
25207df658d6a8a3e885c7017fcc25702363583cTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray    /**
d7d413ad0bfaea2d4bb4adcd8011239c2f5f74aeMiao Wang     * 8-bit GEMM-like operation for neural networks: C = A * Transpose(B)
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * Calculations are done in 1.10.21 fixed-point format for the final output,
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * just before there's a shift down to drop the fractional parts. The output
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * values are gated to 0 to 255 to fit in a byte, but the 10-bit format
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * gives some headroom to avoid wrapping around on small overflows.
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang     *
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param A The input allocation contains matrix A, supported elements type {@link Element#U8}.
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang     * @param a_offset The offset for all values in matrix A, e.g A[i,j] = A[i,j] - a_offset. Value should be from 0 to 255.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param B The input allocation contains matrix B, supported elements type {@link Element#U8}.
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang     * @param b_offset The offset for all values in matrix B, e.g B[i,j] = B[i,j] - b_offset. Value should be from 0 to 255.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param C The input allocation contains matrix C, supported elements type {@link Element#U8}.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param c_offset The offset for all values in matrix C.
fb675a53966f8a1664405d2134665b67db071ec0Miao Wang     * @param c_mult The multiplier for all values in matrix C, e.g C[i,j] = (C[i,j] + c_offset) * c_mult.
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray     **/
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray    public void BNNM(Allocation A, int a_offset, Allocation B, int b_offset, Allocation C, int c_offset, int c_mult) {
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray        validateL3(Element.U8(mRS), NO_TRANSPOSE, TRANSPOSE, 0, A, B, C);
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang        if (a_offset < 0 || a_offset > 255) {
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang            throw new RSRuntimeException("Invalid a_offset passed to BNNM");
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang        }
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang        if (b_offset < 0 || b_offset > 255) {
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang            throw new RSRuntimeException("Invalid b_offset passed to BNNM");
6099ee6e081904e73e0fad331e326b0607b6b1dcMiao Wang        }
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray        int M = -1, N = -1, K = -1;
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray        M = A.getType().getY();
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray        N = B.getType().getY();
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray        K = A.getType().getX();
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray        mRS.nScriptIntrinsicBLAS_BNNM(getID(mRS), M, N, K, A.getID(mRS), a_offset, B.getID(mRS), b_offset, C.getID(mRS), c_offset, c_mult);
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray
9cb16a2f91c79845e5425fbf55f3b679fb18a4ddTim Murray    }
25207df658d6a8a3e885c7017fcc25702363583cTim Murray
25207df658d6a8a3e885c7017fcc25702363583cTim Murray}