-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathmatrix_blas_dense.t
114 lines (101 loc) · 3.22 KB
/
matrix_blas_dense.t
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
-- SPDX-FileCopyrightText: 2024 René Hiemstra <[email protected]>
-- SPDX-FileCopyrightText: 2024 Torsten Keßler <[email protected]>
--
-- SPDX-License-Identifier: MIT
import "terraform"
local matrix = require("matrix")
local concepts = require("concepts")
local blas = require("blas")
local vecblas = require("vector_blas")
local err = require("assert")
-- Installs BLAS-backed `apply` (matrix-vector) and `mul` (matrix-matrix)
-- methods on the dense matrix type M.
--
-- M must provide `M.eltype` and satisfy concepts.BLASDenseMatrix(M.eltype);
-- otherwise the assertion below fails while this function runs.
local function BLASDenseMatrixBase(M)

    local T = M.eltype
    local BLASDenseMatrix = concepts.BLASDenseMatrix(T)
    local BLASVector = concepts.BLASVector(T)
    local BLASNumber = concepts.BLASNumber
    local Complex = concepts.Complex
    local Bool = concepts.Bool
    local Integral = concepts.Integral

    -- check that the BLASDenseMatrix interface is implemented by M
    assert(BLASDenseMatrix(M), "CompileError: BLASDenseMatrix is not implemented.")

    -- Selects the BLAS flag used for a "transposed" operand: the conjugate
    -- transpose when the element type satisfies the Complex concept, the
    -- plain transpose otherwise. Returns a Terra quote to be spliced.
    local conjtrans = function(T)
        if Complex(T) then
            return `blas.ConjTrans
        else
            return `blas.Trans
        end
    end

    -- Matrix-vector product forwarded to blas.gemv in row-major layout.
    -- Presumably computes y = alpha * op(self) * x + beta * y as in CBLAS
    -- gemv (the wrapper is defined elsewhere -- confirm), where op is the
    -- (conjugate) transpose when `trans` is true and the identity otherwise.
    --   trans : apply the (conjugate) transpose of self
    --   alpha : scalar passed to gemv together with the matrix and x
    --   x     : input vector; length must match the columns of op(self)
    --   beta  : scalar passed to gemv together with y
    --   y     : output vector; length must match the rows of op(self)
    -- Dimension mismatches are reported through err.assert.
    terraform M:apply(trans : bool, alpha : T, x : &V1, beta : T, y : &V2)
        where {V1 : BLASVector, V2 : BLASVector}
        var nx, xptr, incx = x:getblasinfo()
        var ny, yptr, incy = y:getblasinfo()
        var rows, cols, aptr, ld = self:getblasdenseinfo()
        if trans then
            err.assert(cols == ny and rows == nx)
        else
            err.assert(rows == ny and cols == nx)
        end
        var flag = 0
        if trans then
            flag = [conjtrans(M.eltype)]
        else
            flag = blas.NoTrans
        end
        blas.gemv(blas.RowMajor, flag,
            rows, cols, alpha, aptr, ld, xptr, incx,
            beta, yptr, incy)
    end

    -- Matrix-matrix product forwarded to blas.gemm in row-major layout.
    -- Presumably computes self = beta * self + alpha * op(a) * op(b) as in
    -- CBLAS gemm (the wrapper is defined elsewhere -- confirm), where op is
    -- the (conjugate) transpose when the matching flag is true.
    --   beta   : scalar passed to gemm together with self
    --   alpha  : scalar passed to gemm together with a and b
    --   atrans : use the (conjugate) transpose of a
    --   a      : left operand
    --   btrans : use the (conjugate) transpose of b
    --   b      : right operand
    -- Dimension mismatches are reported through err.assert.
    terraform M:mul(beta : T, alpha : T, atrans : bool, a : &M1, btrans : bool, b : &M2)
        where {M1 : BLASDenseMatrix, M2 : BLASDenseMatrix}
        -- First two values are (rows, cols), as in M:apply above.
        var nc, mc, ptrc, ldc = self:getblasdenseinfo()
        var na, ma, ptra, lda = a:getblasdenseinfo()
        var nb, mb, ptrb, ldb = b:getblasdenseinfo()
        -- m and n are the shape of the result; k is the contracted dimension.
        var m : uint64 = nc
        var n : uint64 = mc
        var k : uint64
        if atrans and btrans then
            -- C (nc x mc) = A^T (ma x na) * B^T (mb x nb)
            err.assert(nc == ma)
            err.assert(mc == nb)
            err.assert(na == mb)
            k = na
        elseif atrans and not btrans then
            -- C (nc x mc) = A^T (ma x na) * B (nb x mb)
            err.assert(nc == ma)
            err.assert(mc == mb)
            err.assert(na == nb)
            k = na
        elseif not atrans and btrans then
            -- C (nc x mc) = A (na x ma) * B^T (mb x nb)
            err.assert(nc == na)
            err.assert(mc == nb)
            -- Inner dimensions: columns of A against columns of B.
            err.assert(ma == mb)
            k = ma
        else
            -- C (nc x mc) = A (na x ma) * B (nb x mb)
            err.assert(nc == na)
            err.assert(mc == mb)
            err.assert(ma == nb)
            k = ma
        end
        var fa = 0
        if atrans then
            fa = [ conjtrans(M.eltype) ]
        else
            fa = blas.NoTrans
        end
        var fb = 0
        if btrans then
            fb = [ conjtrans(M.eltype) ]
        else
            fb = blas.NoTrans
        end
        -- NOTE(review): the sizes are passed in the order (n, m, k), i.e.
        -- columns of C before rows of C. CBLAS gemm expects M (rows of C)
        -- before N (columns of C); confirm against the parameter order of the
        -- blas.gemm wrapper, since this matters whenever C is not square.
        blas.gemm(blas.RowMajor, fa, fb, n, m, k,
            alpha, ptra, lda, ptrb, ldb, beta, ptrc, ldc)
    end
end
-- Module exports: the function that adds the BLAS-backed methods to a
-- dense matrix type.
local exports = {}
exports.BLASDenseMatrixBase = BLASDenseMatrixBase
return exports