|
|
// Copyright ©2014 The Gonum Authors. All rights reserved.
|
|
|
// Use of this source code is governed by a BSD-style
|
|
|
// license that can be found in the LICENSE file.
|
|
|
|
|
|
package mat
|
|
|
|
|
|
import (
|
|
|
"sync"
|
|
|
|
|
|
"gonum.org/v1/gonum/blas"
|
|
|
"gonum.org/v1/gonum/blas/blas64"
|
|
|
)
|
|
|
|
|
|
var tab64 = [64]byte{
|
|
|
0x3f, 0x00, 0x3a, 0x01, 0x3b, 0x2f, 0x35, 0x02,
|
|
|
0x3c, 0x27, 0x30, 0x1b, 0x36, 0x21, 0x2a, 0x03,
|
|
|
0x3d, 0x33, 0x25, 0x28, 0x31, 0x12, 0x1c, 0x14,
|
|
|
0x37, 0x1e, 0x22, 0x0b, 0x2b, 0x0e, 0x16, 0x04,
|
|
|
0x3e, 0x39, 0x2e, 0x34, 0x26, 0x1a, 0x20, 0x29,
|
|
|
0x32, 0x24, 0x11, 0x13, 0x1d, 0x0a, 0x0d, 0x15,
|
|
|
0x38, 0x2d, 0x19, 0x1f, 0x23, 0x10, 0x09, 0x0c,
|
|
|
0x2c, 0x18, 0x0f, 0x08, 0x17, 0x07, 0x06, 0x05,
|
|
|
}
|
|
|
|
|
|
// bits returns the ceiling of base 2 log of v.
|
|
|
// Approach based on http://stackoverflow.com/a/11398748.
|
|
|
func bits(v uint64) byte {
|
|
|
if v == 0 {
|
|
|
return 0
|
|
|
}
|
|
|
v <<= 2
|
|
|
v--
|
|
|
v |= v >> 1
|
|
|
v |= v >> 2
|
|
|
v |= v >> 4
|
|
|
v |= v >> 8
|
|
|
v |= v >> 16
|
|
|
v |= v >> 32
|
|
|
return tab64[((v-(v>>1))*0x07EDD5E59A4E28C2)>>58] - 1
|
|
|
}
|
|
|
|
|
|
var (
|
|
|
// pool contains size stratified workspace Dense pools.
|
|
|
// Each pool element i returns sized matrices with a data
|
|
|
// slice capped at 1<<i.
|
|
|
pool [63]sync.Pool
|
|
|
|
|
|
// poolSym is the SymDense equivalent of pool.
|
|
|
poolSym [63]sync.Pool
|
|
|
|
|
|
// poolTri is the TriDense equivalent of pool.
|
|
|
poolTri [63]sync.Pool
|
|
|
|
|
|
// poolVec is the VecDense equivalent of pool.
|
|
|
poolVec [63]sync.Pool
|
|
|
|
|
|
// poolFloats is the []float64 equivalent of pool.
|
|
|
poolFloats [63]sync.Pool
|
|
|
|
|
|
// poolInts is the []int equivalent of pool.
|
|
|
poolInts [63]sync.Pool
|
|
|
)
|
|
|
|
|
|
func init() {
|
|
|
for i := range pool {
|
|
|
l := 1 << uint(i)
|
|
|
pool[i].New = func() interface{} {
|
|
|
return &Dense{mat: blas64.General{
|
|
|
Data: make([]float64, l),
|
|
|
}}
|
|
|
}
|
|
|
poolSym[i].New = func() interface{} {
|
|
|
return &SymDense{mat: blas64.Symmetric{
|
|
|
Uplo: blas.Upper,
|
|
|
Data: make([]float64, l),
|
|
|
}}
|
|
|
}
|
|
|
poolTri[i].New = func() interface{} {
|
|
|
return &TriDense{mat: blas64.Triangular{
|
|
|
Data: make([]float64, l),
|
|
|
}}
|
|
|
}
|
|
|
poolVec[i].New = func() interface{} {
|
|
|
return &VecDense{mat: blas64.Vector{
|
|
|
Inc: 1,
|
|
|
Data: make([]float64, l),
|
|
|
}}
|
|
|
}
|
|
|
poolFloats[i].New = func() interface{} {
|
|
|
s := make([]float64, l)
|
|
|
return &s
|
|
|
}
|
|
|
poolInts[i].New = func() interface{} {
|
|
|
s := make([]int, l)
|
|
|
return &s
|
|
|
}
|
|
|
}
|
|
|
}
|
|
|
|
|
|
// getWorkspace returns a *Dense of size r×c and a data slice
|
|
|
// with a cap that is less than 2*r*c. If clear is true, the
|
|
|
// data slice visible through the Matrix interface is zeroed.
|
|
|
func getWorkspace(r, c int, clear bool) *Dense {
|
|
|
l := uint64(r * c)
|
|
|
w := pool[bits(l)].Get().(*Dense)
|
|
|
w.mat.Data = w.mat.Data[:l]
|
|
|
if clear {
|
|
|
zero(w.mat.Data)
|
|
|
}
|
|
|
w.mat.Rows = r
|
|
|
w.mat.Cols = c
|
|
|
w.mat.Stride = c
|
|
|
w.capRows = r
|
|
|
w.capCols = c
|
|
|
return w
|
|
|
}
|
|
|
|
|
|
// putWorkspace replaces a used *Dense into the appropriate size
|
|
|
// workspace pool. putWorkspace must not be called with a matrix
|
|
|
// where references to the underlying data slice have been kept.
|
|
|
func putWorkspace(w *Dense) {
|
|
|
pool[bits(uint64(cap(w.mat.Data)))].Put(w)
|
|
|
}
|
|
|
|
|
|
// getWorkspaceSym returns a *SymDense of size n and a cap that
|
|
|
// is less than 2*n. If clear is true, the data slice visible
|
|
|
// through the Matrix interface is zeroed.
|
|
|
func getWorkspaceSym(n int, clear bool) *SymDense {
|
|
|
l := uint64(n)
|
|
|
l *= l
|
|
|
s := poolSym[bits(l)].Get().(*SymDense)
|
|
|
s.mat.Data = s.mat.Data[:l]
|
|
|
if clear {
|
|
|
zero(s.mat.Data)
|
|
|
}
|
|
|
s.mat.N = n
|
|
|
s.mat.Stride = n
|
|
|
s.cap = n
|
|
|
return s
|
|
|
}
|
|
|
|
|
|
// putWorkspaceSym replaces a used *SymDense into the appropriate size
|
|
|
// workspace pool. putWorkspaceSym must not be called with a matrix
|
|
|
// where references to the underlying data slice have been kept.
|
|
|
func putWorkspaceSym(s *SymDense) {
|
|
|
poolSym[bits(uint64(cap(s.mat.Data)))].Put(s)
|
|
|
}
|
|
|
|
|
|
// getWorkspaceTri returns a *TriDense of size n and a cap that
|
|
|
// is less than 2*n. If clear is true, the data slice visible
|
|
|
// through the Matrix interface is zeroed.
|
|
|
func getWorkspaceTri(n int, kind TriKind, clear bool) *TriDense {
|
|
|
l := uint64(n)
|
|
|
l *= l
|
|
|
t := poolTri[bits(l)].Get().(*TriDense)
|
|
|
t.mat.Data = t.mat.Data[:l]
|
|
|
if clear {
|
|
|
zero(t.mat.Data)
|
|
|
}
|
|
|
t.mat.N = n
|
|
|
t.mat.Stride = n
|
|
|
if kind == Upper {
|
|
|
t.mat.Uplo = blas.Upper
|
|
|
} else if kind == Lower {
|
|
|
t.mat.Uplo = blas.Lower
|
|
|
} else {
|
|
|
panic(ErrTriangle)
|
|
|
}
|
|
|
t.mat.Diag = blas.NonUnit
|
|
|
t.cap = n
|
|
|
return t
|
|
|
}
|
|
|
|
|
|
// putWorkspaceTri replaces a used *TriDense into the appropriate size
|
|
|
// workspace pool. putWorkspaceTri must not be called with a matrix
|
|
|
// where references to the underlying data slice have been kept.
|
|
|
func putWorkspaceTri(t *TriDense) {
|
|
|
poolTri[bits(uint64(cap(t.mat.Data)))].Put(t)
|
|
|
}
|
|
|
|
|
|
// getWorkspaceVec returns a *VecDense of length n and a cap that
|
|
|
// is less than 2*n. If clear is true, the data slice visible
|
|
|
// through the Matrix interface is zeroed.
|
|
|
func getWorkspaceVec(n int, clear bool) *VecDense {
|
|
|
l := uint64(n)
|
|
|
v := poolVec[bits(l)].Get().(*VecDense)
|
|
|
v.mat.Data = v.mat.Data[:l]
|
|
|
if clear {
|
|
|
zero(v.mat.Data)
|
|
|
}
|
|
|
v.mat.N = n
|
|
|
return v
|
|
|
}
|
|
|
|
|
|
// putWorkspaceVec replaces a used *VecDense into the appropriate size
|
|
|
// workspace pool. putWorkspaceVec must not be called with a matrix
|
|
|
// where references to the underlying data slice have been kept.
|
|
|
func putWorkspaceVec(v *VecDense) {
|
|
|
poolVec[bits(uint64(cap(v.mat.Data)))].Put(v)
|
|
|
}
|
|
|
|
|
|
// getFloats returns a []float64 of length l and a cap that is
|
|
|
// less than 2*l. If clear is true, the slice visible is zeroed.
|
|
|
func getFloats(l int, clear bool) []float64 {
|
|
|
w := *poolFloats[bits(uint64(l))].Get().(*[]float64)
|
|
|
w = w[:l]
|
|
|
if clear {
|
|
|
zero(w)
|
|
|
}
|
|
|
return w
|
|
|
}
|
|
|
|
|
|
// putFloats replaces a used []float64 into the appropriate size
|
|
|
// workspace pool. putFloats must not be called with a slice
|
|
|
// where references to the underlying data have been kept.
|
|
|
func putFloats(w []float64) {
|
|
|
poolFloats[bits(uint64(cap(w)))].Put(&w)
|
|
|
}
|
|
|
|
|
|
// getInts returns a []ints of length l and a cap that is
|
|
|
// less than 2*l. If clear is true, the slice visible is zeroed.
|
|
|
func getInts(l int, clear bool) []int {
|
|
|
w := *poolInts[bits(uint64(l))].Get().(*[]int)
|
|
|
w = w[:l]
|
|
|
if clear {
|
|
|
for i := range w {
|
|
|
w[i] = 0
|
|
|
}
|
|
|
}
|
|
|
return w
|
|
|
}
|
|
|
|
|
|
// putInts replaces a used []int into the appropriate size
|
|
|
// workspace pool. putInts must not be called with a slice
|
|
|
// where references to the underlying data have been kept.
|
|
|
func putInts(w []int) {
|
|
|
poolInts[bits(uint64(cap(w)))].Put(&w)
|
|
|
}
|