major optimization by packing wavefront values
This commit is contained in:
parent
8679c51fb0
commit
3da3ddf10c
@ -1,61 +1,5 @@
|
|||||||
package wfa
|
package wfa
|
||||||
|
|
||||||
import (
|
|
||||||
"golang.org/x/exp/constraints"
|
|
||||||
)
|
|
||||||
|
|
||||||
type Wavefront[T constraints.Integer] struct { // since wavefronts store diag distance, they should never be negative, and traceback data can be stored as uint8
|
|
||||||
data []T
|
|
||||||
valid []bool
|
|
||||||
lo int
|
|
||||||
}
|
|
||||||
|
|
||||||
func NewWavefront[T constraints.Integer](lo int, hi int) *Wavefront[T] {
|
|
||||||
a := &Wavefront[T]{}
|
|
||||||
|
|
||||||
a.lo = lo
|
|
||||||
size := a.TranslateIndex(hi)
|
|
||||||
|
|
||||||
newData := make([]T, size+1)
|
|
||||||
a.data = newData
|
|
||||||
|
|
||||||
newValid := make([]bool, size+1)
|
|
||||||
a.valid = newValid
|
|
||||||
|
|
||||||
return a
|
|
||||||
}
|
|
||||||
|
|
||||||
func (a *Wavefront[T]) TranslateIndex(idx int) int {
|
|
||||||
return idx - a.lo
|
|
||||||
}
|
|
||||||
|
|
||||||
func (a *Wavefront[T]) Valid(idx int) bool {
|
|
||||||
actualIdx := a.TranslateIndex(idx)
|
|
||||||
return 0 <= actualIdx && actualIdx < len(a.data) && a.valid[actualIdx]
|
|
||||||
}
|
|
||||||
|
|
||||||
func (a *Wavefront[T]) Get(idx int) T {
|
|
||||||
actualIdx := a.TranslateIndex(idx)
|
|
||||||
if 0 <= actualIdx && actualIdx < len(a.data) { // idx is in the slice
|
|
||||||
return a.data[actualIdx]
|
|
||||||
} else { // idx is out of the slice
|
|
||||||
return 0
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
func (a *Wavefront[T]) Set(idx int, value T) {
|
|
||||||
actualIdx := a.TranslateIndex(idx)
|
|
||||||
|
|
||||||
/* in theory idx is always in bounds because the wavefront is preallocated
|
|
||||||
if actualIdx < 0 || actualIdx >= len(a.data) {
|
|
||||||
return
|
|
||||||
}
|
|
||||||
*/
|
|
||||||
|
|
||||||
a.data[actualIdx] = value
|
|
||||||
a.valid[actualIdx] = true
|
|
||||||
}
|
|
||||||
|
|
||||||
type PositiveSlice[T any] struct {
|
type PositiveSlice[T any] struct {
|
||||||
data []T
|
data []T
|
||||||
valid []bool
|
valid []bool
|
||||||
|
12
pkg/debug.go
12
pkg/debug.go
@ -1,5 +1,3 @@
|
|||||||
//go:build debug
|
|
||||||
|
|
||||||
package wfa
|
package wfa
|
||||||
|
|
||||||
import (
|
import (
|
||||||
@ -46,8 +44,9 @@ func (w *WavefrontComponent) String(score int) string {
|
|||||||
hi := w.hi.Get(i)
|
hi := w.hi.Get(i)
|
||||||
// print out wavefront matrix
|
// print out wavefront matrix
|
||||||
for k := min_lo; k <= max_hi; k++ {
|
for k := min_lo; k <= max_hi; k++ {
|
||||||
if w.W.Valid(i) && w.W.Get(i).Valid(k) {
|
valid, val, _ := UnpackWavefrontValue(w.W.Get(i).Get(k))
|
||||||
s = s + fmt.Sprintf("%02d", w.W.Get(i).Get(k))
|
if valid {
|
||||||
|
s = s + fmt.Sprintf("%02d", val)
|
||||||
} else if k < lo || k > hi {
|
} else if k < lo || k > hi {
|
||||||
s = s + "--"
|
s = s + "--"
|
||||||
} else {
|
} else {
|
||||||
@ -61,8 +60,9 @@ func (w *WavefrontComponent) String(score int) string {
|
|||||||
s = s + "]\t["
|
s = s + "]\t["
|
||||||
// print out traceback matrix
|
// print out traceback matrix
|
||||||
for k := min_lo; k <= max_hi; k++ {
|
for k := min_lo; k <= max_hi; k++ {
|
||||||
if w.A.Valid(i) && w.A.Get(i).Valid(k) {
|
valid, _, tb := UnpackWavefrontValue(w.W.Get(i).Get(k))
|
||||||
s = s + traceback_str[w.A.Get(i).Get(k)]
|
if valid {
|
||||||
|
s = s + traceback_str[tb]
|
||||||
} else if k < lo || k > hi {
|
} else if k < lo || k > hi {
|
||||||
s = s + "--"
|
s = s + "--"
|
||||||
} else {
|
} else {
|
||||||
|
130
pkg/types.go
130
pkg/types.go
@ -12,10 +12,10 @@ type Penalty struct {
|
|||||||
E int
|
E int
|
||||||
}
|
}
|
||||||
|
|
||||||
type traceback byte
|
type Traceback byte
|
||||||
|
|
||||||
const (
|
const (
|
||||||
OpenIns traceback = iota
|
OpenIns Traceback = iota
|
||||||
ExtdIns
|
ExtdIns
|
||||||
OpenDel
|
OpenDel
|
||||||
ExtdDel
|
ExtdDel
|
||||||
@ -25,19 +25,87 @@ const (
|
|||||||
End
|
End
|
||||||
)
|
)
|
||||||
|
|
||||||
type WavefrontComponent struct {
|
// bitpacked wavefront values with 1 valid bit, 3 traceback bits, and 28 bits for the diag distance
|
||||||
lo *PositiveSlice[int] // lo for each wavefront
|
// technically this restricts to solutions within 268 million score but that should be sufficient for most cases
|
||||||
hi *PositiveSlice[int] // hi for each wavefront
|
type WavefrontValue uint32
|
||||||
W *PositiveSlice[*Wavefront[int]] // wavefront diag distance for each wavefront
|
|
||||||
A *PositiveSlice[*Wavefront[traceback]] // compact CIGAR for backtrace for each wavefront
|
// TODO: add 64 bit packed value in case more than 268 million score is needed
|
||||||
|
|
||||||
|
// PackWavefrontValue: packs a diag value and traceback into a WavefrontValue
|
||||||
|
func PackWavefrontValue(value uint32, traceback Traceback) WavefrontValue {
|
||||||
|
valueBM := value & 0x0FFF_FFFF
|
||||||
|
tracebackBM := uint32(traceback&0x0000_0007) << 28
|
||||||
|
return WavefrontValue(0x8000_0000 | valueBM | tracebackBM)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// UnpackWavefrontValue: opens a WavefrontValue into a valid bool, diag value and traceback
|
||||||
|
func UnpackWavefrontValue(wf WavefrontValue) (bool, uint32, Traceback) {
|
||||||
|
valueBM := uint32(wf & 0x0FFF_FFFF)
|
||||||
|
tracebackBM := uint8(wf & 0x7000_0000 >> 28)
|
||||||
|
validBM := wf&0x8000_0000 != 0
|
||||||
|
return validBM, valueBM, Traceback(tracebackBM)
|
||||||
|
}
|
||||||
|
|
||||||
|
// Wavefront: stores a single wavefront, stores wavefront's lo value and hi is naturally lo + len(data)
|
||||||
|
type Wavefront struct { // since wavefronts store diag distance, they should never be negative, and traceback data can be stored as uint8
|
||||||
|
data []WavefrontValue
|
||||||
|
lo int
|
||||||
|
}
|
||||||
|
|
||||||
|
// NewWavefront: returns a new wavefront with size accomodating lo and hi (inclusive)
|
||||||
|
func NewWavefront(lo int, hi int) *Wavefront {
|
||||||
|
a := &Wavefront{}
|
||||||
|
|
||||||
|
a.lo = lo
|
||||||
|
size := a.TranslateIndex(hi)
|
||||||
|
|
||||||
|
newData := make([]WavefrontValue, size+1)
|
||||||
|
a.data = newData
|
||||||
|
|
||||||
|
return a
|
||||||
|
}
|
||||||
|
|
||||||
|
// TranslateIndex: utility function for getting the data index given a diagonal
|
||||||
|
func (a *Wavefront) TranslateIndex(diagonal int) int {
|
||||||
|
return diagonal - a.lo
|
||||||
|
}
|
||||||
|
|
||||||
|
// Get: returns WavefrontValue for given diagonal
|
||||||
|
func (a *Wavefront) Get(diagonal int) WavefrontValue {
|
||||||
|
actualIdx := a.TranslateIndex(diagonal)
|
||||||
|
if 0 <= actualIdx && actualIdx < len(a.data) { // idx is in the slice
|
||||||
|
return a.data[actualIdx]
|
||||||
|
} else { // idx is out of the slice
|
||||||
|
return 0
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Set: the diagonal to a WavefrontValue
|
||||||
|
func (a *Wavefront) Set(diagonal int, value WavefrontValue) {
|
||||||
|
actualIdx := a.TranslateIndex(diagonal)
|
||||||
|
|
||||||
|
/* in theory idx is always in bounds because the wavefront is preallocated
|
||||||
|
if actualIdx < 0 || actualIdx >= len(a.data) {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
*/
|
||||||
|
|
||||||
|
a.data[actualIdx] = value
|
||||||
|
}
|
||||||
|
|
||||||
|
// WavefrontComponent: each M/I/D wavefront matrix including the wavefront data, lo and hi
|
||||||
|
type WavefrontComponent struct {
|
||||||
|
lo *PositiveSlice[int] // lo for each wavefront
|
||||||
|
hi *PositiveSlice[int] // hi for each wavefront
|
||||||
|
W *PositiveSlice[*Wavefront] // wavefront diag distance and traceback for each wavefront
|
||||||
|
}
|
||||||
|
|
||||||
|
// NewWavefrontComponent: returns initialized WavefrontComponent
|
||||||
func NewWavefrontComponent(preallocateSize int) WavefrontComponent {
|
func NewWavefrontComponent(preallocateSize int) WavefrontComponent {
|
||||||
// new wavefront component = {
|
// new wavefront component = {
|
||||||
// lo = [0]
|
// lo = [0]
|
||||||
// hi = [0]
|
// hi = [0]
|
||||||
// W = []
|
// W = []
|
||||||
// A = []
|
|
||||||
// }
|
// }
|
||||||
w := WavefrontComponent{
|
w := WavefrontComponent{
|
||||||
lo: &PositiveSlice[int]{
|
lo: &PositiveSlice[int]{
|
||||||
@ -48,16 +116,9 @@ func NewWavefrontComponent(preallocateSize int) WavefrontComponent {
|
|||||||
data: []int{0},
|
data: []int{0},
|
||||||
valid: []bool{true},
|
valid: []bool{true},
|
||||||
},
|
},
|
||||||
W: &PositiveSlice[*Wavefront[int]]{
|
W: &PositiveSlice[*Wavefront]{
|
||||||
defaultValue: &Wavefront[int]{
|
defaultValue: &Wavefront{
|
||||||
data: []int{0},
|
data: []WavefrontValue{0},
|
||||||
valid: []bool{false},
|
|
||||||
},
|
|
||||||
},
|
|
||||||
A: &PositiveSlice[*Wavefront[traceback]]{
|
|
||||||
defaultValue: &Wavefront[traceback]{
|
|
||||||
data: []traceback{0},
|
|
||||||
valid: []bool{false},
|
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
}
|
}
|
||||||
@ -65,32 +126,21 @@ func NewWavefrontComponent(preallocateSize int) WavefrontComponent {
|
|||||||
w.lo.Preallocate(preallocateSize)
|
w.lo.Preallocate(preallocateSize)
|
||||||
w.hi.Preallocate(preallocateSize)
|
w.hi.Preallocate(preallocateSize)
|
||||||
w.W.Preallocate(preallocateSize)
|
w.W.Preallocate(preallocateSize)
|
||||||
w.A.Preallocate(preallocateSize)
|
|
||||||
|
|
||||||
return w
|
return w
|
||||||
}
|
}
|
||||||
|
|
||||||
// get value for wavefront=score, diag=k => returns ok, value
|
// GetVal: get value for wavefront=score, diag=k => returns ok, value, traceback
|
||||||
func (w *WavefrontComponent) GetVal(score int, k int) (bool, int) {
|
func (w *WavefrontComponent) GetVal(score int, k int) (bool, uint32, Traceback) {
|
||||||
return w.W.Valid(score) && w.W.Get(score).Valid(k), w.W.Get(score).Get(k)
|
return UnpackWavefrontValue(w.W.Get(score).Get(k))
|
||||||
}
|
}
|
||||||
|
|
||||||
// set value for wavefront=score, diag=k
|
// SetVal: set value, traceback for wavefront=score, diag=k
|
||||||
func (w *WavefrontComponent) SetVal(score int, k int, val int) {
|
func (w *WavefrontComponent) SetVal(score int, k int, val uint32, tb Traceback) {
|
||||||
w.W.Get(score).Set(k, val)
|
w.W.Get(score).Set(k, PackWavefrontValue(val, tb))
|
||||||
}
|
}
|
||||||
|
|
||||||
// get alignment traceback for wavefront=score, diag=k => returns ok, value
|
// GetLoHi: get lo and hi for wavefront=score
|
||||||
func (w *WavefrontComponent) GetTraceback(score int, k int) (bool, traceback) {
|
|
||||||
return w.A.Valid(score) && w.A.Get(score).Valid(k), w.A.Get(score).Get(k)
|
|
||||||
}
|
|
||||||
|
|
||||||
// set alignment traceback for wavefront=score, diag=k
|
|
||||||
func (w *WavefrontComponent) SetTraceback(score int, k int, val traceback) {
|
|
||||||
w.A.Get(score).Set(k, val)
|
|
||||||
}
|
|
||||||
|
|
||||||
// get hi for wavefront=score
|
|
||||||
func (w *WavefrontComponent) GetLoHi(score int) (bool, int, int) {
|
func (w *WavefrontComponent) GetLoHi(score int) (bool, int, int) {
|
||||||
// if lo[score] and hi[score] are valid
|
// if lo[score] and hi[score] are valid
|
||||||
if w.lo.Valid(score) && w.hi.Valid(score) {
|
if w.lo.Valid(score) && w.hi.Valid(score) {
|
||||||
@ -101,18 +151,14 @@ func (w *WavefrontComponent) GetLoHi(score int) (bool, int, int) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// set hi for wavefront=score
|
// SetLoHi: set lo and hi for wavefront=score
|
||||||
func (w *WavefrontComponent) SetLoHi(score int, lo int, hi int) {
|
func (w *WavefrontComponent) SetLoHi(score int, lo int, hi int) {
|
||||||
// lo[score] = lo
|
// lo[score] = lo
|
||||||
w.lo.Set(score, lo)
|
w.lo.Set(score, lo)
|
||||||
// hi[score] = hi
|
// hi[score] = hi
|
||||||
w.hi.Set(score, hi)
|
w.hi.Set(score, hi)
|
||||||
|
|
||||||
// preemptively setup w.A
|
|
||||||
a := NewWavefront[traceback](lo, hi)
|
|
||||||
w.A.Set(score, a)
|
|
||||||
|
|
||||||
// preemptively setup w.W
|
// preemptively setup w.W
|
||||||
b := NewWavefront[int](lo, hi)
|
b := NewWavefront(lo, hi)
|
||||||
w.W.Set(score, b)
|
w.W.Set(score, b)
|
||||||
}
|
}
|
||||||
|
53
pkg/utils.go
53
pkg/utils.go
@ -3,25 +3,27 @@ package wfa
|
|||||||
import (
|
import (
|
||||||
"math"
|
"math"
|
||||||
"unicode/utf8"
|
"unicode/utf8"
|
||||||
|
|
||||||
|
"golang.org/x/exp/constraints"
|
||||||
)
|
)
|
||||||
|
|
||||||
func SafeMin(values []int, idx int) int {
|
func SafeMin[T constraints.Integer](values []T, idx int) T {
|
||||||
return values[idx]
|
return values[idx]
|
||||||
}
|
}
|
||||||
|
|
||||||
func SafeMax(values []int, idx int) int {
|
func SafeMax[T constraints.Integer](values []T, idx int) T {
|
||||||
return values[idx]
|
return values[idx]
|
||||||
}
|
}
|
||||||
|
|
||||||
func SafeArgMax(valids []bool, values []int) (bool, int) {
|
func SafeArgMax[T constraints.Integer](valids []bool, values []T) (bool, int) {
|
||||||
hasValid := false
|
hasValid := false
|
||||||
maxIndex := 0
|
maxIndex := 0
|
||||||
maxValue := math.MinInt
|
maxValue := math.MinInt
|
||||||
for i := 0; i < len(valids); i++ {
|
for i := 0; i < len(valids); i++ {
|
||||||
if valids[i] && values[i] > maxValue {
|
if valids[i] && int(values[i]) > maxValue {
|
||||||
hasValid = true
|
hasValid = true
|
||||||
maxIndex = i
|
maxIndex = i
|
||||||
maxValue = values[i]
|
maxValue = int(values[i])
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if hasValid {
|
if hasValid {
|
||||||
@ -31,15 +33,15 @@ func SafeArgMax(valids []bool, values []int) (bool, int) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
func SafeArgMin(valids []bool, values []int) (bool, int) {
|
func SafeArgMin[T constraints.Integer](valids []bool, values []T) (bool, int) {
|
||||||
hasValid := false
|
hasValid := false
|
||||||
minIndex := 0
|
minIndex := 0
|
||||||
minValue := math.MaxInt
|
minValue := math.MaxInt
|
||||||
for i := 0; i < len(valids); i++ {
|
for i := 0; i < len(valids); i++ {
|
||||||
if valids[i] && values[i] < minValue {
|
if valids[i] && int(values[i]) < minValue {
|
||||||
hasValid = true
|
hasValid = true
|
||||||
minIndex = i
|
minIndex = i
|
||||||
minValue = values[i]
|
minValue = int(values[i])
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if hasValid {
|
if hasValid {
|
||||||
@ -98,14 +100,13 @@ func NextI(M WavefrontComponent, I WavefrontComponent, score int, k int, penalti
|
|||||||
o := penalties.O
|
o := penalties.O
|
||||||
e := penalties.E
|
e := penalties.E
|
||||||
|
|
||||||
a_ok, a := M.GetVal(score-o-e, k-1)
|
a_ok, a, _ := M.GetVal(score-o-e, k-1)
|
||||||
b_ok, b := I.GetVal(score-e, k-1)
|
b_ok, b, _ := I.GetVal(score-e, k-1)
|
||||||
|
|
||||||
ok, nextITraceback := SafeArgMax([]bool{a_ok, b_ok}, []int{a, b})
|
ok, nextITraceback := SafeArgMax([]bool{a_ok, b_ok}, []uint32{a, b})
|
||||||
nextIVal := SafeMax([]int{a, b}, nextITraceback) + 1 // important that the +1 is here
|
nextIVal := SafeMax([]uint32{a, b}, nextITraceback) + 1 // important that the +1 is here
|
||||||
if ok {
|
if ok {
|
||||||
I.SetVal(score, k, nextIVal)
|
I.SetVal(score, k, nextIVal, []Traceback{OpenIns, ExtdIns}[nextITraceback])
|
||||||
I.SetTraceback(score, k, []traceback{OpenIns, ExtdIns}[nextITraceback])
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -113,33 +114,31 @@ func NextD(M WavefrontComponent, D WavefrontComponent, score int, k int, penalti
|
|||||||
o := penalties.O
|
o := penalties.O
|
||||||
e := penalties.E
|
e := penalties.E
|
||||||
|
|
||||||
a_ok, a := M.GetVal(score-o-e, k+1)
|
a_ok, a, _ := M.GetVal(score-o-e, k+1)
|
||||||
b_ok, b := D.GetVal(score-e, k+1)
|
b_ok, b, _ := D.GetVal(score-e, k+1)
|
||||||
|
|
||||||
ok, nextDTraceback := SafeArgMax(
|
ok, nextDTraceback := SafeArgMax(
|
||||||
[]bool{a_ok, b_ok},
|
[]bool{a_ok, b_ok},
|
||||||
[]int{a, b},
|
[]uint32{a, b},
|
||||||
)
|
)
|
||||||
nextDVal := SafeMax([]int{a, b}, nextDTraceback) // nothing special
|
nextDVal := SafeMax([]uint32{a, b}, nextDTraceback) // nothing special
|
||||||
if ok {
|
if ok {
|
||||||
D.SetVal(score, k, nextDVal)
|
D.SetVal(score, k, nextDVal, []Traceback{OpenDel, ExtdDel}[nextDTraceback])
|
||||||
D.SetTraceback(score, k, []traceback{OpenDel, ExtdDel}[nextDTraceback])
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
func NextM(M WavefrontComponent, I WavefrontComponent, D WavefrontComponent, score int, k int, penalties Penalty) {
|
func NextM(M WavefrontComponent, I WavefrontComponent, D WavefrontComponent, score int, k int, penalties Penalty) {
|
||||||
x := penalties.X
|
x := penalties.X
|
||||||
|
|
||||||
a_ok, a := M.GetVal(score-x, k)
|
a_ok, a, _ := M.GetVal(score-x, k)
|
||||||
a++ // important to have +1 here
|
a++ // important to have +1 here
|
||||||
b_ok, b := I.GetVal(score, k)
|
b_ok, b, _ := I.GetVal(score, k)
|
||||||
c_ok, c := D.GetVal(score, k)
|
c_ok, c, _ := D.GetVal(score, k)
|
||||||
|
|
||||||
ok, nextMTraceback := SafeArgMax([]bool{a_ok, b_ok, c_ok}, []int{a, b, c})
|
ok, nextMTraceback := SafeArgMax([]bool{a_ok, b_ok, c_ok}, []uint32{a, b, c})
|
||||||
nextMVal := SafeMax([]int{a, b, c}, nextMTraceback)
|
nextMVal := SafeMax([]uint32{a, b, c}, nextMTraceback)
|
||||||
|
|
||||||
if ok {
|
if ok {
|
||||||
M.SetVal(score, k, nextMVal)
|
M.SetVal(score, k, nextMVal, []Traceback{Sub, Ins, Del}[nextMTraceback])
|
||||||
M.SetTraceback(score, k, []traceback{Sub, Ins, Del}[nextMTraceback])
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
30
pkg/wfa.go
30
pkg/wfa.go
@ -4,19 +4,18 @@ func WFAlign(s1 string, s2 string, penalties Penalty, doCIGAR bool) Result {
|
|||||||
n := len(s1)
|
n := len(s1)
|
||||||
m := len(s2)
|
m := len(s2)
|
||||||
A_k := m - n
|
A_k := m - n
|
||||||
A_offset := m
|
A_offset := uint32(m)
|
||||||
score := 0
|
score := 0
|
||||||
estimatedScore := (max(n, m) * max(penalties.M, penalties.X, penalties.O, penalties.E)) / 4
|
estimatedScore := (max(n, m) * max(penalties.M, penalties.X, penalties.O, penalties.E)) / 4
|
||||||
M := NewWavefrontComponent(estimatedScore)
|
M := NewWavefrontComponent(estimatedScore)
|
||||||
M.SetLoHi(0, 0, 0)
|
M.SetLoHi(0, 0, 0)
|
||||||
M.SetVal(0, 0, 0)
|
M.SetVal(0, 0, 0, End)
|
||||||
M.SetTraceback(0, 0, End)
|
|
||||||
I := NewWavefrontComponent(estimatedScore)
|
I := NewWavefrontComponent(estimatedScore)
|
||||||
D := NewWavefrontComponent(estimatedScore)
|
D := NewWavefrontComponent(estimatedScore)
|
||||||
|
|
||||||
for {
|
for {
|
||||||
WFExtend(M, s1, n, s2, m, score)
|
WFExtend(M, s1, n, s2, m, score)
|
||||||
ok, val := M.GetVal(score, A_k)
|
ok, val, _ := M.GetVal(score, A_k)
|
||||||
if ok && val >= A_offset {
|
if ok && val >= A_offset {
|
||||||
break
|
break
|
||||||
}
|
}
|
||||||
@ -40,7 +39,8 @@ func WFExtend(M WavefrontComponent, s1 string, n int, s2 string, m int, score in
|
|||||||
for k := lo; k <= hi; k++ {
|
for k := lo; k <= hi; k++ {
|
||||||
// v = M[score][k] - k
|
// v = M[score][k] - k
|
||||||
// h = M[score][k]
|
// h = M[score][k]
|
||||||
ok, h := M.GetVal(score, k)
|
ok, hu, _ := M.GetVal(score, k)
|
||||||
|
h := int(hu)
|
||||||
v := h - k
|
v := h - k
|
||||||
|
|
||||||
// exit early if v or h are invalid
|
// exit early if v or h are invalid
|
||||||
@ -48,8 +48,8 @@ func WFExtend(M WavefrontComponent, s1 string, n int, s2 string, m int, score in
|
|||||||
continue
|
continue
|
||||||
}
|
}
|
||||||
for v < n && h < m && s1[v] == s2[h] {
|
for v < n && h < m && s1[v] == s2[h] {
|
||||||
_, val := M.GetVal(score, k)
|
_, val, tb := M.GetVal(score, k)
|
||||||
M.SetVal(score, k, val+1)
|
M.SetVal(score, k, val+1, tb)
|
||||||
v++
|
v++
|
||||||
h++
|
h++
|
||||||
}
|
}
|
||||||
@ -75,7 +75,7 @@ func WFBacktrace(M WavefrontComponent, I WavefrontComponent, D WavefrontComponen
|
|||||||
CIGAR_rev := ""
|
CIGAR_rev := ""
|
||||||
tb_s := score
|
tb_s := score
|
||||||
tb_k := A_k
|
tb_k := A_k
|
||||||
_, current_traceback := M.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback := M.GetVal(tb_s, tb_k)
|
||||||
done := false
|
done := false
|
||||||
|
|
||||||
for !done {
|
for !done {
|
||||||
@ -84,31 +84,31 @@ func WFBacktrace(M WavefrontComponent, I WavefrontComponent, D WavefrontComponen
|
|||||||
case OpenIns:
|
case OpenIns:
|
||||||
tb_s = tb_s - o - e
|
tb_s = tb_s - o - e
|
||||||
tb_k = tb_k - 1
|
tb_k = tb_k - 1
|
||||||
_, current_traceback = M.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback = M.GetVal(tb_s, tb_k)
|
||||||
case ExtdIns:
|
case ExtdIns:
|
||||||
tb_s = tb_s - e
|
tb_s = tb_s - e
|
||||||
tb_k = tb_k - 1
|
tb_k = tb_k - 1
|
||||||
_, current_traceback = I.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback = I.GetVal(tb_s, tb_k)
|
||||||
case OpenDel:
|
case OpenDel:
|
||||||
tb_s = tb_s - o - e
|
tb_s = tb_s - o - e
|
||||||
tb_k = tb_k + 1
|
tb_k = tb_k + 1
|
||||||
_, current_traceback = M.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback = M.GetVal(tb_s, tb_k)
|
||||||
case ExtdDel:
|
case ExtdDel:
|
||||||
tb_s = tb_s - e
|
tb_s = tb_s - e
|
||||||
tb_k = tb_k + 1
|
tb_k = tb_k + 1
|
||||||
_, current_traceback = D.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback = D.GetVal(tb_s, tb_k)
|
||||||
case Sub:
|
case Sub:
|
||||||
tb_s = tb_s - x
|
tb_s = tb_s - x
|
||||||
// tb_k = tb_k;
|
// tb_k = tb_k;
|
||||||
_, current_traceback = M.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback = M.GetVal(tb_s, tb_k)
|
||||||
case Ins:
|
case Ins:
|
||||||
// tb_s = tb_s;
|
// tb_s = tb_s;
|
||||||
// tb_k = tb_k;
|
// tb_k = tb_k;
|
||||||
_, current_traceback = I.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback = I.GetVal(tb_s, tb_k)
|
||||||
case Del:
|
case Del:
|
||||||
// tb_s = tb_s;
|
// tb_s = tb_s;
|
||||||
// tb_k = tb_k;
|
// tb_k = tb_k;
|
||||||
_, current_traceback = D.GetTraceback(tb_s, tb_k)
|
_, _, current_traceback = D.GetVal(tb_s, tb_k)
|
||||||
case End:
|
case End:
|
||||||
done = true
|
done = true
|
||||||
}
|
}
|
||||||
|
@ -3,6 +3,7 @@ package tests
|
|||||||
import (
|
import (
|
||||||
"bufio"
|
"bufio"
|
||||||
"encoding/json"
|
"encoding/json"
|
||||||
|
"math/rand/v2"
|
||||||
"os"
|
"os"
|
||||||
"strconv"
|
"strconv"
|
||||||
"strings"
|
"strings"
|
||||||
@ -27,6 +28,24 @@ type TestCase struct {
|
|||||||
Solutions string `json:"solutions"`
|
Solutions string `json:"solutions"`
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func randRange(min, max int) uint32 {
|
||||||
|
return uint32(rand.IntN(max-min) + min)
|
||||||
|
}
|
||||||
|
|
||||||
|
func TestWavefrontPacking(t *testing.T) {
|
||||||
|
for range 1000 {
|
||||||
|
val := randRange(0, 1000)
|
||||||
|
tb := wfa.Traceback(randRange(0, 7))
|
||||||
|
v := wfa.PackWavefrontValue(val, tb)
|
||||||
|
|
||||||
|
valid, gotVal, gotTB := wfa.UnpackWavefrontValue(v)
|
||||||
|
|
||||||
|
if !valid || gotVal != val || gotTB != tb {
|
||||||
|
t.Errorf(`test WavefrontPack/Unpack, val: %d, tb: %d, packedval: %x, gotok: %t, gotval: %d, gottb: %d\n`, val, tb, v, valid, gotVal, gotTB)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
func TestWFA(t *testing.T) {
|
func TestWFA(t *testing.T) {
|
||||||
content, _ := os.ReadFile(testJsonPath)
|
content, _ := os.ReadFile(testJsonPath)
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user