Big change iin the data model, and a first version of obiuniq

This commit is contained in:
2022-02-21 19:00:23 +01:00
parent 9737f97084
commit 2e7c1834b0
43 changed files with 664 additions and 440 deletions

View File

@@ -9,19 +9,19 @@ import (
)
type BioSequenceClassifier struct {
Code func(BioSequence) int
Code func(*BioSequence) int
Value func(int) string
Reset func()
Clone func() *BioSequenceClassifier
}
//type BioSequenceClassifier func(sequence BioSequence) string
func AnnotationClassifier(key string, na string) *BioSequenceClassifier {
encode := make(map[string]int, 1000)
decode := make([]string, 0, 1000)
locke := sync.RWMutex{}
maxcode := 0
code := func(sequence BioSequence) int {
code := func(sequence *BioSequence) int {
var val string
if sequence.HasAnnotation() {
value, ok := sequence.Annotations()[key]
@@ -62,12 +62,26 @@ func AnnotationClassifier(key string, na string) *BioSequenceClassifier {
return decode[k]
}
c := BioSequenceClassifier{code, value}
reset := func() {
locke.Lock()
defer locke.Unlock()
for k := range encode {
delete(encode, k)
}
decode = decode[:0]
}
clone := func() *BioSequenceClassifier {
return AnnotationClassifier(key, na)
}
c := BioSequenceClassifier{code, value, reset, clone}
return &c
}
func PredicateClassifier(predicate SequencePredicate) *BioSequenceClassifier {
code := func(sequence BioSequence) int {
code := func(sequence *BioSequence) int {
if predicate(sequence) {
return 1
} else {
@@ -85,14 +99,22 @@ func PredicateClassifier(predicate SequencePredicate) *BioSequenceClassifier {
}
c := BioSequenceClassifier{code, value}
reset := func() {
}
clone := func() *BioSequenceClassifier {
return PredicateClassifier(predicate)
}
c := BioSequenceClassifier{code, value, reset, clone}
return &c
}
// Builds a classifier function based on CRC32 of the sequence
//
func HashClassifier(size int) *BioSequenceClassifier {
code := func(sequence BioSequence) int {
code := func(sequence *BioSequence) int {
return int(crc32.ChecksumIEEE(sequence.Sequence()) % uint32(size))
}
@@ -100,7 +122,15 @@ func HashClassifier(size int) *BioSequenceClassifier {
return strconv.Itoa(k)
}
c := BioSequenceClassifier{code, value}
reset := func() {
}
clone := func() *BioSequenceClassifier {
return HashClassifier(size)
}
c := BioSequenceClassifier{code, value, reset, clone}
return &c
}
@@ -112,7 +142,7 @@ func SequenceClassifier() *BioSequenceClassifier {
locke := sync.RWMutex{}
maxcode := 0
code := func(sequence BioSequence) int {
code := func(sequence *BioSequence) int {
val := sequence.String()
locke.Lock()
@@ -140,7 +170,23 @@ func SequenceClassifier() *BioSequenceClassifier {
return decode[k]
}
c := BioSequenceClassifier{code, value}
reset := func() {
locke.Lock()
defer locke.Unlock()
// for k := range encode {
// delete(encode, k)
// }
encode = make(map[string]int)
decode = decode[:0]
maxcode = 0
}
clone := func() *BioSequenceClassifier {
return SequenceClassifier()
}
c := BioSequenceClassifier{code, value, reset, clone}
return &c
}
@@ -148,7 +194,7 @@ func RotateClassifier(size int) *BioSequenceClassifier {
n := 0
lock := sync.Mutex{}
code := func(sequence BioSequence) int {
code := func(sequence *BioSequence) int {
lock.Lock()
defer lock.Unlock()
n = n % size
@@ -160,6 +206,14 @@ func RotateClassifier(size int) *BioSequenceClassifier {
return strconv.Itoa(k)
}
c := BioSequenceClassifier{code, value}
reset := func() {
}
clone := func() *BioSequenceClassifier {
return RotateClassifier(size)
}
c := BioSequenceClassifier{code, value, reset, clone}
return &c
}