mirror of
https://github.com/metabarcoding/obitools4.git
synced 2025-06-29 16:20:46 +00:00
359 lines
7.2 KiB
Go
359 lines
7.2 KiB
Go
package obiformats
|
|
|
|
import (
|
|
"git.metabarcoding.org/lecasofts/go/obitools/pkg/obiseq"
|
|
)
|
|
|
|
type __options__ struct {
|
|
fastseq_header_parser obiseq.SeqAnnotator
|
|
fastseq_header_writer func(*obiseq.BioSequence) string
|
|
with_progress_bar bool
|
|
buffer_size int
|
|
batch_size int
|
|
quality_shift int
|
|
parallel_workers int
|
|
closefile bool
|
|
appendfile bool
|
|
compressed bool
|
|
csv_id bool
|
|
csv_sequence bool
|
|
csv_quality bool
|
|
csv_definition bool
|
|
csv_count bool
|
|
csv_taxon bool
|
|
csv_keys []string
|
|
csv_separator string
|
|
csv_navalue string
|
|
paired_filename string
|
|
}
|
|
|
|
type Options struct {
|
|
pointer *__options__
|
|
}
|
|
|
|
// WithOption is a setter applied to an Options value. MakeOptions calls
// each setter it receives, in order, on the freshly initialised options.
type WithOption func(opt Options)
|
|
|
|
func MakeOptions(setters []WithOption) Options {
|
|
o := __options__{
|
|
fastseq_header_parser: ParseGuessedFastSeqHeader,
|
|
fastseq_header_writer: FormatFastSeqJsonHeader,
|
|
with_progress_bar: false,
|
|
buffer_size: 2,
|
|
quality_shift: 33,
|
|
parallel_workers: 4,
|
|
batch_size: 5000,
|
|
closefile: false,
|
|
appendfile: false,
|
|
compressed: false,
|
|
csv_id: true,
|
|
csv_definition: false,
|
|
csv_count: false,
|
|
csv_taxon: false,
|
|
csv_sequence: true,
|
|
csv_quality: false,
|
|
csv_separator: ",",
|
|
csv_navalue: "NA",
|
|
csv_keys: make([]string, 0),
|
|
paired_filename: "",
|
|
}
|
|
|
|
opt := Options{&o}
|
|
|
|
for _, set := range setters {
|
|
set(opt)
|
|
}
|
|
|
|
return opt
|
|
}
|
|
|
|
func (opt Options) QualityShift() int {
|
|
return opt.pointer.quality_shift
|
|
}
|
|
|
|
func (opt Options) BatchSize() int {
|
|
return opt.pointer.batch_size
|
|
}
|
|
|
|
func (opt Options) ParallelWorkers() int {
|
|
return opt.pointer.parallel_workers
|
|
}
|
|
|
|
func (opt Options) ParseFastSeqHeader() obiseq.SeqAnnotator {
|
|
return opt.pointer.fastseq_header_parser
|
|
}
|
|
|
|
func (opt Options) FormatFastSeqHeader() func(*obiseq.BioSequence) string {
|
|
return opt.pointer.fastseq_header_writer
|
|
}
|
|
|
|
func (opt Options) ProgressBar() bool {
|
|
return opt.pointer.with_progress_bar
|
|
}
|
|
|
|
func (opt Options) CloseFile() bool {
|
|
return opt.pointer.closefile
|
|
}
|
|
|
|
func (opt Options) AppendFile() bool {
|
|
return opt.pointer.appendfile
|
|
}
|
|
|
|
func (opt Options) CompressedFile() bool {
|
|
return opt.pointer.compressed
|
|
}
|
|
|
|
func (opt Options) CSVId() bool {
|
|
return opt.pointer.csv_id
|
|
}
|
|
|
|
func (opt Options) CSVDefinition() bool {
|
|
return opt.pointer.csv_definition
|
|
}
|
|
|
|
func (opt Options) CSVCount() bool {
|
|
return opt.pointer.csv_count
|
|
}
|
|
|
|
func (opt Options) CSVTaxon() bool {
|
|
return opt.pointer.csv_taxon
|
|
}
|
|
|
|
func (opt Options) CSVSequence() bool {
|
|
return opt.pointer.csv_sequence
|
|
}
|
|
|
|
func (opt Options) CSVQuality() bool {
|
|
return opt.pointer.csv_quality
|
|
}
|
|
|
|
func (opt Options) CSVKeys() []string {
|
|
return opt.pointer.csv_keys
|
|
}
|
|
|
|
func (opt Options) CSVSeparator() string {
|
|
return opt.pointer.csv_separator
|
|
}
|
|
|
|
func (opt Options) CSVNAValue() string {
|
|
return opt.pointer.csv_navalue
|
|
}
|
|
|
|
func (opt Options) HaveToSavePaired() bool {
|
|
return opt.pointer.paired_filename != ""
|
|
}
|
|
|
|
func (opt Options) PairedFileName() string {
|
|
return opt.pointer.paired_filename
|
|
}
|
|
|
|
func OptionCloseFile() WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.closefile = true
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionDontCloseFile() WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.closefile = false
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionsAppendFile(append bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.appendfile = append
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionsCompressed(compressed bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.compressed = compressed
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionsNewFile() WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.appendfile = false
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
// Allows to specify the ascii code corresponding to
|
|
// a quality of 0 in fastq encoded quality scores.
|
|
func OptionsQualityShift(shift int) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.quality_shift = shift
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
// Allows to specify a quality shift of 33, corresponding
|
|
// to a FastQ file qualities encoded following Sanger
|
|
// convention. This corresponds to Illumina produced FastQ
|
|
// files.
|
|
func OptionsQualitySanger() WithOption {
|
|
return OptionsQualityShift(33)
|
|
}
|
|
|
|
// Allows to specify a quality shift of 64, corresponding
|
|
// to a FastQ file qualities encoded following the Solexa
|
|
// convention.
|
|
func OptionsQualitySolexa() WithOption {
|
|
return OptionsQualityShift(64)
|
|
}
|
|
|
|
func OptionsFastSeqHeaderParser(parser obiseq.SeqAnnotator) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.fastseq_header_parser = parser
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionFastSeqDoNotParseHeader() WithOption {
|
|
return OptionsFastSeqHeaderParser(nil)
|
|
}
|
|
|
|
func OptionsFastSeqDefaultHeaderParser() WithOption {
|
|
return OptionsFastSeqHeaderParser(ParseGuessedFastSeqHeader)
|
|
}
|
|
|
|
// OptionsFastSeqHeaderFormat allows foor specifying the format
|
|
// used to write FASTA and FASTQ sequence.
|
|
func OptionsFastSeqHeaderFormat(format func(*obiseq.BioSequence) string) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.fastseq_header_writer = format
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionsParallelWorkers(nworkers int) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.parallel_workers = nworkers
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionsBatchSize(size int) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.batch_size = size
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionsWithProgressBar() WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.with_progress_bar = true
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func OptionsWithoutProgressBar() WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.with_progress_bar = false
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func WritePairedReadsTo(filename string) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.paired_filename = filename
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVId(include bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_id = include
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVSequence(include bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_sequence = include
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVQuality(include bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_quality = include
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVDefinition(include bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_definition = include
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVCount(include bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_count = include
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVTaxon(include bool) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_taxon = include
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVKey(key string) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_keys = append(opt.pointer.csv_keys, key)
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVKeys(keys []string) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_keys = append(opt.pointer.csv_keys, keys...)
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVSeparator(separator string) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_separator = separator
|
|
})
|
|
|
|
return f
|
|
}
|
|
|
|
func CSVNAValue(navalue string) WithOption {
|
|
f := WithOption(func(opt Options) {
|
|
opt.pointer.csv_navalue = navalue
|
|
})
|
|
|
|
return f
|
|
}
|