+ cmd.trainingSet = make([]int, len(cmd.cgnames))
+ if *samplesFilename == "" {
+ cmd.trainingSetSize = len(cmd.cgnames)
+ for i, name := range cmd.cgnames {
+ cmd.samples = append(cmd.samples, sampleInfo{
+ id: trimFilenameForLabel(name),
+ isTraining: true,
+ })
+ cmd.trainingSet[i] = i
+ }
+ } else if len(cmd.cgnames) != len(cmd.samples) {
+ return fmt.Errorf("mismatched sample list: %d samples in library, %d in %s", len(cmd.cgnames), len(cmd.samples), *samplesFilename)
+ } else {
+ for i, name := range cmd.cgnames {
+ if s := trimFilenameForLabel(name); s != cmd.samples[i].id {
+ return fmt.Errorf("mismatched sample list: sample %d is %q in library, %q in %s", i, s, cmd.samples[i].id, *samplesFilename)
+ }
+ }
+ if *caseControlOnly {
+ for i := 0; i < len(cmd.samples); i++ {
+ if !cmd.samples[i].isTraining && !cmd.samples[i].isValidation {
+ if i+1 < len(cmd.samples) {
+ copy(cmd.samples[i:], cmd.samples[i+1:])
+ copy(cmd.cgnames[i:], cmd.cgnames[i+1:])
+ }
+ cmd.samples = cmd.samples[:len(cmd.samples)-1]
+ cmd.cgnames = cmd.cgnames[:len(cmd.cgnames)-1]
+ i--
+ }
+ }
+ }
+ cmd.chi2Cases = nil
+ cmd.trainingSetSize = 0
+ for i := range cmd.cgnames {
+ if cmd.samples[i].isTraining {
+ cmd.trainingSet[i] = cmd.trainingSetSize
+ cmd.trainingSetSize++
+ cmd.chi2Cases = append(cmd.chi2Cases, cmd.samples[i].isCase)
+ } else {
+ cmd.trainingSet[i] = -1
+ }
+ }
+ if cmd.pvalue == nil {
+ cmd.pvalue = func(onehot []bool) float64 {
+ return pvalue(onehot, cmd.chi2Cases)
+ }
+ }