runlocal := flags.Bool("local", false, "run on local host (default: run in an arvados container)")
projectUUID := flags.String("project", "", "project `UUID` for output data")
priority := flags.Int("priority", 500, "container request priority")
runlocal := flags.Bool("local", false, "run on local host (default: run in an arvados container)")
projectUUID := flags.String("project", "", "project `UUID` for output data")
priority := flags.Int("priority", 500, "container request priority")
- inputFilename := flags.String("i", "-", "input `file`")
- outputDir := flags.String("output-dir", "/tmp", "output `directory`")
+ inputDir := flags.String("input-dir", "./in", "input `directory`")
+ outputDir := flags.String("output-dir", "./out", "output `directory`")
annotationsFilename := flags.String("output-annotations", "", "output `file` for tile variant annotations csv")
librefsFilename := flags.String("output-onehot2tilevar", "", "when using -one-hot, create csv `file` mapping column# to tag# and variant#")
labelsFilename := flags.String("output-labels", "", "output `file` for genome labels csv")
annotationsFilename := flags.String("output-annotations", "", "output `file` for tile variant annotations csv")
librefsFilename := flags.String("output-onehot2tilevar", "", "when using -one-hot, create csv `file` mapping column# to tag# and variant#")
labelsFilename := flags.String("output-labels", "", "output `file` for genome labels csv")
Name: "lightning export-numpy",
Client: arvados.NewClientFromEnv(),
ProjectUUID: *projectUUID,
Name: "lightning export-numpy",
Client: arvados.NewClientFromEnv(),
ProjectUUID: *projectUUID,
"-output-dir", "/mnt/output",
"-output-annotations", "/mnt/output/annotations.csv",
"-output-onehot2tilevar", "/mnt/output/onehot2tilevar.csv",
"-output-labels", "/mnt/output/labels.csv",
"-regions", *regionsFilename,
"-expand-regions", fmt.Sprintf("%d", *expandRegions),
"-output-dir", "/mnt/output",
"-output-annotations", "/mnt/output/annotations.csv",
"-output-onehot2tilevar", "/mnt/output/onehot2tilevar.csv",
"-output-labels", "/mnt/output/labels.csv",
"-regions", *regionsFilename,
"-expand-regions", fmt.Sprintf("%d", *expandRegions),
- "-max-variants", fmt.Sprintf("%d", cmd.filter.MaxVariants),
- "-min-coverage", fmt.Sprintf("%f", cmd.filter.MinCoverage),
- "-max-tag", fmt.Sprintf("%d", cmd.filter.MaxTag),
"-chunks", fmt.Sprintf("%d", *chunks),
}
"-chunks", fmt.Sprintf("%d", *chunks),
}
- var input io.ReadCloser
- if *inputFilename == "-" {
- input = ioutil.NopCloser(stdin)
- } else {
- input, err = open(*inputFilename)
- if err != nil {
- return 1
- }
- defer input.Close()
- }
- input = ioutil.NopCloser(bufio.NewReaderSize(input, 8*1024*1024))
tilelib := &tileLibrary{
retainNoCalls: true,
retainTileSequences: true,
compactGenomes: map[string][]tileVariantID{},
}
tilelib := &tileLibrary{
retainNoCalls: true,
retainTileSequences: true,
compactGenomes: map[string][]tileVariantID{},
}
- err = tilelib.LoadGob(context.Background(), input, strings.HasSuffix(*inputFilename, ".gz"), nil)
- if err != nil {
- return 1
- }
- err = input.Close()
+ err = tilelib.LoadDir(context.Background(), *inputDir)
for tag, variants := range tilelib.variant {
lq := lowqual[tag]
for varidx, hash := range variants {
for tag, variants := range tilelib.variant {
lq := lowqual[tag]
for varidx, hash := range variants {