-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun-ecoli
executable file
·35 lines (31 loc) · 1.85 KB
/
run-ecoli
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
#!/bin/sh
# algorithm
# -a,--alpha <arg> alpha=penetrance, fraction of a supporting path's sequence that supports the FR (required)
# -k,--kappa <arg> kappa=maximum insertion length that any supporting path may have (required)
# -cc,--casectrl emphasize FRs that have large case vs. control support (false)
# input
# -d,--dot <arg> splitMEM DOT file (requires FASTA file)
# -f,--fasta <arg> FASTA file (requires DOT file)
# -g,--genotype <arg> which genotype to include (0,1) from the input file; -1 to include all (-1)
# -j,--json <arg> vg JSON file
# -gfa,--gfa <arg> GFA file
# -p,--pathlabels <arg> tab-delimited file with pathname<tab>label
# post-processing input
# -i,--inputprefix <arg> input file prefix for further processing (=outputprefix from previous run)
# -m,--minsup <arg> minsup=minimum number of supporting paths for a region to be considered interesting (1)
# -s,--minsize <arg> minsize=minimum number of nodes that a FR must contain to be considered interesting (1)
# -l,--minlen <arg> minlen=minimum allowed average length (bp) of an FR's subpaths (1)
# output
# -o,--outputprefix <arg> output file prefix (stdout)
# other
# -go,--graphonly just read the graph and output, do not find FRs; for debuggery (false)
# -v,--verbose verbose output (false)
# -do,--debug debug output (false)
# -bf,--bruteforce find FRs comprehensively via brute force - testing only! (false)
alpha=$1
kappa=$2
rm -f ecoli.*
echo "********** alpha=$alpha kappa=$kappa **********"
java -cp "build/install/fr/lib/*" org.ncgr.pangenomics.fr.FRFinder --gfa ecoli/ecoli.pan3.paths.gfa \
--outputprefix ecoli-$alpha-$kappa \
--alpha $alpha --kappa $kappa --debug # --serial --bruteforce --minsup=1 --minsize=1 --minlen=1