aboutsummaryrefslogtreecommitdiff
path: root/tools/gridss-assemble.nix
blob: 15e5ca604409c6b41d14244167ebf53cadd4ca4b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
# Options for the GRIDSS breakend-assembly stage (gridss.AssembleBreakends).
# After this option set the function takes `inputs`, a list of inputs that
# are matched as the `bam` filetype further down.
{ bionix
# Attribute set forwarded to bionix.bwa.index when indexing the reference.
, bwaIndexAttrs ? { }
# Attribute set forwarded to bionix.samtools.faidx for the reference.
, faidxAttrs ? { }
# Attribute set forwarded to bionix.samtools.index for each input.
, indexAttrs ? { }
# Attribute set forwarded to bionix.gridss.collectMetrics for each input.
, collectMetricsAttrs ? { }
# Extra text appended verbatim to the end of the java command line (null = none).
, flags ? null
# When non-null, passed through bionix.gridss.gridssConfig and handed to
# GRIDSS as OPTIONS_FILE=...
, config ? null
# Value placed directly after -Xmx on the java command line.
, heapSize ? "31g"
# Paths whose contents are copied into ./out.gridss.working before the
# assembly runs.
, workdirs ? [ ]
# Emitted as JOB_INDEX=... / JOB_NODES=... on the command line; both are
# rendered with toString.
, jobIndex ? null
, jobNodes ? null
}:

with bionix;
with lib;
with types;

inputs:

let
  # Extract the reference attached to an input; only the `bam` filetype has a
  # handler here. NOTE(review): other filetypes presumably abort inside
  # matchFiletype -- confirm against its definition.
  getref = matchFiletype "gridss-assemble" { bam = x: x.ref; };
  # Reference of the first input; the build below uses it for every input
  # (guarded by the homoRef assertion).
  ref = getref (head inputs);
  # Sorting predicate: only a `coord` handler is supplied, and it yields true.
  sorted = matchFileSorting "gridss-assemble" { coord = _: true; };
  # True iff all inputs resolve to exactly one distinct reference. An empty
  # input list gives zero distinct references, hence false.
  homoRef = length (unique (map getref inputs)) == 1;

  # Shell fragment, generated once per input, that prepares the per-input
  # "<basename>.gridss.working" directory: it symlinks the input as
  # "<basename>.sv.bam", its samtools index as "<basename>.sv.bai", and every
  # file produced by collectMetrics as "<basename>.<suffix>", where <suffix>
  # is the text after the last "." of the metrics file path (the ''${f##*.}
  # expansion).
  linkInput = input: ''
    BASENAME=$(basename ${input})
    WRKDIR="''${BASENAME}.gridss.working"
    mkdir $WRKDIR
    ln -s ${input} $WRKDIR/$BASENAME.sv.bam
    ln -s  ${bionix.samtools.index indexAttrs input} $WRKDIR/$BASENAME.sv.bai
    for f in ${bionix.gridss.collectMetrics collectMetricsAttrs input}/* ; do
      ln -s $f $WRKDIR/$BASENAME.''${f##*.}
    done
  '';
in

assert (all sorted inputs);
assert homoRef;

# Build stage that runs gridss.AssembleBreakends over all inputs.
stage rec {
  name = "gridss-assemble";
  buildInputs = with pkgs; [ jre bwa ];
  # "out" receives the file GRIDSS writes as `out` (or an empty file if none
  # was written); "work" receives a copy of ./out.gridss.working.
  outputs = [ "out" "work" ];
  # Script outline:
  #   1. link the reference, its faidx index and the bwa index files into the
  #      build directory;
  #   2. create the per-input working directories (linkInput);
  #   3. seed ./out.gridss.working from `workdirs` and make it writable;
  #   4. run AssembleBreakends with the build directory as WORKING_DIR/TMP_DIR;
  #   5. copy the results into the two outputs.
  # JOB_INDEX and JOB_NODES are each emitted only when their own option is
  # non-null. JOB_NODES was previously guarded by jobIndex, which produced an
  # empty "JOB_NODES=" when only jobIndex was set and dropped jobNodes when
  # only jobNodes was set.
  buildCommand = ''
    TMPDIR=$(pwd)
    ln -s ${ref} ref.fa
    ln -s ${bionix.samtools.faidx faidxAttrs ref} ref.fa.fai
    for f in ${bionix.bwa.index bwaIndexAttrs ref}/*; do
      ln -s $f
    done
    ${concatMapStringsSep "\n" linkInput inputs}
    mkdir out.gridss.working
    ${concatMapStringsSep "\n" (w: "cp -r ${w}/* ./out.gridss.working") workdirs}
    chmod -R u+rwX out.gridss.working
    java -Xmx${heapSize} -Dsamjdk.create_index=true \
      -cp ${bionix.gridss.jar} gridss.AssembleBreakends \
      VERBOSITY=WARNING \
      REFERENCE_SEQUENCE=ref.fa \
      ${concatMapStringsSep " " (i: "INPUT='${i}'") inputs} \
      WORKER_THREADS=$NIX_BUILD_CORES \
      OUTPUT=out \
      ${optionalString (config != null) ("OPTIONS_FILE=" + bionix.gridss.gridssConfig config)} \
      WORKING_DIR=$TMPDIR/ \
      TMP_DIR=$TMPDIR/ \
      ${optionalString (jobIndex != null) "JOB_INDEX=${toString jobIndex}"} \
      ${optionalString (jobNodes != null) "JOB_NODES=${toString jobNodes}"} \
      ${optionalString (flags != null) flags}
    [ -e out ] && cp -r out $out
    touch $out
    cp -r out.gridss.working $work
  '';
  # The result is tagged as a BAM on the same reference with no declared sorting.
  passthru.filetype = filetype.bam { inherit ref; sorting = sort.none { }; };
  passthru.multicore = true;
}