|
8 | 8 |
|
9 | 9 | ezMethodFastqScreen = function(input=NA, output=NA, param=NA,
|
10 | 10 | htmlFile="00index.html"){
|
11 |
| - if(sum(input$meta$`Read Count`) > 1e9){ |
12 |
| - input <- ezMethodSubsampleFastq(input=input, param=param) |
| 11 | + inputReadCount = input$meta$`Read Count` |
| 12 | + if (!is.null(inputReadCount)){ |
| 13 | + ## TODO will fail if input is an unmapped bam but does not have read counts |
| 14 | + inputReadCount = countReadsInFastq(input$getFullPaths("Read1")) |
13 | 15 | }
|
14 |
| - inputRaw <- input$copy() |
| 16 | + if(sum(inputReadCount) > 1e9){ |
| 17 | + input <- ezMethodSubsampleFastq(input=input, param=param, n=1e6) |
| 18 | + } |
| 19 | + inputUntrimmed <- input$copy() |
15 | 20 | # Preprocessing
|
16 | 21 | param$trimAdapter = TRUE
|
17 | 22 | if(input$readType() == "bam"){
|
18 | 23 | stopifnot(input$getLength() == 1L) ## We only support one uBam now.
|
19 |
| - fastqInput <- ezMethodBam2Fastq(input = input, param = param, |
| 24 | + inputUntrimmed <- ezMethodBam2Fastq(input = inputUntrimmed, param = param, |
20 | 25 | OUTPUT_PER_RG=TRUE)
|
21 |
| - input <- ezMethodFastpTrim(input = fastqInput, param = param) |
22 |
| - inputRaw <- fastqInput |
23 |
| - }else{ |
24 |
| - input <- ezMethodFastpTrim(input = input, param = param) |
25 | 26 | }
|
26 |
| - dataset = inputRaw$meta |
| 27 | + input <- ezMethodFastpTrim(input = inputUntrimmed, param = param) |
| 28 | + dataset = inputUntrimmed$meta |
27 | 29 | # fastqscreen part
|
28 | 30 |
|
29 | 31 | ## get Adapter contamination from raw data
|
30 | 32 | confFile = FASTQSCREEN_ADAPTER_CONF
|
31 |
| - files_rawData = inputRaw$getFullPaths("Read1") |
| 33 | + files_rawData = inputUntrimmed$getFullPaths("Read1") |
32 | 34 | resultFiles_rawData = executeFastqscreenCMD(param, confFile = confFile,
|
33 | 35 | files_rawData)
|
34 | 36 | fastqData_rawData = collectFastqscreenOutput(files_rawData,
|
|
0 commit comments