LabKey
diff --git a/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/SequenceAnalysisModule.java‎
Lines changed: 1 addition & 0 deletions b/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/SequenceAnalysisModule.java‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/SequenceAnalysisServiceImpl.java‎
Lines changed: 13 additions & 11 deletions b/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/SequenceAnalysisServiceImpl.java‎
Lines changed: 13 additions & 11 deletions
diff --git a/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/run/variant/KingInferenceStep.java‎
Lines changed: 182 additions & 0 deletions b/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/run/variant/KingInferenceStep.java‎
Lines changed: 182 additions & 0 deletions
diff --git a/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/run/variant/PlinkPcaStep.java‎
Lines changed: 6 additions & 4 deletions b/‎SequenceAnalysis/src/org/labkey/sequenceanalysis/run/variant/PlinkPcaStep.java‎
Lines changed: 6 additions & 4 deletions
diff --git a/‎jbrowse/build.gradle‎
Lines changed: 17 additions & 0 deletions b/‎jbrowse/build.gradle‎
Lines changed: 17 additions & 0 deletions
diff --git a/‎jbrowse/package.json‎
Lines changed: 2 additions & 2 deletions b/‎jbrowse/package.json‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎singlecell/resources/chunks/AvgExpression.R‎
Lines changed: 38 additions & 3 deletions b/‎singlecell/resources/chunks/AvgExpression.R‎
Lines changed: 38 additions & 3 deletions
diff --git a/‎singlecell/resources/chunks/CalculateUCellScores.R‎
Lines changed: 1 addition & 1 deletion b/‎singlecell/resources/chunks/CalculateUCellScores.R‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎singlecell/resources/chunks/CiteSeqDimReduxDist.R‎
Lines changed: 2 additions & 2 deletions b/‎singlecell/resources/chunks/CiteSeqDimReduxDist.R‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎singlecell/resources/chunks/CiteSeqDimReduxPca.R‎
Lines changed: 2 additions & 2 deletions b/‎singlecell/resources/chunks/CiteSeqDimReduxPca.R‎
Lines changed: 2 additions & 2 deletions
@@ -303,6 +303,7 @@ public static void registerPipelineSteps()
         SequencePipelineService.get().registerPipelineStep(new VariantsToTableStep.Provider());
         SequencePipelineService.get().registerPipelineStep(new VariantQCStep.Provider());
         SequencePipelineService.get().registerPipelineStep(new PlinkPcaStep.Provider());
+        SequencePipelineService.get().registerPipelineStep(new KingInferenceStep.Provider());
         SequencePipelineService.get().registerPipelineStep(new MendelianViolationReportStep.Provider());
         SequencePipelineService.get().registerPipelineStep(new SummarizeGenotypeQualityStep.Provider());
 
 
@@ -253,16 +253,10 @@ public File ensureVcfIndex(File vcf, Logger log, boolean forceRecreate) throws I
         try
         {
             FileType gz = new FileType(".gz");
-            File expected = new File(vcf.getPath() + FileExtensions.TRIBBLE_INDEX);
-            File tbi = new File(vcf.getPath() + ".tbi");
-
-            if (!forceRecreate && expected.exists())
-            {
-                return expected;
-            }
-            else if  (!forceRecreate && tbi.exists())
+            File expectedIdx = gz.isType(vcf) ? new File(vcf.getPath() + ".tbi") : new File(vcf.getPath() + FileExtensions.TRIBBLE_INDEX);
+            if (!forceRecreate && expectedIdx.exists())
             {
-                return tbi;
+                return expectedIdx;
             }
             else
             {
@@ -272,15 +266,23 @@ else if  (!forceRecreate && tbi.exists())
                 {
                     TabixRunner r = new TabixRunner(log);
                     r.execute(vcf);
+                    if (!expectedIdx.exists())
+                    {
+                        throw new PipelineJobException("Expected index was not created: " + expectedIdx.getPath());
+                    }
 
-                    return tbi;
+                    return expectedIdx;
                 }
                 else
                 {
                     Index idx = IndexFactory.createDynamicIndex(vcf, new VCFCodec());
                     idx.writeBasedOnFeatureFile(vcf);
+                    if (!expectedIdx.exists())
+                    {
+                        throw new PipelineJobException("Expected index was not created: " + expectedIdx.getPath());
+                    }
 
-                    return expected;
+                    return expectedIdx;
                 }
             }
         }
 
@@ -0,0 +1,182 @@
+package org.labkey.sequenceanalysis.run.variant;
+
+import htsjdk.samtools.SAMSequenceDictionary;
+import htsjdk.samtools.SAMSequenceRecord;
+import htsjdk.samtools.util.Interval;
+import htsjdk.variant.utils.SAMSequenceDictionaryExtractor;
+import org.apache.commons.io.FileUtils;
+import org.apache.commons.lang3.StringUtils;
+import org.apache.commons.lang3.math.NumberUtils;
+import org.apache.logging.log4j.Logger;
+import org.json.old.JSONObject;
+import org.labkey.api.pipeline.PipelineJobException;
+import org.labkey.api.sequenceanalysis.SequenceAnalysisService;
+import org.labkey.api.sequenceanalysis.pipeline.AbstractVariantProcessingStepProvider;
+import org.labkey.api.sequenceanalysis.pipeline.PipelineContext;
+import org.labkey.api.sequenceanalysis.pipeline.PipelineStepProvider;
+import org.labkey.api.sequenceanalysis.pipeline.ReferenceGenome;
+import org.labkey.api.sequenceanalysis.pipeline.SequencePipelineService;
+import org.labkey.api.sequenceanalysis.pipeline.ToolParameterDescriptor;
+import org.labkey.api.sequenceanalysis.pipeline.VariantProcessingStep;
+import org.labkey.api.sequenceanalysis.pipeline.VariantProcessingStepOutputImpl;
+import org.labkey.api.sequenceanalysis.run.AbstractCommandPipelineStep;
+import org.labkey.api.sequenceanalysis.run.AbstractCommandWrapper;
+
+import javax.annotation.Nullable;
+import java.io.File;
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.List;
+
+/**
+ * Variant-processing step that runs KING (--kinship) on a VCF. The VCF is first converted with plink
+ * (--make-bed) into bed/bim/fam files under the output directory, and KING is then run against the
+ * resulting .bed file. The KING .kin output is renamed to .kin.txt and registered as a sequence output.
+ */
+public class KingInferenceStep extends AbstractCommandPipelineStep<KingInferenceStep.KingWrapper> implements VariantProcessingStep
+{
+    public KingInferenceStep(PipelineStepProvider<?> provider, PipelineContext ctx)
+    {
+        super(provider, ctx, new KingInferenceStep.KingWrapper(ctx.getLogger()));
+    }
+
+    /**
+     * Registers this step and its single parameter, limitToChromosomes (checkbox, default true).
+     */
+    public static class Provider extends AbstractVariantProcessingStepProvider<KingInferenceStep>
+    {
+        public Provider()
+        {
+            super("KingInferenceStep", "KING/Relatedness", "", "This will run KING to infer kinship from a VCF", Arrays.asList(
+                    ToolParameterDescriptor.create("limitToChromosomes", "Limit to Chromosomes", "If checked, the analysis will include only the primary chromosomes", "checkbox", new JSONObject(){{
+                        put("checked", true);
+                    }}, true)
+            ), null, "https://www.kingrelatedness.com/manual.shtml");
+        }
+
+        @Override
+        public KingInferenceStep create(PipelineContext ctx)
+        {
+            return new KingInferenceStep(this, ctx);
+        }
+    }
+
+    /**
+     * Converts the input VCF to plink binary files, runs KING on them, and returns the kinship table.
+     *
+     * @param inputVCF the VCF to analyze
+     * @param outputDirectory directory that receives the plink intermediates and the KING output
+     * @param genome reference genome; its sequence dictionary is read when limitToChromosomes is set
+     * @param intervals not used by this step
+     * @return the step output, with the renamed kinship file (.kin.txt) added as a sequence output
+     * @throws PipelineJobException if an expected output file is missing, if no primary chromosomes are
+     *                              found when limitToChromosomes is set, or if the kinship file cannot be renamed
+     */
+    @Override
+    public Output processVariants(File inputVCF, File outputDirectory, ReferenceGenome genome, @Nullable List<Interval> intervals) throws PipelineJobException
+    {
+        VariantProcessingStepOutputImpl output = new VariantProcessingStepOutputImpl();
+
+        output.addInput(inputVCF, "Input VCF");
+        output.addInput(genome.getWorkingFastaFile(), "Reference Genome");
+
+        File plinkOut = new File(outputDirectory, "plink");
+        File plinkOutBed = new File(plinkOut.getPath() + ".bed");
+        output.addIntermediateFile(plinkOutBed);
+        output.addIntermediateFile(new File(plinkOut.getPath() + ".fam"));
+        output.addIntermediateFile(new File(plinkOut.getPath() + ".bim"));
+        output.addIntermediateFile(new File(plinkOut.getPath() + ".log"));
+        output.addIntermediateFile(new File(plinkOut.getPath() + "-temporary.psam"));
+
+        PlinkPcaStep.PlinkWrapper plink = new PlinkPcaStep.PlinkWrapper(getPipelineCtx().getLogger());
+        List<String> plinkArgs = new ArrayList<>();
+        plinkArgs.add(plink.getExe().getPath());
+        plinkArgs.add("--vcf");
+        plinkArgs.add(inputVCF.getPath());
+
+        plinkArgs.add("--make-bed");
+
+        boolean limitToChromosomes = getProvider().getParameterByName("limitToChromosomes").extractValue(getPipelineCtx().getJob(), getProvider(), getStepIdx(), Boolean.class, true);
+        if (limitToChromosomes)
+        {
+            plinkArgs.add("--chr");
+            plinkArgs.add(StringUtils.join(getPrimaryChromosomes(genome), ","));
+        }
+        else
+        {
+            plinkArgs.add("--allow-extra-chr");
+        }
+
+        plinkArgs.add("--silent");
+
+        plinkArgs.add("--max-alleles");
+        plinkArgs.add("2");
+
+        plinkArgs.add("--out");
+        plinkArgs.add(plinkOut.getPath());
+
+        Integer threads = SequencePipelineService.get().getMaxThreads(getPipelineCtx().getLogger());
+        if (threads != null)
+        {
+            plinkArgs.add("--threads");
+            plinkArgs.add(threads.toString());
+        }
+
+        //TODO: consider --memory (in MB)
+
+        plink.execute(plinkArgs);
+
+        if (!plinkOutBed.exists())
+        {
+            throw new PipelineJobException("Unable to find file: " + plinkOutBed.getPath());
+        }
+
+        KingWrapper wrapper = new KingWrapper(getPipelineCtx().getLogger());
+        wrapper.setWorkingDir(outputDirectory);
+
+        // The same base name is used for KING's --prefix and for locating the .kin file afterwards
+        String outputPrefix = SequenceAnalysisService.get().getUnzippedBaseName(inputVCF.getName());
+
+        List<String> kingArgs = new ArrayList<>();
+        kingArgs.add(wrapper.getExe().getPath());
+
+        kingArgs.add("-b");
+        kingArgs.add(plinkOutBed.getPath());
+
+        kingArgs.add("--prefix");
+        kingArgs.add(outputPrefix);
+
+        if (threads != null)
+        {
+            kingArgs.add("--cpus");
+            kingArgs.add(threads.toString());
+        }
+
+        kingArgs.add("--kinship");
+
+        File kinshipOutput = new File(outputDirectory, outputPrefix + ".kin");
+        wrapper.execute(kingArgs);
+        if (!kinshipOutput.exists())
+        {
+            throw new PipelineJobException("Unable to find file: " + kinshipOutput.getPath());
+        }
+
+        // Remove any prior copy so the move below does not fail on an existing destination
+        File kinshipOutputTxt = new File(kinshipOutput.getPath() + ".txt");
+        if (kinshipOutputTxt.exists())
+        {
+            kinshipOutputTxt.delete();
+        }
+
+        try
+        {
+            FileUtils.moveFile(kinshipOutput, kinshipOutputTxt);
+        }
+        catch (IOException e)
+        {
+            throw new PipelineJobException(e);
+        }
+
+        output.addSequenceOutput(kinshipOutputTxt, "King Relatedness: " + inputVCF.getName(), "KING Relatedness", null, null, genome.getGenomeId(), null);
+
+        return output;
+    }
+
+    /**
+     * Returns the names of the sequences in the genome's dictionary that look like primary chromosomes,
+     * in dictionary order.
+     *
+     * @throws PipelineJobException if no sequence qualifies, since an empty --chr list cannot be passed to plink
+     */
+    private List<String> getPrimaryChromosomes(ReferenceGenome genome) throws PipelineJobException
+    {
+        SAMSequenceDictionary dict = SAMSequenceDictionaryExtractor.extractDictionary(genome.getSequenceDictionary().toPath());
+        List<String> toKeep = dict.getSequences().stream()
+                .map(SAMSequenceRecord::getSequenceName)
+                .filter(KingInferenceStep::isPrimaryChromosome)
+                .toList();
+
+        if (toKeep.isEmpty())
+        {
+            throw new PipelineJobException("No primary chromosomes (numeric, X or Y, with or without a chr prefix) were found in the sequence dictionary for genome: " + genome.getGenomeId());
+        }
+
+        return toKeep;
+    }
+
+    /**
+     * A sequence counts as a primary chromosome when its name, after removing an optional leading
+     * "chr" (any case), is a number or is X or Y.
+     */
+    private static boolean isPrimaryChromosome(String sequenceName)
+    {
+        // StringUtils.replaceIgnoreCase() performs a literal replacement, so a "^chr" search string never
+        // matches; an anchored, case-insensitive regex is needed to actually strip the prefix
+        String name = sequenceName.replaceFirst("(?i)^chr", "");
+
+        return NumberUtils.isCreatable(name) || "X".equalsIgnoreCase(name) || "Y".equalsIgnoreCase(name);
+    }
+
+    /**
+     * Command wrapper that locates the KING executable.
+     */
+    public static class KingWrapper extends AbstractCommandWrapper
+    {
+        public KingWrapper(@Nullable Logger logger)
+        {
+            super(logger);
+        }
+
+        public File getExe()
+        {
+            return SequencePipelineService.get().getExeForPackage("KINGPATH", "king");
+        }
+    }
+}
@@ -42,6 +42,7 @@
 import java.io.PrintWriter;
 import java.util.ArrayList;
 import java.util.Arrays;
+import java.util.Collection;
 import java.util.HashMap;
 import java.util.HashSet;
 import java.util.List;
@@ -255,12 +256,13 @@ public void init(PipelineJob job, SequenceAnalysisJobSupport support, List<Seque
                                 filter.addCondition(FieldKey.fromString("application"), allowableApplications, CompareType.IN);
                             }
 
-                            Set<String> applications = new HashSet<>(new TableSelector(QueryService.get().getUserSchema(getPipelineCtx().getJob().getUser(), targetContainer, SequenceAnalysisSchema.SCHEMA_NAME).getTable(SequenceAnalysisSchema.TABLE_READSETS), PageFlowUtil.set("application"), filter, null).getArrayList(String.class));
-                            if (applications.size() == 1)
+                            Collection<Map<String, Object>> results = new TableSelector(QueryService.get().getUserSchema(getPipelineCtx().getJob().getUser(), targetContainer, SequenceAnalysisSchema.SCHEMA_NAME).getTable(SequenceAnalysisSchema.TABLE_READSETS), PageFlowUtil.set("application", "rowid"), filter, null).getMapCollection();
+                            if (results.size() == 1)
                             {
-                                writer.println(sample + "\t" + applications.iterator().next());
+                                Map<String, Object> row = results.iterator().next();
+                                writer.println(sample + "\t" + row.get("application") + "\t" + row.get("rowid"));
                             }
-                            else if (applications.size() > 1)
+                            else if (results.size() > 1)
                             {
                                 duplicates.add(sample);
                             }
 
@@ -24,3 +24,20 @@ dependencies {
     BuildUtils.addLabKeyDependency(project: project, config: "modules", depProjectPath: ":server:modules:DiscvrLabKeyModules:SequenceAnalysis", depProjectConfig: "published", depExtension: "module")
     BuildUtils.addLabKeyDependency(project: project, config: "modules", depProjectPath: BuildUtils.getPlatformModuleProjectPath(project.gradle, "pipeline"), depProjectConfig: "published", depExtension: "module")
 }
+
+// tasks.named() returns a lazy TaskProvider; the task is not realized here
+def jbPkgTask = project.tasks.named("npm_run_jb-pkg")
+
+jbPkgTask.configure {
+    // Never store this task's outputs in the build cache
+    outputs.cacheIf {false}
+
+    // Declare the packaged CLI source as input and the pkg output directory as output
+    inputs.dir(project.file("./node_modules/@jbrowse/cli")).withPathSensitivity(PathSensitivity.RELATIVE)
+    outputs.dir(project.file("./resources/external/jb-cli"))
+}
+
+// Run jb-pkg after either webpack build. The provider is passed directly (rather than calling .get())
+// so the jb-pkg task stays lazily configured.
+project.tasks.named("npm_run_build-prod").configure {
+    finalizedBy jbPkgTask
+}
+
+project.tasks.named("npm_run_build-dev").configure {
+    finalizedBy jbPkgTask
+}
@@ -7,8 +7,8 @@
     "build": "npm run build-dev",
     "start": "cross-env NODE_ENV=development LK_MODULE_CONTAINER=DiscvrLabKeyModules LK_MODULE=jbrowse webpack-dev-server --config config/watch.config.js",
     "build-no-pkg": "npm run clean && cross-env NODE_ENV=development LK_MODULE_CONTAINER=DiscvrLabKeyModules LK_MODULE=jbrowse webpack --config config/dev.config.js --progress --profile",
-    "build-dev": "npm run build-no-pkg && npm run jb-pkg",
-    "build-prod": "npm run clean && cross-env NODE_ENV=production PROD_SOURCE_MAP=source-map LK_MODULE_CONTAINER=DiscvrLabKeyModules LK_MODULE=jbrowse webpack --config config/prod.config.js --progress --profile && npm run jb-pkg",
+    "build-dev": "npm run build-no-pkg",
+    "build-prod": "npm run clean && cross-env NODE_ENV=production PROD_SOURCE_MAP=source-map LK_MODULE_CONTAINER=DiscvrLabKeyModules LK_MODULE=jbrowse webpack --config config/prod.config.js --progress --profile",
     "clean": "rimraf resources/web/gen && rimraf resources/web/jbrowse/gen && rimraf resources/views/gen && rimraf resources/views/browser*",
     "test": "cross-env NODE_ENV=test jest",
     "jb-pkg": "pkg ./node_modules/@jbrowse/cli --out-path ./resources/external/jb-cli"
 
@@ -1,10 +1,45 @@
+# Averages expression per group, where a group is one unique combination of the groupFields columns.
+#
+# seuratObj:   the Seurat object to average
+# groupFields: character vector of meta.data column names that define the groups
+# addMetadata: if TRUE, cDNA_ID must be present in meta.data and in groupFields, and
+#              Rdiscvr::QueryAndApplyMetadataUsingCDNA() is applied to the result
+#
+# Returns the object produced by Seurat::AverageExpression(return.seurat = T), with the group fields
+# and a TotalCells column (number of input cells per group) added as metadata.
+GenerateAveragedData <- function(seuratObj, groupFields, addMetadata) {
+    if (addMetadata && !'cDNA_ID' %in% names(seuratObj@meta.data)) {
+        stop('A field named cDNA_ID must exist when addMetadata=TRUE')
+    }
+
+    if (addMetadata && !'cDNA_ID' %in% groupFields) {
+        stop('When addMetadata=TRUE, cDNA_ID must be part of groupFields')
+    }
+
+    # Build one group key per cell. Idents must have one value per cell; assigning the per-group
+    # rownames directly would be recycled across cells and give them the wrong identity.
+    # as.character() per column avoids the whitespace padding apply()/as.matrix() can add to numeric columns.
+    cellMeta <- seuratObj@meta.data[, groupFields, drop = F]
+    cellKeys <- do.call(paste, c(unname(lapply(cellMeta, as.character)), sep = '_'))
+
+    # One metadata row per group, named by the group key
+    isFirst <- !duplicated(cellKeys)
+    meta <- cellMeta[isFirst, , drop = F]
+    rownames(meta) <- cellKeys[isFirst]
+
+    Seurat::Idents(seuratObj) <- cellKeys
+
+    for (assayName in names(seuratObj@assays)) {
+        # Identical counts and data slots indicate the assay has not been normalized
+        if (identical(seuratObj@assays[[assayName]]@counts, seuratObj@assays[[assayName]]@data)) {
+            print(paste0('Seurat assay ', assayName, ' does not appear to be normalized, running now:'))
+            seuratObj <- Seurat::NormalizeData(seuratObj, verbose = FALSE, assay = assayName)
+        }
+    }
+
+    a <- Seurat::AverageExpression(seuratObj, return.seurat = T, verbose = F)
+    a <- Seurat::AddMetaData(a, meta)
+
+    # Match cell counts to the averaged columns by group name rather than by position,
+    # since the column order of the averaged object is not guaranteed to follow a sorted grouping
+    totals <- table(cellKeys)
+    idx <- match(colnames(a), names(totals))
+    if (any(is.na(idx))) {
+        stop(paste0('Unable to match averaged columns to groups: ', paste0(colnames(a)[is.na(idx)], collapse = ', ')))
+    }
+    a$TotalCells <- as.integer(totals[idx])
+
+    if (addMetadata) {
+        a <- Rdiscvr::QueryAndApplyMetadataUsingCDNA(a)
+    }
+
+    return(a)
+}
+
 for (datasetId in names(seuratObjects)) {
     printName(datasetId)
     seuratObj <- readRDS(seuratObjects[[datasetId]])
 
-    df <- CellMembrane::AvgExpression(seuratObj, groupField = groupField)
-    write.table(df, file = paste0(outputPrefix, '.', makeLegalFileName(datasetId), '.avg.', groupField, '.txt'), sep = '\t', row.names = FALSE, quote = FALSE)
-    rm(df)
+    seuratObj <- GenerateAveragedData(seuratObj, groupFields = groupFields, addMetadata = addMetadata)
+    saveData(seuratObj, datasetId)
 
     # Cleanup
     rm(seuratObj)
 
@@ -3,7 +3,7 @@ for (datasetId in names(seuratObjects)) {
     seuratObj <- readRDS(seuratObjects[[datasetId]])
 
     message(paste0('Loading dataset ', datasetId, ', with total cells: ', ncol(seuratObj)))
-    seuratObj <- RIRA::CalculateUCellScores(seuratObj)
+    seuratObj <- RIRA::CalculateUCellScores(seuratObj, storeRanks = storeRanks, assayName = assayName)
 
     saveData(seuratObj, datasetId)
 
 
@@ -2,8 +2,8 @@ for (datasetId in names(seuratObjects)) {
     printName(datasetId)
     seuratObj <- readRDS(seuratObjects[[datasetId]])
 
-    if (!('ADT' %in% names(seuratObj@assays))) {
-        print('ADT assay not present, skipping')
+    if (!(assayName %in% names(seuratObj@assays))) {
+        print(paste0(assayName, ' assay not present, skipping'))
     } else {
         tryCatch({
             seuratObj <- bindArgs(CellMembrane::CiteSeqDimRedux.Dist, seuratObj)()
 
@@ -2,8 +2,8 @@ for (datasetId in names(seuratObjects)) {
     printName(datasetId)
     seuratObj <- readRDS(seuratObjects[[datasetId]])
 
-    if (!('ADT' %in% names(seuratObj@assays))) {
-        print('ADT assay not present, skipping')
+    if (!(assayName %in% names(seuratObj@assays))) {
+        print(paste0(assayName, ' assay not present, skipping'))
     } else {
         seuratObj <- bindArgs(CellMembrane::CiteSeqDimRedux.PCA, seuratObj)()
     }
Original file line number	Diff line number	Diff line change
`@@ -253,16 +253,10 @@ public File ensureVcfIndex(File vcf, Logger log, boolean forceRecreate) throws I`
`253`	`253`	`try`
`254`	`254`	`{`
`255`	`255`	`FileType gz = new FileType(".gz");`
`256`		`- File expected = new File(vcf.getPath() + FileExtensions.TRIBBLE_INDEX);`
`257`		`- File tbi = new File(vcf.getPath() + ".tbi");`
`258`		`-`
`259`		`- if (!forceRecreate && expected.exists())`
`260`		`- {`
`261`		`- return expected;`
`262`		`- }`
`263`		`- else if (!forceRecreate && tbi.exists())`
	`256`	`+ File expectedIdx = gz.isType(vcf) ? new File(vcf.getPath() + ".tbi") : new File(vcf.getPath() + FileExtensions.TRIBBLE_INDEX);`
	`257`	`+ if (!forceRecreate && expectedIdx.exists())`
`264`	`258`	`{`
`265`		`- return tbi;`
	`259`	`+ return expectedIdx;`
`266`	`260`	`}`
`267`	`261`	`else`
`268`	`262`	`{`
`@@ -272,15 +266,23 @@ else if (!forceRecreate && tbi.exists())`
`272`	`266`	`{`
`273`	`267`	`TabixRunner r = new TabixRunner(log);`
`274`	`268`	`r.execute(vcf);`
	`269`	`+ if (!expectedIdx.exists())`
	`270`	`+ {`
	`271`	`+ throw new PipelineJobException("Expected index was not created: " + expectedIdx.getPath());`
	`272`	`+ }`
`275`	`273`
`276`		`- return tbi;`
	`274`	`+ return expectedIdx;`
`277`	`275`	`}`
`278`	`276`	`else`
`279`	`277`	`{`
`280`	`278`	`Index idx = IndexFactory.createDynamicIndex(vcf, new VCFCodec());`
`281`	`279`	`idx.writeBasedOnFeatureFile(vcf);`
	`280`	`+ if (!expectedIdx.exists())`
	`281`	`+ {`
	`282`	`+ throw new PipelineJobException("Expected index was not created: " + expectedIdx.getPath());`
	`283`	`+ }`
`282`	`284`
`283`		`- return expected;`
	`285`	`+ return expectedIdx;`
`284`	`286`	`}`
`285`	`287`	`}`
`286`	`288`	`}`
Original file line number	Diff line number	Diff line change
`@@ -42,6 +42,7 @@`
`42`	`42`	`import java.io.PrintWriter;`
`43`	`43`	`import java.util.ArrayList;`
`44`	`44`	`import java.util.Arrays;`
	`45`	`+import java.util.Collection;`
`45`	`46`	`import java.util.HashMap;`
`46`	`47`	`import java.util.HashSet;`
`47`	`48`	`import java.util.List;`
`@@ -255,12 +256,13 @@ public void init(PipelineJob job, SequenceAnalysisJobSupport support, List<Seque`
`255`	`256`	`filter.addCondition(FieldKey.fromString("application"), allowableApplications, CompareType.IN);`
`256`	`257`	`}`
`257`	`258`
`258`		`- Set<String> applications = new HashSet<>(new TableSelector(QueryService.get().getUserSchema(getPipelineCtx().getJob().getUser(), targetContainer, SequenceAnalysisSchema.SCHEMA_NAME).getTable(SequenceAnalysisSchema.TABLE_READSETS), PageFlowUtil.set("application"), filter, null).getArrayList(String.class));`
`259`		`- if (applications.size() == 1)`
	`259`	`+ Collection<Map<String, Object>> results = new TableSelector(QueryService.get().getUserSchema(getPipelineCtx().getJob().getUser(), targetContainer, SequenceAnalysisSchema.SCHEMA_NAME).getTable(SequenceAnalysisSchema.TABLE_READSETS), PageFlowUtil.set("application", "rowid"), filter, null).getMapCollection();`
	`260`	`+ if (results.size() == 1)`
`260`	`261`	`{`
`261`		`- writer.println(sample + "\t" + applications.iterator().next());`
	`262`	`+ Map<String, Object> row = results.iterator().next();`
	`263`	`+ writer.println(sample + "\t" + row.get("application") + "\t" + row.get("rowid"));`
`262`	`264`	`}`
`263`		`- else if (applications.size() > 1)`
	`265`	`+ else if (results.size() > 1)`
`264`	`266`	`{`
`265`	`267`	`duplicates.add(sample);`
`266`	`268`	`}`