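Fixes #15 (guards the HTML template against chromosomes without annotations, makes compare_array return the full array when both inputs are equal, and bumps the version to 1.3.1)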

brwnj · brwnj · commit 85a9b317765e · 2021-02-11T16:19:27.000-07:00
diff --git a/covviz/bed.py b/covviz/bed.py
@@ -1,8 +1,8 @@
 import csv
 import logging
-import warnings
 import os
 import sys
+import warnings
 from collections import defaultdict
 from itertools import groupby
 
@@ -99,8 +99,10 @@ def get_traces(data, samples, outliers, distance_threshold, slop):
                         )
                     except IndexError as e:
                         # x_values[0] is the first data point
-                        print("index error: %s\nindex_values[0]: %d, distance_idx: %d" % (
-                            e, index_values[0], distance_idx))
+                        print(
+                            "index error: %s\nindex_values[0]: %d, distance_idx: %d"
+                            % (e, index_values[0], distance_idx)
+                        )
                         break
                     extension_length -= (
                         data["x"][index_values[0] - distance_idx + 1]
@@ -167,6 +169,7 @@ def parse_sex_groups(filename, sample_col, sex_col):
             groups[row[sex_col]].append(row[sample_col])
     return groups
 
+
 def normalize_depths(path, sex_chroms, median_window=7):
     filename, ext = os.path.splitext(path)
     if ext == ".gz":
@@ -183,32 +186,37 @@ def normalize_depths(path, sex_chroms, median_window=7):
 
     extras = []
     for s in sex_chroms:
-        if s.startswith("chr"): extras.append(s[3:])
-        else: extras.append("chr" + s)
+        if s.startswith("chr"):
+            extras.append(s[3:])
+        else:
+            extras.append("chr" + s)
     sex_chroms = sex_chroms + extras
 
     # median per site
     autosome = ~np.asarray(df.iloc[:, 0].isin(sex_chroms))
 
     with warnings.catch_warnings():
-        warnings.filterwarnings('ignore', r'All-NaN (slice|axis) encountered')
+        warnings.filterwarnings("ignore", r"All-NaN (slice|axis) encountered")
         site_median = np.nanmedian(df.iloc[:, 3:], axis=1)
 
-    with np.errstate(invalid='ignore'):
+    with np.errstate(invalid="ignore"):
         site_median[np.isnan(site_median) | (site_median < 0.03)] = 1
     # divide autosomes by median at each site so a given block is centered at
     # middle sample.
     for i in range(3, df.shape[1]):
         df.iloc[:, i] = np.where(autosome, df.iloc[:, i] / site_median, df.iloc[:, i])
         if median_window > 1:
-            df.iloc[:, i] = df.iloc[:, i].rolling(median_window).median() #pd.rolling_median(df.iloc[:, i], median_window)
+            df.iloc[:, i] = (
+                df.iloc[:, i].rolling(median_window).median()
+            )  # pd.rolling_median(df.iloc[:, i], median_window)
         inan = np.asarray(np.isnan(df.iloc[:, i]))
         df.iloc[inan, i] = 0.0
-    #df.to_csv(path_or_buf=output_bed, sep="\t", na_rep=0.0, index=False,
+    # df.to_csv(path_or_buf=output_bed, sep="\t", na_rep=0.0, index=False,
     #        compression='gzip',
     #        float_format="%.2f")
     return df
-    #return output_bed
+    # return output_bed
+
 
 def identify_outliers(a, threshold=3.5):
     a = np.asarray(a, dtype=np.float32)
@@ -269,7 +277,7 @@ def parse_bed(
     slop=500000,
     min_samples=8,
     skip_norm=False,
-    window=1
+    window=1,
 ):
     bed_traces = dict()
     # chromosomes, in order of appearance
@@ -286,15 +294,13 @@ def parse_bed(
     else:
         df = normalize_depths(path, sex_chroms, median_window=window)
 
-    if True: # temporary to get sane diff.
+    if True:  # temporary to get sane diff.
         header = list(df.columns)
         samples = header[3:]
         if groups:
             valid = validate_samples(samples, groups)
             if not valid:
-                logger.critical(
-                    "sample ID mismatches exist between ped and bed"
-                )
+                logger.critical("sample ID mismatches exist between ped and bed")
                 sys.exit(1)
         for chr, entries in df.groupby(header[0], as_index=False, sort=False):
 
@@ -334,8 +340,9 @@ def parse_bed(
                         bounds["upper"].append([])
                         bounds["lower"].append([])
                     if all_points:
-                        sample_values = np.minimum(3, np.asarray(row[3:],
-                            dtype=np.float32))
+                        sample_values = np.minimum(
+                            3, np.asarray(row[3:], dtype=np.float32)
+                        )
                         for i, s in enumerate(samples):
                             data[s].append(float(sample_values[i]))
                     else:
diff --git a/covviz/templates/covviz.html b/covviz/templates/covviz.html
@@ -417,57 +417,60 @@ <h5>Problematic low and non-uniform coverage bins</h5>
         // annotation tracks
         let y_offset = -0.10
         let track_idx = 0
-        for (const tracktype of Object.keys(data[chr].annotations)) {
-            for (const track of data[chr].annotations[tracktype]) {
-                let trackname = track[0]
-                let track_color = dark2[track_idx % dark2.length]
-                let track_depth = 0
-                if (tracktype == "gff" || tracktype == "bed") {
-                    let intervals = plot_intervals(track[1], y_offset)
-                    track_depth = intervals.track_depth
-                    scaled_traces.push({
-                        x: intervals.x,
-                        y: intervals.y,
-                        text: intervals.text,
-                        type: "scattergl",
-                        name: trackname,
-                        tracktype: tracktype,
-                        connectgaps: false,
-                        showlegend: false,
-                        line: { width: 2, color: track_color },
-                        mode: "lines+markers",
-                        hoverinfo: "text+x+name",
-                        hoverlabel: { namelength: -1 },
-                        marker: {
-                            size: 6,
-                            symbol: "square",
-                            color: track_color,
-                            line: { width: 1, color: "white" },
-                        },
-                    })
-                } else {
-                    scaled_traces.push({
-                        x: track[1].x,
-                        y: Array(track[1].x.length).fill(y_offset),
-                        mode: "markers",
-                        type: "scattergl",
-                        name: trackname,
-                        text: track[1].text.map((i) => {
-                            return i.replaceAll(";", "<br>")
-                        }),
-                        hoverinfo: "text+x+name",
-                        hoverlabel: { namelength: -1 },
-                        marker: {
-                            size: 6,
-                            symbol: "square",
-                            color: track_color,
-                            line: { width: 1, color: "white" },
-                        },
-                        tracktype: tracktype,
-                    })
+
+        if ("annotations" in data[chr]) {
+            for (const tracktype of Object.keys(data[chr].annotations)) {
+                for (const track of data[chr].annotations[tracktype]) {
+                    let trackname = track[0]
+                    let track_color = dark2[track_idx % dark2.length]
+                    let track_depth = 0
+                    if (tracktype == "gff" || tracktype == "bed") {
+                        let intervals = plot_intervals(track[1], y_offset)
+                        track_depth = intervals.track_depth
+                        scaled_traces.push({
+                            x: intervals.x,
+                            y: intervals.y,
+                            text: intervals.text,
+                            type: "scattergl",
+                            name: trackname,
+                            tracktype: tracktype,
+                            connectgaps: false,
+                            showlegend: false,
+                            line: { width: 2, color: track_color },
+                            mode: "lines+markers",
+                            hoverinfo: "text+x+name",
+                            hoverlabel: { namelength: -1 },
+                            marker: {
+                                size: 6,
+                                symbol: "square",
+                                color: track_color,
+                                line: { width: 1, color: "white" },
+                            },
+                        })
+                    } else {
+                        scaled_traces.push({
+                            x: track[1].x,
+                            y: Array(track[1].x.length).fill(y_offset),
+                            mode: "markers",
+                            type: "scattergl",
+                            name: trackname,
+                            text: track[1].text.map((i) => {
+                                return i.replaceAll(";", "<br>")
+                            }),
+                            hoverinfo: "text+x+name",
+                            hoverlabel: { namelength: -1 },
+                            marker: {
+                                size: 6,
+                                symbol: "square",
+                                color: track_color,
+                                line: { width: 1, color: "white" },
+                            },
+                            tracktype: tracktype,
+                        })
+                    }
+                    y_offset = track_depth - 0.10
+                    track_idx += 1
                 }
-                y_offset = track_depth - 0.10
-                track_idx += 1
             }
         }
 
@@ -849,7 +852,7 @@ <h5>PCA 1 vs 3</h5>
         let seen = new Set()
 
         for (const chr of data.chromosomes) {
-            if ("gff" in data[chr].annotations) {
+            if ("annotations" in data[chr] && "gff" in data[chr].annotations) {
                 for (const gff of data[chr].annotations.gff) {
                     let filename = gff[0]
                     let gene_data = gff[1]
diff --git a/covviz/utils.py b/covviz/utils.py
@@ -17,7 +17,11 @@ def compare_array(a, b):
         b = np.pad(b, (0, len_a - len_b), mode="constant")
     elif len_b > len_a:
         a = np.pad(a, (0, len_b - len_a), mode="constant")
-    return a[: np.nonzero(a != b)[0][0]]
+    try:
+        return a[: np.nonzero(a != b)[0][0]]
+    except IndexError:
+        # case: a == b
+        return a
 
 
 def find_common_start(items):
diff --git a/docker/Dockerfile b/docker/Dockerfile
@@ -4,6 +4,6 @@ RUN apt-get update && apt-get install -y procps
 RUN conda create -n env -c conda-forge python=3.7 numpy>=1.16.2 jinja2>=2.10.1
 RUN echo "source activate env" > ~/.bashrc
 ENV PATH /opt/conda/envs/env/bin:$PATH
-RUN /opt/conda/envs/env/bin/pip install --no-cache-dir covviz==1.3.0
+RUN /opt/conda/envs/env/bin/pip install --no-cache-dir covviz==1.3.1
 RUN wget -qO /usr/bin/goleft https://github.com/brentp/goleft/releases/download/v0.2.3/goleft_linux64
 RUN chmod +x /usr/bin/goleft
diff --git a/nextflow.config b/nextflow.config
@@ -25,7 +25,7 @@ process {
     errorStrategy = { task.exitStatus in [1,143,137,104,134,139] ? 'retry' : 'terminate' }
     maxRetries = 3
     maxErrors = '-1'
-    container = 'brwnj/covviz:v1.3.0'
+    container = 'brwnj/covviz:v1.3.1'
     withLabel: 'indexcov' {
         memory = { 8.GB * task.attempt }
         cache = 'deep'
@@ -62,7 +62,7 @@ manifest {
     name = 'brwnj/covviz'
     author = 'Joe Brown'
     description = "find large, coverage-based variations on chromosomes"
-    version = '1.3.0'
+    version = '1.3.1'
     nextflowVersion = '>=0.32.0'
     homePage = 'https://github.com/brwnj/covviz'
     mainScript = 'main.nf'
diff --git a/setup.py b/setup.py
@@ -18,7 +18,7 @@
 EMAIL = "brwnjm@gmail.com"
 AUTHOR = "Joe Brown"
 REQUIRES_PYTHON = ">=3.6.0"
-VERSION = "1.3.0"
+VERSION = "1.3.1"
 
 # What packages are required for this module to be executed?
 REQUIRED = ["Jinja2", "numpy", "pandas"]