├── .gitignore
├── .pre-commit-config.yaml
├── .travis.yml
├── LICENSE
├── README.md
├── bin
    ├── cellposeStaging.py
    ├── imgProcessing.py
    ├── main.py
    ├── pseudoSort.py
    ├── qcDriver.py
    ├── segmentationDriver.py
    ├── spaceTxConverter.py
    └── starfishDriver.py
├── docker
    ├── baysor
    │   └── Dockerfile
    ├── cellpose
    │   └── Dockerfile
    ├── starfish-custom
    │   └── Dockerfile
    ├── starfish-docker-runner
    │   └── Dockerfile
    └── starfish
    │   └── Dockerfile
├── docker_images.txt
├── flowchart.svg
├── input_schemas
    ├── cellpose.json
    ├── pipeline.json
    ├── processing.json
    ├── psortedDefaultParams.json
    ├── qc.json
    ├── segmentation.json
    ├── sorter.json
    ├── spaceTxConversion.json
    └── starfishRunner.json
├── logo.png
├── pipeline-manifest.json
├── pipeline.cwl
├── pyproject.toml
├── requirements.txt
├── requirements_test.txt
├── steps
    ├── baysor.cwl
    ├── baysorStaged.cwl
    ├── cellpose.cwl
    ├── fileSizer.cwl
    ├── inputParser.cwl
    ├── processing.cwl
    ├── psortedDefaultParams.cwl
    ├── qc.cwl
    ├── segmentation.cwl
    ├── sorter.cwl
    ├── spaceTxConversion.cwl
    ├── starfishRunner.cwl
    └── tmpdir.cwl
└── test.sh


/.gitignore:
--------------------------------------------------------------------------------
1 | *~
2 | .*.kate-swp
3 | .*.swp
4 | .idea/
5 | __pycache__/
6 | 


--------------------------------------------------------------------------------
/.pre-commit-config.yaml:
--------------------------------------------------------------------------------
 1 | repos:
 2 |   - repo: https://github.com/psf/black
 3 |     rev: 24.1.1
 4 |     hooks:
 5 |       - id: black
 6 |         language_version: python3
 7 |   - repo: https://github.com/pycqa/isort
 8 |     rev: 5.12.0
 9 |     hooks:
10 |       - id: isort
11 |         args: ["--profile", "black"]
12 | 


--------------------------------------------------------------------------------
/.travis.yml:
--------------------------------------------------------------------------------
1 | dist: focal
2 | language: python
3 | python: 3.8
4 | install:
5 |   - pip install -r requirements_test.txt
6 | script:
7 |   - ./test.sh
8 | 


--------------------------------------------------------------------------------
/bin/cellposeStaging.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python
  2 | 
  3 | import glob
  4 | from argparse import ArgumentParser
  5 | from copy import deepcopy
  6 | from os import makedirs
  7 | from pathlib import Path
  8 | 
  9 | import numpy as np
 10 | import skimage.measure
 11 | import skimage.segmentation
 12 | import tifffile
 13 | from scipy.ndimage import gaussian_filter
 14 | from starfish.core.intensity_table.decoded_intensity_table import DecodedIntensityTable
 15 | 
 16 | 
 17 | def scale_img(image):
 18 |     image = image - np.min(image)
 19 |     image = image.astype("float32") / np.max(image)
 20 |     image = image * 2**16
 21 |     image[image == 2**16] = 2**16 - 1
 22 |     return np.rint(image).astype("uint16")
 23 | 
 24 | 
 25 | def _clip_percentile_to_zero(image, p_min, p_max, min_coeff=1, max_coeff=1):
 26 |     v_min, v_max = np.percentile(image, [p_min, p_max])
 27 |     v_min = min_coeff * v_min
 28 |     v_max = max_coeff * v_max
 29 |     return np.clip(image, v_min, v_max) - np.float32(v_min)
 30 | 
 31 | 
 32 | def cellpose_format(output_dir, input_dir, aux_ch_names, mRNA_dir, selected_fovs):
 33 |     # Get all fov names
 34 |     if selected_fovs is None:
 35 |         primary_jsons = glob.glob(f"{input_dir}/primary-*.json")
 36 |         fovs = [
 37 |             primary_json.split("/")[-1].split("-")[-1].split(".")[0]
 38 |             for primary_json in primary_jsons
 39 |         ]
 40 |     else:
 41 |         fovs = ["fov_{:05}".format(int(f)) for f in selected_fovs]
 42 | 
 43 |     # Get number of z slices by looking at the fov_000 files
 44 |     fov0_files = glob.glob(f"{input_dir}/primary-{fovs[0]}*.tiff")
 45 |     shape = tifffile.imread(fov0_files[0]).shape  # Get image xy shape (will need later)
 46 |     fov0_files = [file.split("/")[-1] for file in fov0_files]
 47 |     zs = np.max([int(file.split("-")[-1][1]) for file in fov0_files])
 48 | 
 49 |     # Make folder for cellpose inputs if it doesn't exist
 50 |     makedirs(output_dir, exist_ok=True)
 51 | 
 52 |     # Create cellpose inputs
 53 |     # Images have to be 16 bit and have dimension order z, ch, y, x
 54 |     for fov in fovs:
 55 |         mRNA_ch = 1 if mRNA_dir else 0
 56 |         empty_ch = 1 if len(aux_ch_names) == 1 and not mRNA_ch else 0
 57 |         new_img = np.zeros(
 58 |             [zs + 1, len(aux_ch_names) + mRNA_ch + empty_ch] + list(shape), dtype="uint16"
 59 |         )
 60 |         for ch, aux_ch_name in enumerate(aux_ch_names):
 61 |             files = sorted(glob.glob(f"{input_dir}/{aux_ch_name}-{fov}-c0-r0-z*.tiff"))
 62 |             for z, file in enumerate(files):
 63 |                 img = tifffile.imread(file)
 64 |                 if np.max(img) <= 1:
 65 |                     img = np.rint(img * 2**16).astype("uint16")
 66 |                 new_img[z, ch] = deepcopy(img)
 67 |             new_img[:, ch] = _clip_percentile_to_zero(new_img[:, ch], p_min=0, p_max=99.9)
 68 |             new_img[:, ch] = scale_img(new_img[:, ch])
 69 | 
 70 |         # Add mRNA density channel if specified
 71 |         # Each mRNA is plotted as a single point of maximum intensity and the the resulting image is then
 72 |         # blurred with a guassian filter.
 73 |         if mRNA_dir:
 74 |             dit = DecodedIntensityTable.open_netcdf(f"{mRNA_dir}/cdf/{fov}_decoded.cdf")
 75 |             coords = np.array(
 76 |                 [[z, y, x] for z, y, x in zip(dit["z"].data, dit["y"].data, dit["x"].data)]
 77 |             )
 78 |             mRNAs = np.zeros([zs + 1] + list(shape), dtype="uint16")
 79 |             mRNAs[tuple(coords.T)] = 2**16 - 1
 80 |             for z in range(zs + 1):
 81 |                 mRNAs[z] = gaussian_filter(
 82 |                     mRNAs[z], sigma=10, cval=0, truncate=4.0, mode="nearest"
 83 |                 )
 84 |             new_img[:, -1] = scale_img(mRNAs)
 85 | 
 86 |         # Save result, squeeze out any size 1 dimensions
 87 |         tifffile.imsave(f"{output_dir}/{fov}_image.tiff", np.squeeze(new_img))
 88 | 
 89 | 
 90 | def filter_cellpose(
 91 |     output_dir, input_dir, border_buffer=None, label_exp_size=None, min_size=None, max_size=None
 92 | ):
 93 |     # Make folder if it doesn't exist
 94 |     makedirs(output_dir, exist_ok=True)
 95 | 
 96 |     # For each file, check for each function if it should be run then run it if yes
 97 |     files = glob.glob(f"{input_dir}/*cp_masks*")
 98 |     for file in files:
 99 |         # print(f"found {file}")
100 |         mask = tifffile.imread(file)
101 | 
102 |         # Clear border objects
103 |         if border_buffer is not None:
104 |             # print(f"\tclearing border of size {border_buffer}")
105 |             if mask.ndim == 3:
106 |                 for z in range(mask.shape[0]):
107 |                     mask[z] = skimage.segmentation.clear_border(mask[z], buffer_size=border_buffer)
108 |             else:
109 |                 mask = skimage.segmentation.clear_border(mask, buffer_size=border_buffer)
110 |             mask = skimage.segmentation.relabel_sequential(mask)[0]
111 | 
112 |         # Expand labels
113 |         if label_exp_size is not None:
114 |             # print(f"\texpanding labels by size {label_exp_size}")
115 |             if mask.ndim == 3:
116 |                 for z in range(mask.shape[0]):
117 |                     mask[z] = skimage.segmentation.expand_labels(mask[z], distance=label_exp_size)
118 |             else:
119 |                 mask = skimage.segmentation.expand_labels(mask, distance=label_exp_size)
120 | 
121 |         # Remove labels below a minimum size threshold
122 |         if min_size is not None:
123 |             # print(f"\tcells beneath size {min_size} being removed")
124 |             props = skimage.measure.regionprops(mask)
125 |             small_labels = np.where([p.area < min_size for p in props])[0] + 1
126 |             mask[np.isin(mask, small_labels)] = 0
127 |             mask = skimage.segmentation.relabel_sequential(mask)[0]
128 | 
129 |         # Remove labels above a maximum size threshold
130 |         if max_size is not None:
131 |             # print(f"\tcells above size {max_size} being removed")
132 |             props = skimage.measure.regionprops(mask)
133 |             big_labels = np.where([p.area > max_size for p in props])[0] + 1
134 |             mask[np.isin(mask, big_labels)] = 0
135 |             mask = skimage.segmentation.relabel_sequential(mask)[0]
136 | 
137 |         # Save result
138 |         tifffile.imsave(f'{output_dir}/fov_{file.split("fov_")[-1][:5]}_masks.tiff', mask)
139 | 
140 | 
if __name__ == "__main__":
    parser = ArgumentParser()

    # Options shared by both modes
    parser.add_argument("--input-dir", type=Path)
    parser.add_argument("--tmp-prefix", type=str)
    parser.add_argument("--selected-fovs", nargs="+", const=None)

    # Formatting mode: build cellpose input images
    parser.add_argument("--format", dest="format", action="store_true")
    parser.add_argument("--aux-views", type=str, nargs="+")
    parser.add_argument("--decoded-dir", type=Path, nargs="?")

    # Filtering mode: clean up cellpose output masks
    parser.add_argument("--filter", dest="filter", action="store_true")
    for int_flag in ("--border-buffer", "--label-exp-size", "--min-size", "--max-size"):
        parser.add_argument(int_flag, type=int, nargs="?")

    args = parser.parse_args()

    # Exactly one of the two mode flags must be set.
    if args.format == args.filter:
        raise ValueError("Script must be run with --format xor --filter. Terminating.")

    if args.filter:
        # because we know these two will be called as a part of the same cwl,
        # we don't need to re-clarify selected_fovs on the filter step
        filter_cellpose(
            output_dir=f"tmp/{args.tmp_prefix}/5C_cellpose_filtered",
            input_dir=args.input_dir,
            border_buffer=args.border_buffer,
            label_exp_size=args.label_exp_size,
            min_size=args.min_size,
            max_size=args.max_size,
        )
    else:
        cellpose_format(
            output_dir=f"tmp/{args.tmp_prefix}/5A_cellpose_input",
            input_dir=args.input_dir,
            aux_ch_names=args.aux_views,
            mRNA_dir=args.decoded_dir,
            selected_fovs=args.selected_fovs,
        )
182 | 


--------------------------------------------------------------------------------
/bin/imgProcessing.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python
  2 | 
  3 | import hashlib
  4 | import json
  5 | import os
  6 | import shutil
  7 | import sys
  8 | from argparse import ArgumentParser
  9 | from concurrent.futures.process import ProcessPoolExecutor
 10 | from copy import deepcopy
 11 | from datetime import datetime
 12 | from functools import partial, partialmethod
 13 | from os import path
 14 | from pathlib import Path
 15 | from time import time
 16 | from typing import List
 17 | 
 18 | import cv2
 19 | import numpy as np
 20 | import starfish
 21 | import tifffile as tiff
 22 | from scipy import ndimage
 23 | from skimage import exposure, morphology, restoration
 24 | from skimage.morphology import disk
 25 | from skimage.registration import phase_cross_correlation
 26 | from starfish import Experiment, ImageStack
 27 | from starfish.types import Levels
 28 | from tqdm import tqdm
 29 | 
 30 | 
 31 | def saveImg(loc: str, prefix: str, img: ImageStack):
 32 |     # save the individual slices of an image in the same format starfish does
 33 |     for r in range(img.num_rounds):
 34 |         for c in range(img.num_chs):
 35 |             for z in range(img.num_zplanes):
 36 |                 tiff.imsave(
 37 |                     "{}{}-c{}-r{}-z{}.tiff".format(loc, prefix, c, r, z), img._data[r, c, z, :, :]
 38 |                 )
 39 | 
 40 | 
 41 | def saveExp(
 42 |     source_dir: str, save_dir: str, exp: Experiment = None, selected_fovs: List[str] = None
 43 | ):
 44 |     # go through and save all images, if an experiment is provided
 45 |     if exp:
 46 |         for fov in exp.keys():
 47 |             for view in exp[fov].image_types:
 48 |                 img = exp[fov].get_image(view)
 49 |                 prefix = f"{view}-{fov}"
 50 |                 saveImg(save_dir, prefix, img)
 51 | 
 52 |     # copy the non-tiff files to the new directory
 53 |     cp_files = [x for x in os.listdir(source_dir) if x[-5:] != ".tiff" and x[-4:] != ".log"]
 54 |     for file in cp_files:
 55 |         print(f"looking at {file}.")
 56 |         if "fov" in file:
 57 |             # images were only updated if we looked at that fov
 58 |             if (selected_fovs is None) or (True in [f in file for f in selected_fovs]):
 59 |                 # if file contains images, we need to update sha's
 60 |                 data = json.load(open(str(source_dir) + "/" + file))
 61 |                 for i in range(len(data["tiles"])):
 62 |                     abspath = str(save_dir) + "/" + data["tiles"][i]["file"]
 63 |                     with open(os.fspath(abspath), "rb") as fh:
 64 |                         hsh = hashlib.sha256(fh.read()).hexdigest()
 65 |                     data["tiles"][i]["sha256"] = hsh
 66 |                     print(f"\tupdated hash for {data['tiles'][i]['file']}")
 67 |                 with open(str(save_dir) + "/" + file, "w") as f:
 68 |                     json.dump(data, f)
 69 |                 print(f"saved {file} with modified hashes")
 70 |             else:
 71 |                 print(f"\tskipping file {file}")
 72 |         else:
 73 |             # if we're using a subset of fovs, we'll need to modify view files
 74 |             if (selected_fovs is not None) and (
 75 |                 "json" in file and "codebook" not in file and "experiment" not in file
 76 |             ):
 77 |                 data = json.load(open(str(source_dir) + "/" + file))
 78 |                 new_data = {}
 79 |                 for k, v in data.items():
 80 |                     if k == "contents":
 81 |                         # this is where we select only fovs that we care about
 82 |                         new_data["contents"] = {f: v[f] for f in selected_fovs}
 83 |                     else:
 84 |                         new_data[k] = v
 85 |                 with open(str(save_dir) + "/" + file, "w") as f:
 86 |                     json.dump(new_data, f)
 87 |                 print(f"\tsaved {file} with used FOVs.")
 88 |             else:
 89 |                 # we can just copy the rest of the files
 90 |                 shutil.copyfile(f"{source_dir}/{file}", f"{save_dir}/{file}")
 91 |                 print(f"\tcopied {file}")
 92 | 
 93 | 
 94 | def register_primary_aux(img, reg_img, chs_per_reg):
 95 |     """
 96 |     Register primary images using provided registration images.
 97 |     chs_per_reg is number of primary image channels
 98 |     associated with each registration image.
 99 | 
100 |     Calculates shifts between auxillary images using the first
101 |     auxillary image as a reference, then applies shifts to primary images.
102 |     """
103 |     # Calculate registration shifts from registration images
104 |     shifts = {}
105 |     # Reference is set arbitrarily to first round/channel
106 |     reference = reg_img.xarray.data[0, 0]
107 |     for r in range(reg_img.num_rounds):
108 |         for ch in range(reg_img.num_chs):
109 |             shift, error, diffphase = phase_cross_correlation(
110 |                 reference, reg_img.xarray.data[r, ch], upsample_factor=100
111 |             )
112 |             shifts[(r, ch)] = shift
113 | 
114 |     # Create transformation matrices
115 |     shape = img.raw_shape
116 |     tforms = {}
117 |     for r, ch in shifts:
118 |         tform = np.diag([1.0] * 4)
119 |         # Start from 1 because we don't want to shift in the z direction (if there is one)
120 |         for i in range(1, 3):
121 |             tform[i, 3] = shifts[(r, ch)][i]
122 |         tforms[(r, ch)] = tform
123 | 
124 |     # Register primary images
125 |     for r in range(img.num_rounds):
126 |         for ch in range(img.num_chs):
127 |             img.xarray.data[r, ch] = ndimage.affine_transform(
128 |                 img.xarray.data[r, ch],
129 |                 np.linalg.inv(tforms[(r, ch // chs_per_reg)]),
130 |                 output_shape=shape[2:],
131 |             )
132 |     return img
133 | 
134 | 
def calc_reg_shift(images, reg_img):
    """
    Worker for parallel registration: measure each image's shift to reg_img.

    Returns a list with one phase-cross-correlation shift per entry of images,
    in the same order.
    """
    return [
        phase_cross_correlation(reg_img, image, upsample_factor=100)[0] for image in images
    ]
146 | 
147 | 
def apply_reg_shift(image_tforms, shape):
    """
    Worker for parallel registration: apply one transform to each image.

    image_tforms: pair ``(images, tforms)`` of equally ordered sequences; the
        inverse of each transform matrix is passed to the affine transform.
    shape: full stack shape; its entries from index 2 onward are used as the
        output shape of every transformed image.

    Returns the list of transformed images.
    """
    return [
        ndimage.affine_transform(
            image,
            np.linalg.inv(image_tforms[1][idx]),
            output_shape=shape[2:],
        )
        for idx, image in enumerate(image_tforms[0])
    ]
164 | 
165 | 
def register_primary_primary_parallel(img, reg_img, num_threads):
    """
    Align every primary round/channel to a single registration image.

    The round/channel combinations are split into num_threads chunks. Shifts
    against the first round/channel of reg_img are measured per chunk in a
    process pool, turned into translation matrices, and applied per chunk in a
    second process pool. Both pools are created with their default worker
    count.

    Returns img, modified in place.
    """
    # Chunk round/channel combinations for parallel run
    rchs = [(r, ch) for r in range(img.num_rounds) for ch in range(img.num_chs)]
    bounds = [0] + [int((len(rchs) / num_threads) * i) for i in range(1, num_threads + 1)]
    chunked_rchs = [rchs[lo:hi] for lo, hi in zip(bounds[:-1], bounds[1:])]

    # Images grouped the same way as the round/channel chunks
    chunked_imgs = [[img.xarray.data[r, ch] for r, ch in chunk] for chunk in chunked_rchs]

    # Calculate registration shifts in parallel
    find_shifts = partial(calc_reg_shift, reg_img=reg_img.xarray.data[0, 0])
    with ProcessPoolExecutor() as pool:
        chunked_shifts = list(pool.map(find_shifts, chunked_imgs))

    # Translation matrices grouped the same way as the round/channel chunks
    chunked_tforms = []
    for i, chunk in enumerate(chunked_rchs):
        chunk_tforms = []
        for j in range(len(chunk)):
            tform = np.diag([1.0] * 4)
            # Rows 1 and 2 only: we don't want to shift in the z direction (if there is one)
            for axis in (1, 2):
                tform[axis, 3] = chunked_shifts[i][j][axis]
            chunk_tforms.append(tform)
        chunked_tforms.append(chunk_tforms)

    # Apply registration shifts in parallel
    shift_images = partial(apply_reg_shift, shape=img.raw_shape)
    with ProcessPoolExecutor() as pool:
        chunked_aligned = list(pool.map(shift_images, list(zip(chunked_imgs, chunked_tforms))))

    # Write the aligned images back into the stack
    for i, chunk in enumerate(chunked_rchs):
        for j, (r, ch) in enumerate(chunk):
            img.xarray.data[r, ch] = deepcopy(chunked_aligned[i][j])

    return img
231 | 
232 | 
def subtract_background(img, background):
    """
    Subtract a measured background stack from the primary images, plane by plane.

    Primary channel ``ch`` is paired with background channel
    ``ch % background.num_chs``; rounds and z-planes are paired one-to-one.
    Negative differences are set to zero.

    Returns img, modified in place.
    """
    bg_dat = background.xarray.data
    bg_chs = background.num_chs
    plane_ids = (
        (r, ch, z)
        for r in range(img.num_rounds)
        for ch in range(img.num_chs)
        for z in range(img.num_zplanes)
    )
    for r, ch, z in plane_ids:
        diff = img.xarray.data[r, ch, z].astype("float32") - bg_dat[
            r, ch % bg_chs, z
        ].astype("float32")
        # NOTE(review): the result is truncated to uint16 before being written
        # back - confirm the stack holds integer-scaled intensities, not [0, 1] floats.
        img.xarray.data[r, ch, z] = np.maximum(diff, 0).astype("uint16")

    return img
251 | 
252 | 
def morph_open(images, size=100):
    """
    Multiprocessing helper function to run morphological openings in parallel.

    images: iterable of arrays whose first axis indexes z-planes; each plane is
        opened independently.
    size: radius passed to ``disk`` to build the structuring element
        (defaults to the previously hard-coded 100).

    Returns a list with one opened array per input image, same shape and dtype.
    """
    # The structuring element does not depend on the image, so build it once
    # instead of once per z-plane.
    footprint = disk(size)
    morphed = []
    for image in images:
        background = np.zeros_like(image)
        for z in range(image.shape[0]):
            background[z] = cv2.morphologyEx(image[z], cv2.MORPH_OPEN, footprint)
        morphed.append(background)
    return morphed
265 | 
266 | 
def subtract_background_estimate(img, num_threads):
    """
    Estimate the background with morph_open and subtract it from the image.

    The round/channel combinations are split into num_threads chunks that are
    opened in a process pool (created with its default worker count). Each
    estimate is subtracted from its round/channel and negative results are set
    to zero.

    Returns img, modified in place.
    """
    # Chunk round/channel combinations for parallel run
    rchs = [(r, ch) for r in range(img.num_rounds) for ch in range(img.num_chs)]
    bounds = [0] + [int((len(rchs) / num_threads) * i) for i in range(1, num_threads + 1)]
    chunked_rchs = [rchs[lo:hi] for lo, hi in zip(bounds[:-1], bounds[1:])]

    # Images grouped the same way as the round/channel chunks
    chunked_imgs = [[img.xarray.data[r, ch] for r, ch in chunk] for chunk in chunked_rchs]

    # Run morph open in parallel
    with ProcessPoolExecutor() as pool:
        chunked_estimates = list(pool.map(morph_open, chunked_imgs))

    # Subtract background estimates from img
    for i, chunk in enumerate(chunked_rchs):
        for j, (r, ch) in enumerate(chunk):
            img.xarray.data[r, ch] = img.xarray.data[r, ch] - chunked_estimates[i][j]
            updated = img.xarray.data[r, ch]
            updated[updated < 0] = 0
    return img
300 | 
301 | 
def rolling_ball(img, rolling_rad=3, num_threads=1):
    """
    Perform rolling ball background subtraction on every 2D plane of the stack.

    rolling_rad: radius handed to ``restoration.rolling_ball``.
    num_threads: thread count handed to ``restoration.rolling_ball``.

    Returns img, modified in place.
    """
    plane_ids = (
        (r, ch, z)
        for r in range(img.num_rounds)
        for ch in range(img.num_chs)
        for z in range(img.num_zplanes)
    )
    for r, ch, z in plane_ids:
        background = restoration.rolling_ball(
            img.xarray.data[r, ch, z], radius=rolling_rad, num_threads=num_threads
        )
        img.xarray.data[r, ch, z] -= background
    return img
314 | 
315 | 
def match_hist_2_min(img):
    """
    Match the histogram of every round/channel to the one with the lowest mean.

    The round/channel with the smallest mean intensity is used as reference;
    each round/channel is histogram-matched to it and the result is rounded to
    the nearest integer before being written back.

    Returns img, modified in place.
    """
    # Mean intensity per round/channel, in round-major order
    means = {
        (r, ch): np.mean(img.xarray.data[r, ch])
        for r in range(img.num_rounds)
        for ch in range(img.num_chs)
    }
    ref_r, ref_ch = sorted(means, key=means.get)[0]

    # Use min image as reference for histogram matching
    reference = img.xarray.data[ref_r, ref_ch]
    for r, ch in means:
        matched = exposure.match_histograms(img.xarray.data[r, ch], reference)
        img.xarray.data[r, ch] = np.rint(matched)
    return img
336 | 
337 | 
def white_top_hat(img, wth_rad):
    """
    Apply a white top hat filter to every 2D plane of the stack.

    wth_rad: radius of the disk used as the structuring element.

    Returns img, modified in place.
    """
    kernel = morphology.disk(wth_rad)
    plane_ids = (
        (r, ch, z)
        for r in range(img.num_rounds)
        for ch in range(img.num_chs)
        for z in range(img.num_zplanes)
    )
    for r, ch, z in plane_ids:
        img.xarray.data[r, ch, z] = cv2.morphologyEx(
            img.xarray.data[r, ch, z], cv2.MORPH_TOPHAT, kernel
        )
    return img
350 | 
351 | 
352 | def cli(
353 |     input_dir: Path,
354 |     output_dir: str,
355 |     n_processes: int,
356 |     clip_min: float = 0,
357 |     clip_max: float = 99.9,
358 |     level_method: str = "",
359 |     is_volume: bool = False,
360 |     register_aux_view: str = None,
361 |     register_to_primary: bool = False,
362 |     ch_per_reg: int = 1,
363 |     background_name: str = None,
364 |     register_background: bool = False,
365 |     anchor_name: str = None,
366 |     high_sigma: int = None,
367 |     decon_iter: int = 15,
368 |     decon_sigma: int = None,
369 |     low_sigma: int = None,
370 |     rolling_rad: int = None,
371 |     match_hist: bool = False,
372 |     wth_rad: int = None,
373 |     rescale: bool = False,
374 |     selected_fovs: List[int] = None,
375 | ):
376 |     """
377 |     n_processes: If provided, the number of threads to use for processing. Otherwise, the max number of
378 |         available CPUs will be used.
379 | 
380 |     clip_min: minimum value for ClipPercentileToZero
381 | 
382 |     is_volume: whether to treat the z-planes as a 3D image.
383 | 
384 |     level_method: Which level method to be applied to the Clip filter.
385 | 
386 |     aux_name: name of the aux view to align registration to
387 | 
388 |     chs_per_reg: Number of images/channels associated with each registration image.
389 |     If registration images are duplicated so that the dimensions of primary and
390 |     registration images match then keep set to 1 for 1-to-1 registration.
391 | 
392 |     background_name: name of the background view that will be subtracted, if provided.
393 | 
394 |     register_background: if true, the background image will be registered to 'aux_name'
395 | 
396 |     anchor_name: name of the aux view anchor round to perform processing on, if provided.
397 | 
398 |     high_sigma: Sigma value for high pass filter. High values remove less autofluorescence
399 |         while lower values remove more. Won't need to change between data sets unless you
400 |         had lots of autofluorescence.
401 | 
402 |     decon_iter: Number of iterations for deconvolution. High values remove more noise while
403 |         lower values remove less. Won't need to change between data sets unless image is very noisy.
404 | 
405 |     decon_sigma: Sigma value for deconvolution. Should be approximately the expected spot size.
406 | 
407 |     low_sigma: Sigma value for lowpass filtering. Larger values result in stronger
408 |     blurring. This should be low so can remain constant.
409 | 
410 |     rolling_rad: Radius for rolling ball background subtraction. Larger values lead to
411 |         increased intensity evening effect. Likely doesn't need changed from 3.
412 | 
413 |     match_hist: If true, will perform histogram matching.
414 | 
415 |     wth_rad: Radius for white top hat filter. Should be slightly larger than the expected spot radius.
416 | 
417 |     rescale: If true, will not run final clip and scale on image, because it is expected to rescale
418 |         the images in the following decoding step.
419 | 
420 |     selected_fovs: If provided, only FOVs with the provided indicies will be run.
421 |     """
422 | 
423 |     os.makedirs(output_dir, exist_ok=True)
424 | 
425 |     reporter = open(
426 |         path.join(output_dir, datetime.now().strftime("%Y%m%d_%H%M%S.%f_img_processing.log")), "w"
427 |     )
428 |     sys.stdout = reporter
429 |     sys.stderr = reporter
430 | 
431 |     print(locals())
432 | 
433 |     tqdm.__init__ = partialmethod(tqdm.__init__, disable=True)
434 | 
435 |     if level_method and level_method.upper() == "SCALE_BY_CHUNK":
436 |         level_method = Levels.SCALE_BY_CHUNK
437 |     elif level_method and level_method.upper() == "SCALE_BY_IMAGE":
438 |         level_method = Levels.SCALE_BY_IMAGE
439 |     elif level_method and level_method.upper() == "SCALE_SATURATED_BY_CHUNK":
440 |         level_method = Levels.SCALE_SATURATED_BY_CHUNK
441 |     elif level_method and level_method.upper() == "SCALE_SATURATED_BY_IMAGE":
442 |         level_method = Levels.SCALE_SATURATED_BY_IMAGE
443 |     else:
444 |         level_method = Levels.SCALE_BY_IMAGE
445 | 
446 |     t0 = time()
447 |     exp = starfish.core.experiment.experiment.Experiment.from_json(
448 |         str(input_dir / "experiment.json")
449 |     )
450 |     if selected_fovs is not None:
451 |         fovs = ["fov_{:05}".format(int(f)) for f in selected_fovs]
452 |     else:
453 |         fovs = list(exp.keys())
454 | 
455 |     for fov in fovs:
456 |         img = exp[fov].get_image("primary")
457 |         t1 = time()
458 |         print("Fetched view " + fov)
459 | 
460 |         anchor = None
461 |         if anchor_name:
462 |             anchor = exp[fov].get_image(anchor_name)
463 |             print("\tanchor image retrieved")
464 | 
465 |         if background_name:
466 |             # If a background image is provided, subtract it from the primary image.
467 |             bg = exp[fov].get_image(background_name)
468 |             print("\tremoving existing backgound...")
469 |             img = subtract_background(img, bg)
470 |             if anchor_name:
471 |                 print("\tremoving existing background from anchor image...")
472 |                 anchor = subtract_background(anchor, bg)
473 |         else:
474 |             # If no background image is provided, estimate background using a large morphological
475 |             # opening to subtract from primary images
476 |             print("\tremoving estimated background...")
477 |             img = subtract_background_estimate(img, n_processes)
478 |             if anchor_name:
479 |                 print("\tremoving estimated background from anchor image...")
480 |                 anchor = subtract_background_estimate(anchor, n_processes)
481 | 
482 |         if high_sigma:
483 |             # Remove cellular autofluorescence w/ gaussian high-pass filter
484 |             print("\trunning high pass filter...")
485 |             ghp = starfish.image.Filter.GaussianHighPass(sigma=high_sigma)
486 |             # ghp.run(img, verbose=False, in_place=True)
487 |             ghp.run(img, verbose=False, in_place=True, n_processes=n_processes)
488 |             if anchor_name:
489 |                 print("\trunning high pass filter on anchor image...")
490 |                 ghp.run(anchor, verbose=False, in_place=True, n_processes=n_processes)
491 | 
492 |         if decon_sigma:
493 |             # Increase resolution by deconvolving w/ point spread function
494 |             print("\tdeconvolving point spread function...")
495 |             dpsf = starfish.image.Filter.DeconvolvePSF(num_iter=decon_iter, sigma=decon_sigma)
496 |             # dpsf.run(img, verbose=False, in_place=True)
497 |             dpsf.run(img, verbose=False, in_place=True, n_processes=n_processes)
498 |             if anchor_name:
499 |                 print("\tdeconvolving point spread function on anchor image...")
500 |                 dpsf.run(anchor, verbose=False, in_place=True, n_processes=n_processes)
501 | 
502 |         if low_sigma:
503 |             # Blur image with lowpass filter
504 |             print("\trunning low pass filter...")
505 |             glp = starfish.image.Filter.GaussianLowPass(sigma=low_sigma)
506 |             # glp.run(img, verbose=False, in_place=True)
507 |             glp.run(img, verbose=False, in_place=True, n_processes=n_processes)
508 | 
509 |         if wth_rad:
510 |             print("\trunning white tophat filter...")
511 |             img = white_top_hat(img, wth_rad)
512 |             if anchor_name:
513 |                 print("\trunning white tophat filter on anchor image...")
514 |                 anchor = white_top_hat(anchor, wth_rad)
515 | 
516 |         if rolling_rad:
517 |             # Apply rolling ball background subtraction method to even out intensities through each 2D image
518 |             print("\tapplying rolling ball background subtraction...")
519 |             img = rolling_ball(img, rolling_rad=rolling_rad, num_threads=n_processes)
520 |             if anchor_name:
521 |                 print("\tapplying rolling ball background subtraction to anchor image...")
522 |                 anchor = rolling_ball(anchor, rolling_rad=rolling_rad, num_threads=n_processes)
523 | 
524 |         if match_hist:
525 |             # Use histogram matching to lower the intensities of each 3D image down to the same
526 |             # intensity range as the least bright image. This is done so spot finding can be done.
527 |             # BlobDetector doesn't do well when the intensities are in different ranges and
528 |             # clipping the values is not sufficient.
529 |             print("\tapplying histogram matching...")
530 |             img = match_hist_2_min(img)
531 |             if anchor_name:
532 |                 print("\tapplying histogram matching to anchor image...")
533 |                 anchor = match_hist_2_min(anchor)
534 | 
535 |         if register_to_primary:
536 |             # If register_to_primary calculate registration shifts between primary images and the single aux image and
537 |             # apply to primary images
538 |             register = exp[fov].get_image(register_aux_view)
539 |             if register.shape["r"] != 1:
540 |                 raise Exception(
541 |                     "If --register-primary-view is used, auxillary images must have only a single round/channel (use the --aux-single-round option)"
542 |                 )
543 |             else:
544 |                 print("\taligning to " + register_aux_view)
545 |                 img = register_primary_primary_parallel(img, register, n_processes)
546 |         elif register_aux_view:
547 |             # If not register_to_primary but still registering, calculate registration shifts between specified aux images and apply to primary images
548 |             register = exp[fov].get_image(register_aux_view)
549 |             if register.shape["r"] != img.shape["r"]:
550 |                 raise Exception(
551 |                     "If --register-aux-view is used, auxillary image dimensions must match primary image dimensions"
552 |                 )
553 |             else:
554 |                 print("\taligning to " + register_aux_view)
555 |                 img = register_primary_aux(img, register, ch_per_reg)
556 | 
557 |         if not rescale and not (clip_min == 0 and clip_max == 0):
558 |             print("\tclip and scaling...")
559 |             # Scale image, clipping all but the highest intensities to zero
560 |             clip = starfish.image.Filter.ClipPercentileToZero(
561 |                 p_min=clip_min, p_max=clip_max, is_volume=is_volume, level_method=level_method
562 |             )
563 |             clip.run(img, in_place=True)
564 |             if anchor_name:
565 |                 print("\tapplying clip and scale to anchor image...")
566 |                 clip = starfish.image.Filter.ClipPercentileToZero(
567 |                     p_min=90, p_max=99.9, is_volume=is_volume, level_method=level_method
568 |                 )
569 |                 clip.run(anchor, in_place=True)
570 | 
571 |         else:
572 |             print("\tskipping clip and scale.")
573 |             # Clip values below 0 and greater than 1 (prevents errors in decoding)
574 |             clip = starfish.image.Filter.ClipPercentileToZero(
575 |                 p_min=0, p_max=100, is_volume=is_volume, level_method=Levels.CLIP
576 |             )
577 |             clip.run(img, in_place=True)
578 | 
579 |         print(f"\tView {fov} complete")
580 |         # save modified image
581 |         saveImg(output_dir, f"primary-{fov}", img)
582 | 
583 |         # save all aux views while we're here
584 |         for view in exp[fov].image_types:
585 |             if view != "primary" and view != anchor_name:
586 |                 aux_img = exp[fov].get_image(view)
587 |                 saveImg(output_dir, f"{view}-{fov}", aux_img)
588 |             elif view == anchor_name:
589 |                 saveImg(output_dir, f"{view}-{fov}", anchor)
590 | 
591 |         print(f"View {fov} saved")
592 |         print(f"Time for {fov}: {time() - t1}")
593 | 
594 |     print(f"Saving updated .jsons for {fovs}, copying other jsons\n")
595 |     saveExp(input_dir, output_dir, exp=None, selected_fovs=fovs)
596 |     print(f"\n\nTotal time elapsed for processing: {time() - t0}")
597 | 
598 | 
if __name__ == "__main__":
    # Command-line entry point: gather the processing options and forward them to cli().
    parser = ArgumentParser()

    parser.add_argument("--tmp-prefix", type=str)
    parser.add_argument("--input-dir", type=Path)
    parser.add_argument("--clip-min", type=float, default=0)
    parser.add_argument("--clip-max", type=float, default=99.9)
    parser.add_argument("--level-method", type=str, nargs="?")
    parser.add_argument("--is-volume", action="store_true")
    parser.add_argument("--register-aux-view", type=str, nargs="?")
    parser.add_argument("--register-to-primary", action="store_true")
    parser.add_argument("--ch-per-reg", type=int, nargs="?")
    parser.add_argument("--background-view", type=str, nargs="?")
    parser.add_argument("--register-background", action="store_true")
    parser.add_argument("--anchor-view", type=str, nargs="?")
    parser.add_argument("--high-sigma", type=int, nargs="?")
    parser.add_argument("--decon-iter", type=int, nargs="?")
    parser.add_argument("--decon-sigma", type=int, nargs="?")
    parser.add_argument("--low-sigma", type=int, nargs="?")
    parser.add_argument("--rolling-radius", type=int, nargs="?")
    parser.add_argument("--match-histogram", action="store_true")
    parser.add_argument("--tophat-radius", type=int, nargs="?")
    parser.add_argument("--rescale", action="store_true")
    parser.add_argument("--n-processes", type=int, nargs="?")
    parser.add_argument("--selected-fovs", nargs="+", const=None)

    args = parser.parse_args()

    # Processed images are written below the per-run temporary prefix.
    output_dir = f"tmp/{args.tmp_prefix}/3_processed/"

    # An explicit --n-processes wins.  Otherwise use the number of CPUs this process may run on,
    # falling back to a single process where os.sched_getaffinity is unavailable (it is not
    # guaranteed to work on non-linux machines).
    n_processes = args.n_processes
    if not n_processes:
        try:
            n_processes = len(os.sched_getaffinity(os.getpid()))
        except Exception:
            n_processes = 1

    # Several cli() keywords are named differently from their command-line options, so the
    # mapping is spelled out explicitly.
    cli_kwargs = {
        "input_dir": args.input_dir,
        "output_dir": output_dir,
        "clip_min": args.clip_min,
        "clip_max": args.clip_max,
        "level_method": args.level_method,
        "is_volume": args.is_volume,
        "register_aux_view": args.register_aux_view,
        "register_to_primary": args.register_to_primary,
        "ch_per_reg": args.ch_per_reg,
        "background_name": args.background_view,
        "register_background": args.register_background,
        "anchor_name": args.anchor_view,
        "high_sigma": args.high_sigma,
        "decon_iter": args.decon_iter,
        "decon_sigma": args.decon_sigma,
        "low_sigma": args.low_sigma,
        "rolling_rad": args.rolling_radius,
        "match_hist": args.match_histogram,
        "wth_rad": args.tophat_radius,
        "rescale": args.rescale,
        "n_processes": n_processes,
        "selected_fovs": args.selected_fovs,
    }
    cli(**cli_kwargs)
662 | 


--------------------------------------------------------------------------------
/bin/main.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python3
 2 | from argparse import ArgumentParser
 3 | from pathlib import Path
 4 | 
 5 | import starfish
 6 | 
 7 | 
 8 | def main(data_dir: Path):
 9 |     print("hello world")
10 |     pass
11 | 
12 | 
if __name__ == "__main__":
    # One positional argument, parsed as a Path and handed straight to main().
    parser = ArgumentParser()
    parser.add_argument("data_dir", type=Path)
    main(parser.parse_args().data_dir)
19 | 


--------------------------------------------------------------------------------
/bin/pseudoSort.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python
  2 | 
  3 | import sys
  4 | from argparse import ArgumentParser
  5 | from datetime import datetime
  6 | from os import makedirs, path
  7 | from pathlib import Path
  8 | from typing import Dict, List
  9 | 
 10 | import numpy as np
 11 | import pandas as pd
 12 | import skimage.io
 13 | import yaml
 14 | from starfish import Codebook
 15 | 
 16 | 
 17 | def parse_codebook(codebook_csv: str) -> Codebook:
 18 |     csv: pd.DataFrame = pd.read_csv(codebook_csv, index_col=0)
 19 |     genes = csv.index.values
 20 |     data_raw = csv.values
 21 |     rounds = csv.shape[1]
 22 |     channels = data_raw.max()
 23 | 
 24 |     # convert data_raw -> data, where data is genes x channels x rounds
 25 |     data = np.zeros((len(data_raw), rounds, channels))
 26 |     for b in range(len(data_raw)):
 27 |         for i in range(len(data_raw[b])):
 28 |             if data_raw[b][i] != 0:
 29 |                 data[b][i][data_raw[b][i] - 1] = 1
 30 | 
 31 |     return Codebook.from_numpy(genes, rounds, channels, data)
 32 | 
 33 | 
 34 | def convert_codebook(
 35 |     oldbook: Codebook, cycles_conv: Dict[int, int], channels_conv: List[Dict[int, int]]
 36 | ) -> Codebook:
 37 |     raw = oldbook.data
 38 |     targets = np.shape(raw)[0]
 39 |     rounds = len(cycles_conv)
 40 |     channels = len(channels_conv[0])
 41 |     new_data = np.empty((targets, rounds, channels), dtype=int)
 42 |     for t in range(targets):
 43 |         for pr in range(len(raw[t])):
 44 |             # annoying math because dicts are saved for the other direction
 45 |             pchannel = np.argmax(raw[t][pr])
 46 |             subChannel = [
 47 |                 [tch for tch, pch in subchannel.items() if pch == pchannel]
 48 |                 for subchannel in channels_conv
 49 |             ]
 50 |             subRound = np.argmax([len(per_round) for per_round in subChannel])
 51 |             tchannel = subChannel[subRound][0]
 52 |             tround = [tr for tr, pround in cycles_conv.items() if pround == pr][subRound]
 53 |             # print("channel {}->{} round {}->{}".format(pchannel,tchannel,pr,tround))
 54 |             new_data[t][tround][tchannel] = 1
 55 | 
 56 |     return Codebook.from_numpy(oldbook.coords["target"].data, rounds, channels, new_data)
 57 | 
 58 | 
 59 | def reformatter(
 60 |     cycles_conv: Dict[int, int],
 61 |     channels_conv: List[Dict[int, int]],
 62 |     input_dir: str,
 63 |     file_format: str = "",
 64 |     output_format: str = "",
 65 |     output_vars: List[str] = [],
 66 |     output_dir: str = "",
 67 |     file_vars: str = "",
 68 |     fov_count: int = 1,
 69 |     cache_read_order: List[str] = [],
 70 |     channel_slope: float = 1,
 71 |     channel_intercept: int = 0,
 72 |     fov_offset: int = 0,
 73 |     round_offset: int = 0,
 74 |     channel_offset: int = 0,
 75 |     aux_file_formats: List[str] = [],
 76 |     aux_file_vars: List[List[str]] = [],
 77 |     aux_names: List[str] = [],
 78 |     aux_cache_read_order: List[List[str]] = [],
 79 |     aux_channel_count: List[int] = [],
 80 |     aux_channel_slope: List[float] = [],
 81 |     aux_channel_intercept: List[int] = [],
 82 | ):
 83 |     reportFile = path.join(output_dir, datetime.now().strftime("%Y%d%m_%H%M_psorting.log"))
 84 |     sys.stdout = open(reportFile, "w")
 85 | 
 86 |     combined_file_format = [file_format] + aux_file_formats
 87 |     combined_file_vars = [file_vars] + aux_file_vars
 88 |     combined_names = [""] + aux_names
 89 |     combined_cache_read_order = [cache_read_order] + aux_cache_read_order
 90 |     combined_channel_count = [len(channels_conv[0])] + aux_channel_count
 91 |     channel_slope = [1] + aux_channel_slope
 92 |     channel_intercept = [0] + aux_channel_intercept
 93 |     views = len(combined_names)
 94 | 
 95 |     for r in cycles_conv.keys():
 96 |         for c in range(max(combined_channel_count)):
 97 |             for fov in range(fov_count):
 98 |                 varTable = {
 99 |                     "channel": c,
100 |                     "offset_channel": c + channel_offset,
101 |                     "round": r,
102 |                     "offset_round": r + round_offset,
103 |                     "fov": fov,
104 |                     "offset_fov": fov + fov_offset,
105 |                 }
106 |                 for target in range(views):
107 |                     if c < combined_channel_count[target]:
108 |                         varTable["input_channel"] = int(
109 |                             int(c * channel_slope[target]) + channel_intercept[target]
110 |                         )
111 |                         file_path = path.join(
112 |                             input_dir,
113 |                             combined_file_format[target].format(
114 |                                 *[varTable[arg] for arg in combined_file_vars[target]]
115 |                             ),
116 |                         )
117 |                         print(varTable)
118 |                         img = skimage.io.imread(file_path)
119 | 
120 |                         # Convert to uint16 if not already
121 |                         if np.max(img) <= 1:
122 |                             img = np.rint(img * 2**16).astype("uint16")
123 |                         if img.dtype != "uint16":
124 |                             img = img.astype("uint16")
125 |                         # img_out = img
126 | 
127 |                         # figure out what slice to take.
128 |                         slices = []
129 |                         for i in range(len(combined_cache_read_order[target])):
130 |                             axis = combined_cache_read_order[target][i]
131 |                             if axis.lower() == "ch":
132 |                                 c_adj = int(channel_slope[target] * c) + channel_intercept[target]
133 |                                 slices.append(int(c_adj))
134 |                             elif axis.lower() == "round":
135 |                                 slices.append(r)
136 |                             else:
137 |                                 slices.append(slice(0, img.shape[i]))
138 | 
139 |                         # take slices out of image and reduce unneeded dims
140 |                         slices = tuple(slices)
141 |                         print(slices)
142 |                         img_out = np.squeeze(img[slices])
143 | 
144 |                         # convert to new rounds/channels
145 |                         pr = cycles_conv[r]
146 |                         pc = channels_conv[r % len(channels_conv)][c]
147 | 
148 |                         # get output string
149 |                         varTableConv = {
150 |                             "channel": pc,
151 |                             "offset_channel": pc + channel_offset,
152 |                             "round": pr,
153 |                             "offset_round": pr + round_offset,
154 |                             "fov": fov,
155 |                             "offset_fov": fov + fov_offset,
156 |                             "aux_name": combined_names[target],
157 |                         }
158 |                         output_path = path.join(
159 |                             output_dir,
160 |                             output_format.format(*[varTableConv[arg] for arg in output_vars]),
161 |                         )
162 |                         print("{}\n->{}".format(file_path, output_path))
163 |                         print(np.shape(img_out))
164 |                         skimage.io.imsave(output_path, img_out)
165 | 
166 |     sys.stdout = sys.__stdout__
167 |     return True
168 | 
169 | 
if __name__ == "__main__":
    # Command-line entry point: re-sort the images with reformatter() and, when a codebook is
    # supplied, write both the original and the converted codebook next to them.
    p = ArgumentParser()
    p.add_argument("--tmp-prefix", type=str)
    p.add_argument("--input-dir", type=Path)
    p.add_argument("--codebook-csv", type=Path, nargs="?")
    p.add_argument("--codebook-json", type=Path, nargs="?")
    p.add_argument("--channel-yml", type=Path)
    p.add_argument("--cycle-yml", type=Path)
    p.add_argument("--file-format", type=str)
    p.add_argument("--file-vars", type=str, nargs="+")
    p.add_argument("--cache-read-order", type=str, nargs="+")
    p.add_argument("--z-plane-offset", type=int)
    p.add_argument("--fov-offset", type=int)
    p.add_argument("--round-offset", type=int)
    p.add_argument("--channel-offset", type=int)
    p.add_argument("--fov-count", type=int)
    p.add_argument("--channel-slope", type=float)
    p.add_argument("--channel-intercept", type=int)
    p.add_argument("--aux-file-formats", type=str, nargs="+", const=None)
    p.add_argument("--aux-file-vars", type=str, nargs="+", const=None)
    p.add_argument("--aux-names", type=str, nargs="+", const=None)
    p.add_argument("--aux-cache-read-order", type=str, nargs="+", const=None)
    p.add_argument("--aux-channel-count", type=int, nargs="+", const=None)
    p.add_argument("--aux-channel-slope", type=float, nargs="+", const=None)
    p.add_argument("--aux-channel-intercept", type=float, nargs="+", const=None)

    args = p.parse_args()

    # Every aux option describes the same set of aux views, so all of them must carry the same
    # number of entries (0 when the option was omitted).
    aux_lens = []
    aux_vars = [
        args.aux_file_formats,
        args.aux_file_vars,
        args.aux_names,
        args.aux_cache_read_order,
        args.aux_channel_count,
        args.aux_channel_slope,
        args.aux_channel_intercept,
    ]

    for item in aux_vars:
        if isinstance(item, list):
            aux_lens.append(len(item))
        elif item is not None:
            aux_lens.append(1)
        else:
            aux_lens.append(0)

    if len(set(aux_lens)) > 1:
        print(aux_vars)
        print(aux_lens)
        raise Exception("Dimensions of all aux parameters must match.")

    output_dir = f"tmp/{args.tmp_prefix}/1_pseudosort/"
    output_format = "PseudoCycle{}/MMStack_Pos{}_{}ch{}.ome.tif"
    output_vars = ["round", "fov", "aux_name", "channel"]

    # NOTE(review): yaml.FullLoader is not intended for untrusted documents; these files are
    # assumed to be produced by the pipeline itself -- confirm, or switch to yaml.safe_load.
    with open(args.channel_yml, "r") as fl:
        channels_conv: List[Dict[int, int]] = yaml.load(fl, Loader=yaml.FullLoader)

    with open(args.cycle_yml, "r") as fl:
        cycles_conv: Dict[int, int] = yaml.load(fl, Loader=yaml.FullLoader)

    # One output folder per distinct output round; exist_ok lets a rerun reuse the folders.
    for i in range(len(set(cycles_conv.values()))):
        makedirs("{}PseudoCycle{}".format(output_dir, i), exist_ok=True)

    # Each aux view's variables arrive as one ";"-separated token.  The aux options are None
    # when omitted, which means "no aux views".
    aux_file_vars = [item.split(";") for item in args.aux_file_vars or []]
    aux_cache_read_order = [item.split(";") for item in args.aux_cache_read_order or []]

    reformatter(
        cycles_conv=cycles_conv,
        channels_conv=channels_conv,
        input_dir=args.input_dir,
        file_format=args.file_format,
        output_format=output_format,
        output_vars=output_vars,
        output_dir=output_dir,
        file_vars=args.file_vars,
        fov_count=args.fov_count,
        cache_read_order=args.cache_read_order,
        channel_slope=args.channel_slope,
        channel_intercept=args.channel_intercept,
        fov_offset=args.fov_offset,
        round_offset=args.round_offset,
        channel_offset=args.channel_offset,
        aux_file_formats=args.aux_file_formats or [],
        aux_file_vars=aux_file_vars,
        aux_names=args.aux_names or [],
        aux_cache_read_order=aux_cache_read_order,
        aux_channel_count=args.aux_channel_count or [],
        aux_channel_slope=args.aux_channel_slope or [],
        aux_channel_intercept=args.aux_channel_intercept or [],
    )

    if args.codebook_csv:
        codebook = parse_codebook(args.codebook_csv)
    elif args.codebook_json:
        codebook = Codebook.open_json(args.codebook_json)
    else:
        codebook = None
        print("Can't convert codebook, none provided.")

    # Without a codebook there is nothing to convert; the images above are still written.
    if codebook is not None:
        conv_codebook = convert_codebook(codebook, cycles_conv, channels_conv)
        codebook.to_json(output_dir + "pround_codebook.json")
        conv_codebook.to_json(output_dir + "codebook.json")
273 | 


--------------------------------------------------------------------------------
/docker/baysor/Dockerfile:
--------------------------------------------------------------------------------
 1 | # based on https://github.com/kharchenkolab/Baysor/blob/master/Dockerfile
 2 | # retrieved 2023.01.18
 3 | # version of this image in dockerhub breaks in cwltool due to included CMD line.
 4 | 
 5 | FROM julia:latest
 6 | 
 7 | RUN apt-get update && apt-get install -y build-essential
 8 | 
 9 | ## Jupyter
10 | 
11 | RUN apt-get install -y python3 python3-pip vim
12 | 
13 | RUN pip3 install jupyterlab numpy scipy matplotlib seaborn pandas sklearn scikit-image
14 | 
15 | RUN pip3 install -Iv six==1.12.0
16 | 
17 | RUN julia -e 'using Pkg; Pkg.add("IJulia"); Pkg.build(); using IJulia;'
18 | 
19 | ### jupyter notebook --no-browser --port=8989 --ip=0.0.0.0 --allow-root ./
20 | 
21 | ## Julia Baysor envitonment
22 | ### Ignore cache (https://stackoverflow.com/questions/35134713/disable-cache-for-specific-run-commands)
23 | ARG CACHEBUST=1
24 | RUN julia -e 'using Pkg; Pkg.add(PackageSpec(url="https://github.com/kharchenkolab/Baysor.git"));'
25 | 
26 | ENV LazyModules_lazyload false
27 | 
28 | RUN julia -e 'import Baysor, Pkg; Pkg.activate(dirname(dirname(pathof(Baysor)))); Pkg.instantiate(); Pkg.build();'
29 | RUN echo "export PATH=/root/.julia/bin/:$PATH" >> ~/.bashrc
30 | RUN echo "alias julia='/usr/local/julia/bin/julia --sysimage=/root/.julia/scratchspaces/cc9f9468-1fbe-11e9-0acf-e9460511877c/sysimg/libbaysor.so'" >> ~/.bashrc
31 | RUN ln -s /root/.julia/bin/baysor /usr/local/bin/baysor && chmod +x /root/.julia/bin/baysor
32 | 
33 | CMD ["/bin/bash"]
34 | 


--------------------------------------------------------------------------------
/docker/cellpose/Dockerfile:
--------------------------------------------------------------------------------
#FROM ubuntu:18.04
# Image for running cellpose, built on a pinned miniconda3 base.
FROM continuumio/miniconda3:23.3.1-0

# Create a "cellpose" conda environment with python 3.8 and pyqt.
RUN conda create -y -n cellpose -c andfoy python=3.8 pyqt
# NOTE(review): this activation runs inside its own RUN shell; it presumably does not carry
# over to the RUN lines below, so the pip/conda installs further down may land in the base
# environment rather than in "cellpose" -- confirm.
RUN conda init bash; . /root/.bashrc; conda activate cellpose

# System build tools and libraries.
RUN apt update
RUN apt -y upgrade
RUN apt install -y make gcc build-essential libgtk-3-dev wget git
#RUN apt install -y python3.8-dev python3.8-venv python3-pip

#ENV VIRTUAL_ENV=/opt/venv
#RUN python3.8 -m venv $VIRTUAL_ENV
#ENV PATH="$VIRTUAL_ENV/bin:$PATH"
# Python build prerequisites, installed before cellpose itself.
RUN pip install --upgrade pip
RUN pip install wheel numpy cython
RUN conda install -c conda-forge imagecodecs

# Can't run on GPU inside a cwl, no sense installing this.
#RUN pip install torch cuda-python==11.7

# cellpose is installed from a fork rather than from PyPI.
RUN pip install git+https://www.github.com/nickeener/cellpose.git

CMD ["/bin/bash"]
25 | 


--------------------------------------------------------------------------------
/docker/starfish-custom/Dockerfile:
--------------------------------------------------------------------------------
# Image with the pipeline's python requirements, a starfish fork installed from source, and
# the pipeline scripts and input schemas under /opt.
FROM python:3.8-buster

COPY requirements.txt /opt

# alt installs needed for ARM build
ARG TARGETPLATFORM
RUN if [ "$TARGETPLATFORM" = "linux/arm64" ]; then \
		apt-get update && apt-get install -y libhdf5-dev && rm -rf /var/lib/apt/lists/*; \
	else \
		 echo "Using pip install."; \
	fi

# NOTE(review): pip's cache normally lives under /root/.cache/pip; the /root/cache/.pip path
# removed here may not exist -- confirm.
RUN python3 -m pip install -r /opt/requirements.txt \
 && rm -rf /root/cache/.pip /opt/requirements.txt

# starfish comes from the ctcisar-hubmap branch of a fork, installed via its own Makefile.
RUN git clone --branch ctcisar-hubmap https://github.com/ctcisar/starfish.git
RUN cd /starfish;make install-dev

# The contents of bin/ and input_schemas/ both end up directly in /opt.
COPY bin /opt
COPY input_schemas /opt
RUN chmod +x /opt/*.*

CMD ["/bin/bash"]
24 | 


--------------------------------------------------------------------------------
/docker/starfish-docker-runner/Dockerfile:
--------------------------------------------------------------------------------
# Runner image: a pinned toil base plus a checkout of the pipeline's release branch.
FROM quay.io/ucsc_cgl/toil:5.11.0a1-f6dda143d2bbd1e0a28138263cb34e2deca04377-py3.9

# Keep apt from prompting during the build.
ENV DEBIAN_FRONTEND=noninteractive
RUN apt-get update && apt-get install -y subversion && rm -rf /var/lib/apt/lists/*

RUN git clone --branch release https://github.com/hubmapconsortium/spatial-transcriptomics-pipeline.git
7 | 


--------------------------------------------------------------------------------
/docker/starfish/Dockerfile:
--------------------------------------------------------------------------------
# Image with the pipeline's python requirements and starfish installed from PyPI.
FROM python:3.7-stretch

COPY requirements.txt /opt

# NOTE(review): pip's cache normally lives under /root/.cache/pip; the /root/cache/.pip path
# removed here may not exist -- confirm.
RUN python3 -m pip install -r /opt/requirements.txt \
 && python3 -m pip install starfish \
 && rm -rf /root/cache/.pip /opt/requirements.txt

# The contents of bin/ and input_schemas/ both end up directly in /opt.
COPY bin /opt
COPY input_schemas /opt
RUN chmod +x /opt/*.py

CMD ["/bin/bash"]
14 | 


--------------------------------------------------------------------------------
/docker_images.txt:
--------------------------------------------------------------------------------
1 | #hubmap/starfish docker/starfish/Dockerfile base_directory_build
2 | hubmap/starfish-custom docker/starfish-custom/Dockerfile base_directory_build,platforms=linux/amd64&linux/arm64
3 | hubmap/starfish-docker-runner docker/starfish-docker-runner/Dockerfile base_directory_build,platforms=linux/amd64&linux/arm64
4 | # As of v0.6.0 the build for the baysor docker image is broken.
5 | # Check up on it again later to see if it's working (last update 2023.04.13)
6 | #hubmap/baysor docker/baysor/Dockerfile base_directory_build
7 | hubmap/cellpose docker/cellpose/Dockerfile base_directory_build,platforms=linux/amd64&linux/arm64
8 | 


--------------------------------------------------------------------------------
/input_schemas/cellpose.json:
--------------------------------------------------------------------------------
 1 | [
 2 |     "zplane_count?",
 3 |     "selected_fovs?",
 4 |     "use_mrna?",
 5 |     "pretrained_model_str?",
 6 |     "diameter?",
 7 |     "flow_threshold?",
 8 |     "stitch_threshold?",
 9 |     "cellprob_threshold?",
10 |     "border_buffer?",
11 |     "label_exp_size?",
12 |     "min_allowed_size?",
13 |     "max_allowed_size?",
14 |     "aux_views"
15 | ]
16 | 


--------------------------------------------------------------------------------
/input_schemas/pipeline.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"run_baysor",
 3 | 	"aux_views",
 4 | 	"skip_formatting",
 5 | 	"skip_processing",
 6 | 	"register_aux_view",
 7 | 	"run_cellpose",
 8 | 	{
 9 | 		"fov_positioning":[
10 | 			[
11 | 				"x_locs?",
12 | 				"x_shape?",
13 | 				"x_voxel?",
14 | 				"y_locs?",
15 | 				"y_shape?",
16 | 				"y_voxel?",
17 | 				"z_locs?",
18 | 				"z_shape?",
19 | 				"z_voxel?"
20 | 			]
21 | 		]
22 | 	},
23 | 	"add_blanks",
24 | 	"skip_seg",
25 | 	"skip_qc"
26 | ]
27 | 


--------------------------------------------------------------------------------
/input_schemas/processing.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"fov_count",
 3 | 	"selected_fovs",
 4 | 	"clip_min?",
 5 | 	"clip_max?",
 6 | 	"level_method?",
 7 | 	"rescale?",
 8 | 	"is_volume?",
 9 | 	"register_aux_view?",
10 | 	"register_to_primary?",
11 | 	"channels_per_reg?",
12 | 	"background_view?",
13 | 	"register_background?",
14 | 	"anchor_view?",
15 | 	"high_sigma?",
16 | 	"deconvolve_iter?",
17 | 	"deconvolve_sigma?",
18 | 	"low_sigma?",
19 | 	"rolling_radius?",
20 | 	"match_histogram?",
21 | 	"tophat_radius?",
22 | 	"channel_count",
23 | 	"n_processes?",
24 | 	{
25 | 		"aux_tilesets":[
26 | 			[
27 | 				"aux_names?",
28 | 				"aux_channel_count?"
29 | 			]
30 | 		]
31 | 	}
32 | ]
33 | 


--------------------------------------------------------------------------------
/input_schemas/psortedDefaultParams.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"round_count",
 3 | 	"fov_count",
 4 | 	"channel_count",
 5 | 	"zplane_count",
 6 | 	"cache_read_order",
 7 | 	{
 8 | 		"aux_tilesets": [
 9 | 			[
10 | 				"aux_names?",
11 | 				"aux_cache_read_order?",
12 | 				"aux_channel_count"
13 | 			]
14 | 		]
15 | 	}
16 | ]
17 | 


--------------------------------------------------------------------------------
/input_schemas/qc.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"selected_fovs?",
 3 | 	"find_ripley",
 4 | 	"save_pdf",
 5 | 	{
 6 | 		"fov_positioning" : [
 7 | 			[],
 8 | 			[
 9 | 				"x_shape",
10 | 				"y_shape",
11 | 				"z_shape"
12 | 			]
13 | 		]
14 | 	},
15 | 	{
16 | 		"decoding":[
17 | 			[],
18 | 			[
19 | 				"decode_method?",
20 | 				"magnitude_threshold?",
21 | 				{
22 | 					"decoder": [
23 | 						[],
24 | 						[
25 | 							"min_intensity"
26 | 						]
27 | 					]
28 | 				}
29 | 			]
30 | 		]
31 | 	}
32 | ]
33 | 


--------------------------------------------------------------------------------
/input_schemas/segmentation.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"selected_fovs?",
 3 | 	"aux_name",
 4 | 	{
 5 | 		"binary_mask":[
 6 | 			[],
 7 | 			[
 8 | 				"img_threshold",
 9 | 				"min_dist",
10 | 				"min_allowed_size",
11 | 				"max_allowed_size",
12 | 				"masking_radius"
13 | 			],
14 | 			[
15 | 				"nuclei_view",
16 | 				"cyto_seg",
17 | 				"correct_seg",
18 | 				"border_buffer",
19 | 				"area_thresh",
20 | 				"thresh_block_size",
21 | 				"watershed_footprint_size",
22 | 				"label_exp_size"
23 | 			]
24 | 		]
25 | 	}
26 | ]
27 | 


--------------------------------------------------------------------------------
/input_schemas/sorter.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"round_count",
 3 | 	"fov_count",
 4 | 	"round_offset?",
 5 | 	"fov_offset?",
 6 | 	"channel_offset?",
 7 | 	"channel_slope?",
 8 | 	"file_format",
 9 | 	"file_vars",
10 | 	"cache_read_order",
11 | 	{
12 | 		"aux_tilesets":[
13 | 			[
14 | 				"aux_names?",
15 | 				"aux_file_formats?",
16 | 				"aux_file_vars?",
17 | 				"aux_cache_read_order?",
18 | 				"aux_channel_count?",
19 | 				"aux_channel_slope?",
20 | 				"aux_channel_intercept?"
21 | 			]
22 | 		]
23 | 	}
24 | ]
25 | 


--------------------------------------------------------------------------------
/input_schemas/spaceTxConversion.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"round_count",
 3 | 	"fov_count",
 4 | 	"zplane_count",
 5 | 	"channel_count",
 6 | 	"round_offset?",
 7 | 	"fov_offset?",
 8 | 	"zplane_offset?",
 9 | 	"channel_offset?",
10 | 	"file_format",
11 | 	"file_vars",
12 | 	"cache_read_order",
13 | 	{
14 | 		"aux_tilesets":[
15 | 			[
16 | 				"aux_names?",
17 | 				"aux_file_formats?",
18 | 				"aux_file_vars?",
19 | 				"aux_cache_read_order?",
20 | 				"aux_single_round?",
21 | 				"aux_channel_count?",
22 | 				"aux_channel_slope?",
23 | 				"aux_channel_intercept?"
24 | 			]
25 | 		]
26 | 	},
27 | 	{
28 | 		"fov_positioning":[
29 | 			[
30 | 			],
31 | 			[
32 | 				"x_locs?",
33 | 				"x_shape?",
34 | 				"x_voxel?",
35 | 				"y_locs?",
36 | 				"y_shape?",
37 | 				"y_voxel?",
38 | 				"z_locs?",
39 | 				"z_shape?",
40 | 				"z_voxel?"
41 | 			]
42 | 		]
43 | 	},
44 | 	"add_blanks?"
45 | ]
46 | 


--------------------------------------------------------------------------------
/input_schemas/starfishRunner.json:
--------------------------------------------------------------------------------
 1 | [
 2 | 	"fov_count",
 3 | 	"selected_fovs?",
 4 | 	"level_method?",
 5 | 	"use_ref_img?",
 6 | 	"is_volume?",
 7 | 	"rescale?",
 8 | 	"anchor_view?",
 9 | 	"not_filtered_results?",
10 | 	"n_processes?",
11 | 	"scatter_into_n?",
12 | 	{
13 | 		"decoding":[
14 | 			[
15 | 				"min_sigma?",
16 | 				"max_sigma?",
17 | 				"num_sigma?",
18 | 				"threshold?",
19 | 				"overlap?",
20 | 				"decode_method?",
21 | 				"pnorm?",
22 | 				"distance_threshold?",
23 | 				"magnitude_threshold?",
24 | 				"min_area?",
25 | 				"max_area?",
26 | 				"norm_order?",
27 | 				"composite_decode?",
28 | 				"composite_pmin?",
29 | 				"composite_pmax?",
30 | 				{
31 | 					"decoder":[
32 | 						[
33 | 							
34 | 						],
35 | 						[
36 | 							"trace_building_strategy",
37 | 							"max_distance",
38 | 							"min_intensity",
39 | 							"pnorm?",
40 | 							"norm_order?",
41 | 							"anchor_round?",
42 | 							"search_radius?",
43 | 							"return_original_intensities?"
44 | 						],
45 | 						[
46 | 							"search_radius?",
47 | 							"anchor_round?",
48 | 							"trace_building_strategy"
49 | 						],
50 | 						[
51 | 							"search_radius?",
52 | 							"error_rounds?",
53 | 							"mode",
54 | 							"physical_coords?"
55 | 						]
56 | 					]
57 | 				}
58 | 			]
59 | 		]
60 | 	}
61 | ]
62 | 


--------------------------------------------------------------------------------
/logo.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/hubmapconsortium/spatial-transcriptomics-pipeline/2e31b8ddd4d509c7bbcb983ad41e401687623ddb/logo.png


--------------------------------------------------------------------------------
/pipeline-manifest.json:
--------------------------------------------------------------------------------
  1 | [
  2 | 	"//TODO": "Baysor folders, cellpose folders.",
  3 | 	{
  4 | 		"pattern": "1_pseudosort/PseudoCycle(?P<round>)/MMStack_Pos(?P<FOV>)_(?P<view>)ch(?P<channel>).ome.tif",
  5 | 		"description": "Input images, rearranged into consistent round and channel counts.",
  6 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
  7 | 	},
  8 | 	{
  9 | 		"pattern": "1_pseudosort/(?P<timestamp>)_psorting.log",
 10 | 		"description": "Log of completed operations while round sorting.",
 11 | 		"edam_ontology_term": "EDAM_1.24.data_3671"
 12 | 	},
 13 | 	{
 14 | 		"pattern": "1_pseudosort/codebook.json",
 15 | 		"description": "Codebook that represents the truerounds and truechannels for barcodes.",
 16 | 		"edam_ontology_term": "EDAM_1.24.format_3464"
 17 | 	},
 18 | 	{
 19 | 		"pattern": "1_pseudosort/pround_codebook.json",
 20 | 		"description": "Codebook that represents the pseudorounds and pseudochannels that will be used for decoding.",
 21 | 		"edam_ontology_term": "EDAM_1.24.format_3464"
 22 | 	},
 23 | 	{
 24 | 		"pattern": "2_tx_converted/(?P<view>)-fov_(?P<FOV>)-c(?P<channel>)-r(?P<round>)-z(?P<zslice>).tiff",
 25 | 		"description": "Images saved in spacetx format.",
 26 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 27 | 	},
 28 | 	{
 29 | 		"pattern": "2_tx_converted/(?P<view>)-fov_(?P<FOV>).json",
 30 | 		"description": "spacetx metadata files describing each fov, view combination.",
 31 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 32 | 	},
 33 | 	{
 34 | 		"pattern": "2_tx_converted/(?P<view>).json",
 35 | 		"description": "spacetx metadata files describing each view.",
 36 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 37 | 	},
 38 | 	{
 39 | 		"pattern": "2_tx_converted/codebook.json",
 40 | 		"description": "Codebook that contains round and channel information for barcodes.",
 41 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 42 | 	},
 43 | 	{
 44 | 		"pattern": "2_tx_converted/experiment.json",
 45 | 		"description": "spacetx metadata files describing the entirety of the experiment.",
 46 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 47 | 	},
 48 | 	{
 49 | 		"pattern": "2_tx_converted/(?P<timestamp>)_TXconversion.log",
 50 | 		"description": "Log of completed operations while converting images.",
 51 | 		"edam_ontology_term": "EDAM_1.24.data_3671"
 52 | 	},
 53 | 	{
 54 | 		"pattern": "3_processed/(?P<view>)-fov_(?P<FOV>)-c(?P<channel>)-r(?P<round>)-z(?P<zslice>).tiff",
 55 | 		"description": "Images saved in spacetx format.",
 56 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 57 | 	},
 58 | 	{
 59 | 		"pattern": "3_processed/(?P<view>)-fov_(?P<FOV>).json",
 60 | 		"description": "spacetx metadata files describing each fov, view combination.",
 61 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 62 | 	},
 63 | 	{
 64 | 		"pattern": "3_processed/(?P<view>).json",
 65 | 		"description": "spacetx metadata files describing each view.",
 66 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 67 | 	},
 68 | 	{
 69 | 		"pattern": "3_processed/codebook.json",
 70 | 		"description": "Codebook that contains round and channel information for barcodes.",
 71 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 72 | 	},
 73 | 	{
 74 | 		"pattern": "3_processed/experiment.json",
 75 | 		"description": "spacetx metadata files describing the entirety of the experiment.",
 76 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
 77 | 	},
 78 | 	{
 79 | 		"pattern": "3_processed/(?P<timestamp>)_img_processing.log",
 80 | 		"description": "Log of completed operations while modifying images.",
 81 | 		"edam_ontology_term": "EDAM_1.24.data_3671"
 82 | 	},
 83 | 	{
 84 | 		"pattern": "4_Decoded/cdf/fov_(?P<FOV>)_decoded.cdf",
 85 | 		"description": "netCDF formatted gene table with transcript locations.",
 86 | 		"edam_ontology_term": "EDAM_1.24.format_3650"
 87 | 	},
 88 | 	{
 89 | 		"pattern": "4_Decoded/csv/fov_(?P<FOV>)_decoded.csv",
 90 | 		"description": "csv formatted gene table with transcript locations.",
 91 | 		"edam_ontology_term": "EDAM_1.24.format_3752"
 92 | 	},
 93 | 	{
 94 | 		"pattern": "4_Decoded/spots/fov_(?P<FOV>)_coords_(?P<dimension>).nc",
 95 | 		"description": "FOV positioning information for decoded spots.",
 96 | 		"edam_ontology_term": "EDAM_1.24.format_3650"
 97 | 	},
 98 | 	{
 99 | 		"pattern": "4_Decoded/spots/fov_(?P<FOV>)_SpotFindingResults.json",
100 | 		"description": "Metadata for saved spots.",
101 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
102 | 	},
103 | 	{
104 | 		"pattern": "4_Decoded/spots/fov_(?P<FOV>)_log.arr",
105 | 		"description": "Log of operation history for this FOV's spots.",
106 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
107 | 	},
108 | 	{
109 | 		"pattern": "4_Decoded/spots/fov_(?P<FOV>)_spots_(?P<round>)_(?P<channel>).nc",
110 | 		"description": "Spot data for one round, channel combination.",
111 | 		"edam_ontology_term": "EDAM_1.24.format_3650"
112 | 	},
113 | 	{
114 | 		"pattern": "4_Decoded/(?P<timestamp>)_starfish_runner.log",
115 | 		"description": "Log of completed operations while decoding the experiment.",
116 | 		"edam_ontology_term": "EDAM_1.24.data_3671"
117 | 	},
118 | 	{
119 | 		"pattern": "5_Segmented/fov_(?P<FOV>)/segmentation.csv",
120 | 		"description": "CSV table of transcripts, annotated with location and cell IDs.",
121 | 		"edam_ontology_term": "EDAM_1.24.format_3752"
122 | 	},
123 | 	{
124 | 		"pattern": "5_Segmented/fov_(?P<FOV>)/df_segmented.cdf",
125 | 		"description": "NetCDF table of transcripts, annotated with location and cell IDs.",
126 | 		"edam_ontology_term": "EDAM_1.24.format_3650"
127 | 	},
128 | 	{
129 | 		"pattern": "5_Segmented/fov_(?P<FOV>)/exp_segmented.cdf",
130 | 		"description": "NetCDF Cell x Gene table.",
131 | 		"edam_ontology_term": "EDAM_1.24.format_3650"
132 | 	},
133 | 	{
134 | 		"pattern": "5_Segmented/fov_(?P<FOV>)/exp_segmented.csv",
135 | 		"description": "CSV Cell x Gene table.",
136 | 		"edam_ontology_term": "EDAM_1.24.format_3752"
137 | 	},
138 | 	{
139 | 		"pattern": "5_Segmented/fov_(?P<FOV>)/exp_segmented.h5ad",
140 | 		"description": "Anndata Cell x Gene table.",
141 | 		"edam_ontology_term": "FIXME"
142 | 	},
143 | 	{
144 | 		"pattern": "5_Segmented/fov_(?P<FOV>)/mask.tiff",
145 | 		"description": "A copy of the segmentation mask applied to this FOV",
146 | 		"edam_ontology_term": "EDAM_1.24.format_3591"
147 | 	},
148 | 	{
149 | 		"pattern": "5_Segmented/(?P<timestamp>)_starfish_segmenter.log",
150 | 		"description": "Log of completed operations while segmenting the experiment.",
151 | 		"edam_ontology_term": "EDAM_1.24.data_3671"
152 | 	},
153 | 	{
154 | 		"pattern": "7_QC/(?P<timestamp>)_QC_metrics.log",
155 | 		"description": "Log of completed operations while calculating QC values.",
156 | 		"edam_ontology_term": "EDAM_1.24.data_3671"
157 | 	},
158 | 	{
159 | 		"pattern": "7_QC/QC_results.yml",
160 | 		"description": "Complete human-readable set of QC values.",
161 | 		"edam_ontology_term": "EDAM_1.24.data_3750"
162 | 	},
163 | 	{
164 | 		"pattern": "7_QC/fov_(?P<FOV>)_graph_output.pdf",
165 | 		"description": "Visual plots of QC metrics.",
166 | 		"edam_ontology_term": "EDAM_1.24.data_3508"
167 | 	},
168 | 	{
169 | 		"pattern": "7_QC/fov_combined_graph_output.pdf",
170 | 		"description": "Visual plots of QC metrics, combined across all FOVs.",
171 | 		"edam_ontology_term": "EDAM_1.24.data_3508"
172 | 	}
173 | ]
174 | 


--------------------------------------------------------------------------------
/pyproject.toml:
--------------------------------------------------------------------------------
1 | [tool.black]
2 | line-length = 99
3 | 
4 | [tool.isort]
5 | profile = "black"
6 | multi_line_output = 3
7 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
 1 | numpy
 2 | scikit-image==0.18.3
 3 | tqdm
 4 | anndata
 5 | astropy
 6 | tifffile
 7 | matplotlib
 8 | opencv-python-headless==4.6.0.66
 9 | pyro-ppl
10 | 


--------------------------------------------------------------------------------
/requirements_test.txt:
--------------------------------------------------------------------------------
1 | black>=22.3.0
2 | isort
3 | 


--------------------------------------------------------------------------------
/steps/baysor.cwl:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env cwl-runner
 2 | 
 3 | class: CommandLineTool
 4 | cwlVersion: v1.2
 5 | baseCommand: ["baysor","run"]
 6 | 
 7 | requirements:
 8 |   DockerRequirement:
 9 |     dockerPull: vpetukhov/baysor@sha256:ce58af2bbd81ca29f7382497223afe9dbfbcc674e810155964722b447b676087
10 |     #dockerPull: hubmap/baysor:latest
11 | 
12 | inputs:
13 |   csv:
14 |     type: File
15 |     inputBinding:
16 |       position: 5
17 |     doc: csv with transcript information
18 |   priors:
19 |     type: File?
20 |     inputBinding:
21 |       position: 6
22 |     doc: Binary Mask image with prior segmentation.
23 |   scale:
24 |     type: int?
25 |     inputBinding:
26 |       position: 1
27 |       prefix: -s
28 |     doc: Expected scale equal to cell radius in the same units as x, y, and z.
29 |   x_col:
30 |     type: string?
31 |     inputBinding:
32 |       position: 2
33 |       prefix: -x
34 |     doc: Name of the column with x information
35 |     default: x
36 |   y_col:
37 |     type: string?
38 |     inputBinding:
39 |       position: 3
40 |       prefix: -y
41 |     default: y
42 |     doc: Name of the column with y information
43 |   gene_col:
44 |     type: string?
45 |     inputBinding:
46 |       position: 4
47 |       prefix: --gene
48 |     default: target
49 |     doc: Name of the column with gene names
50 | 
51 | outputs:
52 |   segmented:
53 |     type: File[]
54 |     outputBinding:
55 |       glob: "segmentation*"
56 | 
57 | stdout: baysor_stdout.log
58 | 


--------------------------------------------------------------------------------
/steps/baysorStaged.cwl:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env cwl-runner
 2 | 
 3 | class: Workflow
 4 | cwlVersion: v1.2
 5 | requirements:
 6 |   ScatterFeatureRequirement: {}
 7 | inputs:
 8 |   segmented: Directory
 9 | outputs:
10 |   baysor:
11 |     type: Directory
12 |     outputSource: restage/pool_dir
13 | 
14 | steps:
15 |   stage:
16 |     run:
17 |       class: CommandLineTool
18 |       baseCommand: [ls]
19 |       requirements:
20 |         DockerRequirement:
21 |           dockerPull: ubuntu:latest
22 |         InitialWorkDirRequirement:
23 |           listing:
24 |             - $(inputs.segDir)
25 |       inputs:
26 |         segDir:
27 |           type: Directory
28 |           doc: Directory with output from starfish segmentation step.
29 |       outputs:
30 |         csvs:
31 |           type:
32 |             type: array
33 |             items: File
34 |           outputBinding:
35 |             glob: "**/**/segmentation.csv"
36 |         priors:
37 |           type:
38 |             type: array
39 |             items: File
40 |           outputBinding:
41 |             glob: "**/**/mask.tiff"
42 |     in:
43 |       segDir: segmented
44 |     out: [csvs, priors]
45 |   baysor_run:
46 |     run: baysor.cwl
47 |     in:
48 |       csv: stage/csvs
49 |       priors: stage/priors
50 |     scatter: [csv, priors]
51 |     scatterMethod: dotproduct
52 |     out: [segmented]
53 |   restage:
54 |     run:
55 |       class: ExpressionTool
56 |       requirements:
57 |         InlineJavascriptRequirement: {}
58 |       inputs:
59 |         file_array:
60 |           type:
61 |             type: array
62 |             items:
63 |               type: array
64 |               items: File
65 |       outputs:
66 |         pool_dir: Directory
67 |       expression: |
68 |         ${ var dir = [];
69 |            for(var i=0;i<inputs.file_array.length; i++){
70 |              dir.push({"class": "Directory", "basename": "fov_"+String(i).padStart(5,'0'), "listing": inputs.file_array[i]});
71 |            }
72 |            return {"pool_dir": {
73 |              "class": "Directory",
74 |              "basename": "6_Baysor",
75 |              "listing": dir}
76 |            }; }
77 |     in:
78 |       file_array: baysor_run/segmented
79 |     out: [pool_dir]
80 | 


--------------------------------------------------------------------------------
/steps/cellpose.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 | 
 12 | inputs:
 13 |   exp_loc:
 14 |     type: Directory
 15 |     doc: Root directory containing space_tx formatted experiment
 16 | 
 17 |   dir_size:
 18 |     type: long?
 19 |     doc: Size of tiffs, in MiB. If provided, will be used to calculate ResourceRequirement.
 20 | 
 21 |   decoded_loc:
 22 |     type: Directory?
 23 |     doc: Location of directory that is output from the starfishRunner step, only needed if mRNA information is to be included.
 24 | 
 25 |   use_mrna:
 26 |     type: boolean?
 27 |     doc: If true and decoded_loc is provided, mrna data will be used in calculations.
 28 | 
 29 |   parameter_json:
 30 |     type: File?
 31 |     doc: json containing step parameters.
 32 | 
 33 |   selected_fovs:
 34 |     type: int[]?
 35 |     doc: If provided, segmentation will only be run on FOVs with these indices.
 36 | 
 37 |   zplane_count:
 38 |     type: int?
 39 |     doc: The number of z-planes in each image. All that matters is whether this is equal to 1 or not, retaining the same var name as conversion for simplification.
 40 | 
 41 |   aux_views:
 42 |     type: string[]?
 43 |     doc: The views to use for cellpose segmentation.
 44 | 
 45 |   pretrained_model_str:
 46 |     type: string?
 47 |     doc: Cellpose-provided model to use.
 48 | 
 49 |   pretrained_model_dir:
 50 |     type: File?
 51 |     doc: Manually trained cellpose model to use.
 52 | 
 53 |   diameter:
 54 |     type: float?
 55 |     doc: Expected diameter of cells. Should be 0 if a custom model is used.
 56 | 
 57 |   flow_threshold:
 58 |     type: float?
 59 |     doc: threshold for filtering cell segmentations (increasing this will filter out lower confidence segmentations), range is 0 to infinity
 60 | 
 61 |   stitch_threshold:
 62 |     type: float?
 63 |     doc: threshold for stitching together segmentations that occur at the same xy location but in adjacent z slices, range is 0 to 1. This should only be used when the image is 3D.
 64 | 
 65 |   cellprob_threshold:
 66 |     type: float?
 67 |     doc: determines the extent of the segmentations (0 is the default; more negative values result in larger cells, more positive values result in smaller cells), range is -6 to 6.
 68 | 
 69 |   border_buffer:
 70 |     type: int?
 71 |     doc: If not None, removes cytoplasms whose nuclei lie within the given distance from the border.
 72 | 
 73 |   label_exp_size:
 74 |     type: int?
 75 |     doc: Pixel size labels are dilated by in final step. Helpful for closing small holes that are common from thresholding but can also cause cell boundaries to exceed their true boundaries if set too high. Label dilation respects label borders and does not mix labels.
 76 | 
 77 |   min_allowed_size:
 78 |     type: int?
 79 |     doc: minimum size for a cell (in pixels)
 80 | 
 81 |   max_allowed_size:
 82 |     type: int?
 83 |     doc: maximum size for a cell (in pixels)
 84 | 
 85 | outputs:
 86 |   cellpose_input:
 87 |     type: Directory
 88 |     outputSource: execute_cellpose_prep/cellpose_input
 89 |   cellpose_output:
 90 |     type: Directory
 91 |     outputSource: execute_cellpose/cellpose_output
 92 |   cellpose_filtered:
 93 |     type: Directory
 94 |     outputSource: execute_filtering/cellpose_filtered
 95 | 
 96 | steps:
 97 | 
 98 |   tmpname:
 99 |     run: tmpdir.cwl
100 |     in: []
101 |     out: [tmp]
102 | 
103 |   read_schema:
104 |     run:
105 |       class: CommandLineTool
106 |       baseCommand: cat
107 | 
108 |       requirements:
109 |         DockerRequirement:
110 |           dockerPull: hubmap/starfish-custom:latest
111 |         ResourceRequirement:
112 |           ramMin: 1000
113 |           tmpdirMin: 1000
114 |           outdirMin: 1000
115 | 
116 |       inputs:
117 |         schema:
118 |           type: string
119 |           inputBinding:
120 |             position: 1
121 | 
122 |       outputs:
123 |         data:
124 |           type: stdout
125 | 
126 |     in:
127 |       schema:
128 |         valueFrom: "/opt/cellpose.json"
129 |     out: [data]
130 | 
131 |   stage_cellpose:
132 |     run: inputParser.cwl
133 |     in:
134 |       datafile: parameter_json
135 |       schema: read_schema/data
136 |     out: [use_mrna, zplane_count, selected_fovs, pretrained_model_str, diameter, flow_threshold, stitch_threshold, cellprob_threshold,  border_buffer, label_exp_size, min_allowed_size, max_allowed_size, aux_views]
137 |     when: $(inputs.datafile != null)
138 | 
139 |   execute_cellpose_prep:
140 |     run:
141 |       class: CommandLineTool
142 |       baseCommand: /opt/cellposeStaging.py
143 | 
144 |       requirements:
145 |         InitialWorkDirRequirement:
146 |           listing:
147 |             - entryname: "$('input_dir_'+inputs.tmp_prefix)"
148 |               writable: true
149 |               entry: "$(inputs.exp_loc)"
150 |         DockerRequirement:
151 |           dockerPull: hubmap/starfish-custom:latest
152 |         ResourceRequirement:
153 |           tmpdirMin: |
154 |             ${
155 |               if(inputs.dir_size === null) {
156 |                 return null;
157 |               } else {
158 |                 return inputs.dir_size;
159 |               }
160 |             }
161 |           outdirMin: |
162 |             ${
163 |               return 1000;
164 |             }
165 | 
166 |       inputs:
167 |         dir_size:
168 |           type: long?
169 | 
170 |         tmp_prefix:
171 |           type: string
172 |           inputBinding:
173 |             prefix: --tmp-prefix
174 | 
175 |         exp_loc:
176 |           type: Directory
177 |           doc: Root directory containing space_tx formatted experiment
178 | 
179 |         exp_loc_staged:
180 |           type: string
181 |           inputBinding:
182 |             prefix: --input-dir
183 | 
184 |         decoded_loc:
185 |           type: Directory?
186 |           doc: Location of directory that is output from the starfishRunner step.
187 |           inputBinding:
188 |             prefix: --decoded-dir
189 | 
190 |         selected_fovs:
191 |           type: int[]?
192 |           doc: If provided, segmentation will only be run on FOVs with these indices.
193 |           inputBinding:
194 |             prefix: --selected-fovs
195 | 
196 |         aux_views:
197 |           type: string[]?
198 |           doc: The views to use for cellpose segmentation.
199 |           inputBinding:
200 |             prefix: --aux-views
201 | 
202 |         format:
203 |           type: boolean
204 |           doc: Used to specify method in python script
205 |           default: true
206 |           inputBinding:
207 |             prefix: --format
208 | 
209 |       outputs:
210 |         cellpose_input:
211 |           type: Directory
212 |           outputBinding:
213 |             glob: $("tmp/" + inputs.tmp_prefix + "/5A_cellpose_input/")
214 |     in:
215 |       dir_size: dir_size
216 |       tmp_prefix: tmpname/tmp
217 |       exp_loc: exp_loc
218 |       exp_loc_staged:
219 |         valueFrom: $("input_dir_" + inputs.tmp_prefix)
220 |       decoded_loc:
221 |         source: [decoded_loc, stage_cellpose/use_mrna, use_mrna]
222 |         valueFrom: |
223 |           ${
224 |             if(self[1] || self[2]){
225 |               return self[0];
226 |             } else {
227 |               return null;
228 |             }
229 |           }
230 |       selected_fovs:
231 |         source: [stage_cellpose/selected_fovs, selected_fovs]
232 |         valueFrom: |
233 |           ${
234 |             if(self[0]){
235 |               return self[0];
236 |             } else if(self[1]) {
237 |               return self[1];
238 |             } else {
239 |               return null;
240 |             }
241 |           }
242 |       aux_views:
243 |         source: [stage_cellpose/aux_views, aux_views]
244 |         valueFrom: |
245 |           ${
246 |             if(self[0]){
247 |               return self[0];
248 |             } else if(self[1]) {
249 |               return self[1];
250 |             } else {
251 |               return null;
252 |             }
253 |           }
254 |     out: [cellpose_input]
255 | 
256 |   execute_cellpose:
257 |     run:
258 |       class: CommandLineTool
259 |       baseCommand: ["cellpose"]
260 | 
261 |       requirements:
262 |         DockerRequirement:
263 |           dockerPull: hubmap/cellpose:latest
264 |         InitialWorkDirRequirement:
265 |           listing:
266 |             - entry: $(inputs.input_dir)
267 |               writable: true
268 | 
269 |       inputs:
270 |         verbose:
271 |           type: boolean?
272 |           inputBinding:
273 |             prefix: --verbose
274 |           default: true
275 |           doc: Enables verbose output
276 | 
277 |         input_dir:
278 |           type: Directory
279 |           inputBinding:
280 |             prefix: --dir
281 | #            valueFrom: $(self.basename)
282 |           doc: Input directory for cellpose
283 | 
284 |         img_filter:
285 |           type: string
286 |           inputBinding:
287 |             prefix: --img_filter
288 |           default: _image
289 |           doc: Glob filter for input
290 | 
291 |         z_axis:
292 |           type: int?
293 |           inputBinding:
294 |             prefix: --z_axis
295 |           doc: 0 if image is not flat, unset if flat.
296 | 
297 |         channel_axis:
298 |           type: int?
299 |           inputBinding:
300 |             prefix: --channel_axis
301 |           doc: 1 if image is not flat, 0 if flat.
302 | 
303 |         all_channels:
304 |           type: boolean?
305 |           inputBinding:
306 |             prefix: --all_channels
307 |           default: true
308 |           doc: Tells cellpose to use all channels in the order they appear
309 | 
310 |         save_tif:
311 |           type: boolean?
312 |           inputBinding:
313 |             prefix: --save_tif
314 |           default: true
315 |           doc: Tells cellpose to save images as a tif, instead of defaulting to png
316 | 
317 |         savedir:
318 |           type: string?
319 |           inputBinding:
320 |             prefix: --savedir
321 |           default: "5B_cellpose_output"
322 |           doc: Name of directory to save to.
323 | 
324 |         pretrained_model_str:
325 |           type: string?
326 |           inputBinding:
327 |             prefix: --pretrained_model
328 |           doc: Cellpose-provided model to use.
329 | 
330 |         pretrained_model_dir:
331 |           type: File?
332 |           inputBinding:
333 |             prefix: --pretrained_model
334 |           doc: Manually trained cellpose model to use.
335 | 
336 |         diameter:
337 |           type: float?
338 |           inputBinding:
339 |             prefix: --diameter
340 |           doc: Expected diameter of cells. Should be 0 if a custom model is used.
341 | 
342 |         flow_threshold:
343 |           type: float?
344 |           inputBinding:
345 |             prefix: --flow_threshold
346 |           default: 0.4
347 |           doc: threshold for filtering cell segmentations (increasing this will filter out lower confidence segmentations), range is 0 to infinity
348 | 
349 |         stitch_threshold:
350 |           type: float?
351 |           inputBinding:
352 |             prefix: --stitch_threshold
353 |           doc: threshold for stitching together segmentations that occur at the same xy location but in adjacent z slices, range is 0 to 1. This should only be used when the image is 3D.
354 | 
355 |         cellprob_threshold:
356 |           type: float?
357 |           inputBinding:
358 |             prefix: --cellprob_threshold
359 |           doc: determines the extent of the segmentations (0 is the default; more negative values result in larger cells, more positive values result in smaller cells), range is -6 to 6.
360 | 
361 |         net_avg:
362 |           type: boolean?
363 |           inputBinding:
364 |             prefix: --net_avg
365 |           default: true
366 |           doc: tells cellpose to calculate 4 nets and take the average, improves performance.
367 | 
368 |       outputs:
369 |         log:
370 |           type: stdout
371 |         cellpose_output:
372 |           type: Directory
373 |           outputBinding:
374 |             glob: "5B_cellpose_output"
375 | 
376 |     in:
377 |       input_dir: execute_cellpose_prep/cellpose_input
378 |       z_axis:
379 |         source: [stage_cellpose/zplane_count, zplane_count]
380 |         valueFrom: |
381 |           ${
382 |             if(self[0]){
383 |               if(self[0] > 1){
384 |                 return 0;
385 |               } else {
386 |                 return null;
387 |               }
388 |             } else {
389 |               if(self[1] > 1){
390 |                 return 0;
391 |               } else {
392 |                 return null;
393 |               }
394 |             }
395 |           }
396 |       channel_axis:
397 |         source: [stage_cellpose/zplane_count, zplane_count]
398 |         valueFrom: |
399 |           ${
400 |             if(self[0]){
401 |               if(self[0] > 1){
402 |                 return 1;
403 |               } else {
404 |                 return 0;
405 |               }
406 |             } else {
407 |               if(self[1] > 1){
408 |                 return 1;
409 |               } else {
410 |                 return 0;
411 |               }
412 |             }
413 |           }
414 |       pretrained_model_str:
415 |         source: [stage_cellpose/pretrained_model_str, pretrained_model_str]
416 |         valueFrom: |
417 |           ${
418 |             if(self[0]){
419 |               return self[0];
420 |             } else if(self[1]) {
421 |               return self[1];
422 |             } else {
423 |               return null;
424 |             }
425 |           }
426 |       pretrained_model_dir: pretrained_model_dir
427 |       diameter:  # forced to 0 when a custom model file is given; otherwise parameter_json value, then workflow input
428 |         source: [stage_cellpose/diameter, diameter, pretrained_model_dir]  # null checks below keep an explicit 0 instead of dropping it
429 |         valueFrom: |
430 |           ${
431 |             if(self[2]){
432 |               return 0;
433 |             } else if(self[0] != null){
434 |               return self[0];
435 |             } else if(self[1] != null) {
436 |               return self[1];
437 |             } else {
438 |               return null;
439 |             }
440 |           }
441 |       flow_threshold:  # parameter_json value (stage_cellpose) takes precedence over the workflow-level input
442 |         source: [stage_cellpose/flow_threshold, flow_threshold]  # null checks below keep an explicit 0 instead of dropping it
443 |         valueFrom: |
444 |           ${
445 |             if(self[0] != null){
446 |               return self[0];
447 |             } else if(self[1] != null) {
448 |               return self[1];
449 |             } else {
450 |               return null;
451 |             }
452 |           }
453 |       stitch_threshold:  # suppressed when either zplane_count source equals 1; otherwise parameter_json value, then workflow input
454 |         source: [stage_cellpose/stitch_threshold, stitch_threshold, stage_cellpose/zplane_count, zplane_count]  # null checks below keep an explicit 0
455 |         valueFrom: |
456 |           ${
457 |             if(self[2] == 1 || self[3] == 1){
458 |               return null;
459 |             }
460 |             if(self[0] != null){
461 |               return self[0];
462 |             } else if(self[1] != null) {
463 |               return self[1];
464 |             } else {
465 |               return null;
466 |             }
467 |           }
468 |       cellprob_threshold:  # parameter_json value (stage_cellpose) takes precedence over the workflow-level input
469 |         source: [stage_cellpose/cellprob_threshold, cellprob_threshold]  # null checks below keep an explicit 0 instead of dropping it
470 |         valueFrom: |
471 |           ${
472 |             if(self[0] != null){
473 |               return self[0];
474 |             } else if(self[1] != null) {
475 |               return self[1];
476 |             } else {
477 |               return null;
478 |             }
479 |           }
480 |     out: [cellpose_output]
481 | 
482 |   execute_filtering:
483 |     run:  # Inline tool definition that invokes /opt/cellposeStaging.py
484 |       class: CommandLineTool
485 |       baseCommand: /opt/cellposeStaging.py
486 | 
487 |       requirements:
488 |         DockerRequirement:
489 |             dockerPull: hubmap/starfish-custom:latest
490 |         ResourceRequirement:
491 |           tmpdirMin: |
492 |             ${
493 |               if(inputs.dir_size === null) {
494 |                 return null; // no explicit request when dir_size is not supplied
495 |               } else {
496 |                 return inputs.dir_size * 4; // request four times dir_size
497 |               }
498 |             }
499 |           outdirMin: |
500 |             ${
501 |               if(inputs.dir_size === null) {
502 |                 return null; // same rule as tmpdirMin
503 |               } else {
504 |                 return inputs.dir_size * 4;
505 |               }
506 |             }
507 | 
508 |       inputs:
509 |         dir_size:  # No inputBinding: only read by the ResourceRequirement expressions.
510 |           type: long?
511 | 
512 |         tmp_prefix:  # Also used to build the output glob path below.
513 |           type: string
514 |           inputBinding:
515 |             prefix: --tmp-prefix
516 | 
517 |         input_loc:
518 |           type: Directory
519 |           doc: Output from cellpose.
520 |           inputBinding:
521 |             prefix: --input-dir
522 | 
523 |         selected_fovs:
524 |           type: int[]?
525 |           doc: If provided, segmentation will only be run on FOVs with these indices.
526 |           inputBinding:
527 |             prefix: --selected-fovs
528 | 
529 |         border_buffer:
530 |           type: int?
531 |           doc: If not None, removes cytoplasms whose nuclei lie within the given distance from the border.
532 |           inputBinding:
533 |             prefix: --border-buffer
534 | 
535 |         label_exp_size:
536 |           type: int?
537 |           doc: Pixel size labels are dilated by in final step. Helpful for closing small holes that are common from thresholding but can also cause cell boundaries to exceed their true boundaries if set too high. Label dilation respects label borders and does not mix labels.
538 |           inputBinding:
539 |             prefix: --label-exp-size
540 | 
541 |         max_allowed_size:
542 |           type: int?
543 |           doc: maximum size for a cell (in pixels)
544 |           inputBinding:
545 |             prefix: --max-size
546 | 
547 |         min_allowed_size:
548 |           type: int?
549 |           doc: minimum size for a cell (in pixels)
550 |           inputBinding:
551 |             prefix: --min-size
552 | 
553 |         filter:  # Not listed under this step's "in", so the default below always applies.
554 |           type: boolean
555 |           doc: Used to specify method in python script
556 |           default: true
557 |           inputBinding:
558 |             prefix: --filter
559 | 
560 |       outputs:
561 |         cellpose_filtered:
562 |           type: Directory
563 |           outputBinding:  # Collects the 5C_cellpose_filtered directory under tmp/<tmp_prefix>/.
564 |             glob: $("tmp/" + inputs.tmp_prefix + "/5C_cellpose_filtered")
565 | 
566 |     in:
567 |       dir_size: dir_size
568 |       tmp_prefix: tmpname/tmp
569 |       input_loc: execute_cellpose/cellpose_output
570 |       selected_fovs:
571 |         source: [stage_cellpose/selected_fovs, selected_fovs]
572 |         valueFrom: |
573 |           ${
574 |             // First truthy candidate wins: the stage_cellpose value,
575 |             // then the workflow-level input; otherwise null.
576 |             var staged = self[0];
577 |             var direct = self[1];
578 |             if(staged){ return staged; }
579 |             if(direct){ return direct; }
580 |             return null;
581 |           }
582 |       border_buffer:
583 |         source: [stage_cellpose/border_buffer, border_buffer]
584 |         valueFrom: |
585 |           ${
586 |             // Compare against null rather than truthiness so an explicit 0 is kept.
587 |             if(self[0] != null){
588 |               return self[0];
589 |             } else if(self[1] != null) {
590 |               return self[1];
591 |             }
592 |             return null;
593 |           }
594 |       label_exp_size:
595 |         source: [stage_cellpose/label_exp_size, label_exp_size]
596 |         valueFrom: |
597 |           ${
598 |             // Compare against null rather than truthiness so an explicit 0 is kept.
599 |             if(self[0] != null){
600 |               return self[0];
601 |             } else if(self[1] != null) {
602 |               return self[1];
603 |             }
604 |             return null;
605 |           }
606 |       min_allowed_size:
607 |         source: [stage_cellpose/min_allowed_size, min_allowed_size]
608 |         valueFrom: |
609 |           ${
610 |             // Compare against null rather than truthiness so an explicit 0 is kept.
611 |             if(self[0] != null){
612 |               return self[0];
613 |             } else if(self[1] != null) {
614 |               return self[1];
615 |             }
616 |             return null;
617 |           }
618 |       max_allowed_size:
619 |         source: [stage_cellpose/max_allowed_size, max_allowed_size]
620 |         valueFrom: |
621 |           ${
622 |             // Compare against null rather than truthiness so an explicit 0 is kept.
623 |             if(self[0] != null){
624 |               return self[0];
625 |             } else if(self[1] != null) {
626 |               return self[1];
627 |             }
628 |             return null;
629 |           }
630 |     out: [cellpose_filtered]
631 | 


--------------------------------------------------------------------------------
/steps/fileSizer.cwl:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env cwl-runner
 2 | cwlVersion: v1.2
 3 | class: Workflow
 4 | requirements:
 5 |   MultipleInputFeatureRequirement: {}
 6 |   InlineJavascriptRequirement: {}
 7 | 
 8 | inputs:
 9 |   example_dir:
10 |     type: Directory
11 | 
12 | outputs:
13 |   dir_size:
14 |     type: long
15 |     outputSource: formatter/dir_size
16 | 
17 | steps:
18 |   size_dir:  # Runs `du -s --block-size=1MiB` on example_dir and captures its stdout.
19 |     run:
20 |       class: CommandLineTool
21 |       requirements:
22 |         DockerRequirement:
23 |           dockerPull: hubmap/starfish-custom:latest
24 |         InitialWorkDirRequirement:
25 |           listing:
26 |             - $(inputs.example_dir)
27 |       baseCommand: ["du", "-s", "--block-size=1MiB"]
28 |       inputs:
29 |         example_dir:
30 |           type: Directory
31 |           inputBinding:
32 |             position: 0
33 |       outputs:
34 |         dir_size:
35 |           type: stdout  # raw du output; parsed by the formatter step
36 |     in:
37 |       example_dir: example_dir
38 |     out: [dir_size]
39 | 
40 |   formatter:  # Converts the captured output of size_dir into the numeric dir_size.
41 |     run:
42 |       class: ExpressionTool
43 |       requirements:
44 |         InlineJavascriptRequirement: {}
45 |       expression: |
46 |         ${ // take the text before the first tab and convert it to a number
47 |           return {dir_size: Number(inputs.len_str.contents.split("\t")[0])}
48 |         }
49 |       inputs:
50 |         len_str:
51 |           type: File
52 |           loadContents: true  # the expression reads len_str.contents
53 |       outputs:
54 |         dir_size:
55 |           type: long
56 |     in:
57 |       len_str: size_dir/dir_size
58 |     out: [dir_size]
59 | 


--------------------------------------------------------------------------------
/steps/inputParser.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | cwlVersion: v1.0
  3 | class: ExpressionTool
  4 | 
  5 | requirements:
  6 |   InlineJavascriptRequirement: {}
  7 |   ResourceRequirement:
  8 |     ramMin: 1000
  9 |     tmpdirMin: 1000
 10 |     outdirMin: 1000
 11 | 
 12 | inputs:
 13 |   datafile:
 14 |     type: File
 15 |     inputBinding:
 16 |       loadContents: true
 17 | 
 18 |   schema:
 19 |     type: File
 20 |     inputBinding:
 21 |       loadContents: true
 22 | 
 23 | # all possible outputs from tool must be listed here.
 24 | # not every output needs to be present in workflows that call this.
 25 | outputs:
 26 |   round_count: int
 27 |   zplane_count: int
 28 |   channel_count: int
 29 |   fov_count: int
 30 |   round_offset: int
 31 |   fov_offset: int
 32 |   zplane_offset: int
 33 |   channel_offset: int
 34 |   channel_slope: float
 35 |   file_format: string
 36 |   file_vars: string[]
 37 |   cache_read_order: string[]
 38 |   aux_tilesets_aux_names: string[]
 39 |   aux_tilesets_aux_file_formats: string[]
 40 |   aux_tilesets_aux_file_vars: string[]
 41 |   aux_tilesets_aux_cache_read_order: string[]
 42 |   aux_tilesets_aux_single_round: string[]
 43 |   aux_tilesets_aux_channel_count: float[]
 44 |   aux_tilesets_aux_channel_slope: float[]
 45 |   aux_tilesets_aux_channel_intercept: int[]
 46 |   fov_positioning_x_locs: string
 47 |   fov_positioning_x_shape: int
 48 |   fov_positioning_x_voxel: float
 49 |   fov_positioning_y_locs: string
 50 |   fov_positioning_y_shape: int
 51 |   fov_positioning_y_voxel: float
 52 |   fov_positioning_z_locs: string
 53 |   fov_positioning_z_shape: int
 54 |   fov_positioning_z_voxel: float
 55 |   add_blanks: boolean
 56 |   skip_formatting: boolean
 57 |   skip_processing: boolean
 58 |   selected_fovs: int[]
 59 |   clip_min: float
 60 |   clip_max: float
 61 |   level_method: string
 62 |   register_aux_view: string
 63 |   register_to_primary: boolean
 64 |   channels_per_reg: int
 65 |   background_view: string
 66 |   register_background: boolean
 67 |   anchor_view: string
 68 |   high_sigma: int
 69 |   deconvolve_iter: int
 70 |   deconvolve_sigma: int
 71 |   low_sigma: int
 72 |   rolling_radius: int
 73 |   match_histogram: boolean
 74 |   tophat_radius: int
 75 |   use_ref_img: boolean
 76 |   is_volume: boolean
 77 |   rescale: boolean
 78 |   not_filtered_results: boolean
 79 |   n_processes: int
 80 |   scatter_into_n: int
 81 |   decoding_min_sigma: float[]
 82 |   decoding_max_sigma: float[]
 83 |   decoding_num_sigma: int
 84 |   decoding_threshold: float
 85 |   decoding_overlap: float
 86 |   decoding_decode_method: string
 87 |   decoding_decoder_trace_building_strategy: string
 88 |   decoding_decoder_max_distance: float
 89 |   decoding_decoder_min_intensity: float
 90 |   decoding_decoder_pnorm: int
 91 |   decoding_decoder_norm_order: int
 92 |   decoding_decoder_anchor_round: int
 93 |   decoding_decoder_search_radius: int
 94 |   decoding_decoder_return_original_intensities: boolean
 95 |   decoding_decoder_error_rounds: int
 96 |   decoding_decoder_mode: string
 97 |   decoding_decoder_physical_coords: boolean
 98 |   decoding_pnorm: int
 99 |   decoding_distance_threshold: float
100 |   decoding_magnitude_threshold: float
101 |   decoding_min_area: int
102 |   decoding_max_area: int
103 |   decoding_norm_order: int
104 |   decoding_composite_decode: boolean
105 |   decoding_composite_pmin: float
106 |   decoding_composite_pmax: float
107 |   skip_seg: boolean
108 |   run_cellpose: boolean
109 |   use_mrna: boolean
110 |   pretrained_model_str: string
111 |   diameter: float
112 |   flow_threshold: float
113 |   stitch_threshold: float
114 |   cellprob_threshold: float
115 |   border_buffer: int
116 |   label_exp_size: int
117 |   min_allowed_size: int
118 |   max_allowed_size: int
119 |   aux_views: string[]
120 |   aux_name: string
121 |   binary_mask_img_threshold: float
122 |   binary_mask_min_dist: int
123 |   binary_mask_min_allowed_size: int
124 |   binary_mask_max_allowed_size: int
125 |   binary_mask_masking_radius: int
126 |   binary_mask_nuclei_view: string
127 |   binary_mask_cyto_seg: string
128 |   binary_mask_correct_seg: boolean
129 |   binary_mask_border_buffer: int
130 |   binary_mask_area_thresh: float
131 |   binary_mask_thresh_block_size: int
132 |   binary_mask_watershed_footprint_size: int
133 |   binary_mask_label_exp_size: int
134 |   run_baysor: boolean
135 |   skip_qc: boolean
136 |   find_ripley: boolean
137 |   save_pdf: boolean
138 | 
139 | # The input schema describes the expected layout of variables in JSON format.
140 | # Inputs are stored in an array.
141 | # Any items that are treated as records for CWL input are stored in an object, where the key is the prefix applied to all items in the object.
142 | # The value in an object is an array or an array of arrays.
143 | # If the value is an array of arrays, the sub-array with the closest match is used, i.e. the sub-arrays are mutually exclusive.
144 | # All items in an object's array must be included in the JSON file, unless the item ends with a question mark.
145 | # Objects can be nested inside other objects, and all of their prefixes will apply to all items.
146 | expression: |
147 |   ${   var data = JSON.parse(inputs.datafile.contents);
148 |        var schema = JSON.parse(inputs.schema.contents);
149 |        function enforce_record(data, key, items, output_dict){ // writes "<key>_<item>" entries for one schema record into output_dict
150 |            if(Array.isArray(items[0])){
151 |                 // Record where one of a mutually exclusive set of sublists is defined
152 |                 // Find closest match and enforce that
153 |                 var subind = 0;
154 |                 var coverage = 0.0;
155 |                 for(var i=0;i<items.length;i++){
156 |                         var tally = 0.0; // number of plain items of this sub-list found in data
157 |                         for(var j=0;j<items[i].length;j++){
158 |                                 if(items[i][j].constructor != Object){
159 |                                         var subkey = items[i][j].replace("?","");
160 |                                         if(subkey in data){
161 |                                                 tally++;
162 |                                         }
163 |                                         // we want to define this key as null so that
164 |                                         // all possible outputs from schema are accounted for,
165 |                                         // even for non-selected schemas
166 |                                         output_dict[key + "_" + subkey] = null;
167 |                                 } else {
168 |                                         var sbk = Object.keys(items[i][j])[0]; // nested record: pre-fill its items with null as well
169 |                                         for(var k=0;k<items[i][j][sbk].length; k++){
170 |                                                 var sublis = items[i][j][sbk][k];
171 |                                                 for(var m=0;m<sublis.length;m++){
172 |                                                         var cleaned = sublis[m].replace("?","");
173 |                                                         output_dict[key + "_" + sbk + "_" + cleaned] = null;
174 |                                                 }
175 |                                         }
176 |                                 }
177 |                         }
178 |                         var new_coverage = tally / items[i].length; // nested objects count toward length but never toward tally
179 |                         if(new_coverage > coverage){ // strict ">": ties keep the earliest sub-list
180 |                                 coverage = new_coverage;
181 |                                 subind = i;
182 |                         }
183 |                 }
184 |                 enforce_record(data, key, items[subind], output_dict); // NOTE(review): this branch does not return output_dict; the callers in this expression ignore the return value
185 |            } else {
186 |                    for(var i=0;i<items.length;i++){
187 |                         if(items[i].constructor == Object){
188 |                                 // Record within a record, make recursive call
189 |                                 var subkey = Object.keys(items[i])[0];
190 |                                 enforce_record(data[subkey], key+"_"+subkey, items[i][subkey], output_dict);
191 |                         } else {
192 |                                 // If not present, throw an error unless marked with "?"
193 |                                 var item_comp = items[i].replace("?","");
194 |                                 if(!(item_comp in data)){
195 |                                         if(!items[i].includes("?")){
196 |                                                 throw 'If '+key+' is defined, then all of '+items+' must be defined.';
197 |                                         }
198 |                                 } else {
199 |                                 // Add val to output dict
200 |                                         output_dict[key + '_' + item_comp] = data[item_comp];
201 |                                 }
202 |                         }
203 |                    }
204 |                    return output_dict;
205 |            }
206 |        }
207 | 
208 |        var values_dict = {}; // flat map of output name -> value returned by this tool
209 |        for(var i=0;i<schema.length;i++){
210 |            if(schema[i].constructor == Object){
211 |                 var key = Object.keys(schema[i])[0];
212 |                 var lis = schema[i][key];
213 |                 enforce_record(data[key], key, lis, values_dict); // NOTE(review): data[key] is undefined when the record is absent from the JSON, and the `in` checks inside enforce_record would then throw a TypeError - confirm records are always present
214 |            } else {
215 |                 var sch = schema[i].replace("?",""); // plain item: copy its value, or null when absent
216 |                 if(sch in data){
217 |                      values_dict[sch] = data[sch];
218 |                 } else {
219 |                      values_dict[sch] = null;
220 |                 }
221 |            }
222 |        }
223 |        return values_dict;
224 |   }
225 | 


--------------------------------------------------------------------------------
/steps/processing.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 |    - class: ScatterFeatureRequirement
 12 | 
 13 | inputs:
 14 |   input_dir:
 15 |     type: Directory
 16 |     doc: Root directory containing space_tx formatted experiment
 17 | 
 18 |   dir_size:
 19 |     type: long?
 20 |     doc: The size of input_dir in MiB. If provided, will be used to specify storage space requests.
 21 | 
 22 |   parameter_json:
 23 |     type: File?
 24 |     doc: json containing step parameters.
 25 | 
 26 |   selected_fovs:
 27 |     type: int[]?
 28 |     doc: If provided, processing will only be run on FOVs with these indices.
 29 | 
 30 |   fov_count:
 31 |     type: int?
 32 |     doc: The number of FOVs that are included in this experiment
 33 | 
 34 |   clip_min:
 35 |     type: float?
 36 |     doc: Pixels below this percentile are set to 0.
 37 | 
 38 |   clip_max:
 39 |     type: float?
 40 |     doc: Pixels above this percentile are set to 1.
 41 | 
 42 |   level_method:
 43 |     type: string?
 44 |     doc: Levelling method for clip and scale application. Defaults to SCALE_BY_CHUNK. If rescaling is configured in parameter_json, will be set to SCALE_BY_CHUNK if true, SCALE_BY_IMAGE if false.
 45 | 
 46 |   is_volume:
 47 |     type: boolean?
 48 |     doc: Whether to treat the zplanes as a 3D image.
 49 | 
 50 |   register_aux_view:
 51 |     type: string?
 52 |     doc: The name of the auxiliary view to be used for image registration.
 53 | 
 54 |   register_to_primary:
 55 |     type: boolean?
 56 |     doc: If true, registration will be performed between the first round of register_aux_view and the primary images.
 57 | 
 58 |   channels_per_reg:
 59 |     type: int?
 60 |     doc: The number of images associated with each channel in the registration image.  Will be calculated from aux view if provided through parameter_json, otherwise defaults to one.
 61 | 
 62 |   background_view:
 63 |     type: string?
 64 |     doc: The name of the auxiliary view to be used for background subtraction.  Background will be estimated if not provided.
 65 | 
 66 |   register_background:
 67 |     type: boolean?
 68 |     doc: If true, the `background_view` will be aligned to the `aux_view`.
 69 | 
 70 |   anchor_view:
 71 |     type: string?
 72 |     doc: The name of the auxiliary view to be processed in parallel with primary view, such as for anchor round in ISS processing. Will not be included if not provided.
 73 | 
 74 |   high_sigma:
 75 |     type: int?
 76 |     doc: Sigma value for high pass gaussian filter. Will not be run if not provided.
 77 | 
 78 |   deconvolve_iter:
 79 |     type: int?
 80 |     doc: Number of iterations to perform for deconvolution. High values remove more noise while lower values remove less. The value 15 will work for most datasets unless image is very noisy. Will not be run if not provided.
 81 | 
 82 |   deconvolve_sigma:
 83 |     type: int?
 84 |     doc: Sigma value for deconvolution. Should be approximately the expected spot size.
 85 | 
 86 |   low_sigma:
 87 |     type: int?
 88 |     doc: Sigma value for low pass gaussian filter. Will not be run if not provided.
 89 | 
 90 |   rolling_radius:
 91 |     type: int?
 92 |     doc: Radius for rolling ball background subtraction. Larger values lead to increased intensity evening effect. The value of 3 will work for most datasets. Will not be run if not provided.
 93 | 
 94 |   match_histogram:
 95 |     type: boolean?
 96 |     doc: If true, histograms will be equalized.
 97 | 
 98 |   tophat_radius:
 99 |     type: int?
100 |     doc: Radius for white top hat filter. Should be slightly larger than the expected spot radius. Will not be run if not provided.
101 | 
102 |   rescale:
103 |     type: boolean?
104 |     doc: Whether to iteratively rescale images before running the decoder. If true, will skip clip and scale at the end of this step.
105 | 
106 |   n_processes:
107 |     type: int?
108 |     doc: If provided, the number of processes that will be spawned for processing. Otherwise, the maximum number of available CPUs will be used.
109 | 
110 | outputs:
111 |   processed_exp:
112 |     type: Directory
113 |     outputSource: execute_processing/processed_exp
114 | 
115 | steps:
116 | 
117 |   read_schema:  # Runs `cat /opt/processing.json` and exposes the captured stdout as `data`.
118 |     run:
119 |       class: CommandLineTool
120 |       baseCommand: cat
121 | 
122 |       requirements:
123 |         DockerRequirement:
124 |           dockerPull: hubmap/starfish-custom:latest
125 |         ResourceRequirement:
126 |           ramMin: 1000
127 |           tmpdirMin: 1000
128 |           outdirMin: 1000
129 | 
130 |       inputs:
131 |         schema:  # A path string passed as the argument to cat, not a File object.
132 |           type: string
133 |           inputBinding:
134 |             position: 1
135 | 
136 |       outputs:
137 |         data:
138 |           type: stdout
139 | 
140 |     in:
141 |       schema:
142 |         valueFrom: "/opt/processing.json"
143 |     out: [data]
144 | 
145 |   stage_processing:  # Runs inputParser.cwl on parameter_json with the schema from read_schema; skipped by `when` if parameter_json is absent.
146 |     run: inputParser.cwl
147 |     in:
148 |       datafile: parameter_json
149 |       schema: read_schema/data
150 |     out: [fov_count, selected_fovs, clip_min, clip_max, level_method, rescale, register_aux_view, register_to_primary, channels_per_reg, background_view, register_background, anchor_view, high_sigma, deconvolve_iter, deconvolve_sigma, low_sigma, rolling_radius, match_histogram, tophat_radius, channel_count, aux_tilesets_aux_names, aux_tilesets_aux_channel_count, is_volume, n_processes]
151 |     when: $(inputs.datafile != null)
152 | 
153 |   tmpname:  # Runs tmpdir.cwl with no inputs; its `tmp` output is used as tmp_prefix by execute_processing.
154 |     run: tmpdir.cwl
155 |     in: []
156 |     out: [tmp]
157 | 
158 |   execute_processing:
159 |     run:
160 |       class: CommandLineTool
161 |       baseCommand: /opt/imgProcessing.py
162 | 
163 |       requirements:
164 |         InitialWorkDirRequirement:
165 |           listing:
166 |             - entryname: "$('input_dir_'+inputs.tmp_prefix)"
167 |               writable: true
168 |               entry: "$(inputs.input_files)"
169 |         DockerRequirement:
170 |           dockerPull: hubmap/starfish-custom:latest
171 |         ResourceRequirement:
172 |           tmpdirMin: |
173 |             ${
174 |               if(inputs.dir_size === null) {
175 |                 return null;
176 |               } else {
177 |                 return inputs.dir_size;
178 |               }
179 |             }
180 |           outdirMin: |
181 |             ${
182 |               return 1000;
183 |             }
184 |           coresMin: |
185 |             ${
186 |               if(inputs.n_processes === null) {
187 |                 return null;
188 |               } else {
189 |                 return inputs.n_processes;
190 |               }
191 |             }
192 |           ramMin: |
193 |             ${
194 |               if(inputs.n_processes === null) {
195 |                 return null;
196 |               } else {
197 |                 return Math.max(inputs.n_processes * 20 * 24, inputs.dir_size / 75);
198 |               }
199 |             }
200 | 
201 |       inputs:
202 |         dir_size:
203 |           type: long?
204 | 
205 |         tmp_prefix:
206 |           type: string
207 |           inputBinding:
208 |             prefix: --tmp-prefix
209 | 
210 |         input_files:
211 |           type: Directory
212 |           doc: Raw input folder, possibly with ugly docker string.
213 | 
214 |         input_dir:
215 |           type: string
216 |           inputBinding:
217 |             prefix: --input-dir
218 |           doc: Root directory containing space_tx formatted experiment
219 | 
220 |         selected_fovs:
221 |           type: int[]?
222 |           inputBinding:
223 |             prefix: --selected-fovs
224 |           doc: If provided, processing will only be run on FOVs with these indices.
225 | 
226 |         clip_min:
227 |           type: float?
228 |           inputBinding:
229 |             prefix: --clip-min
230 |           doc: Pixels below this percentile are set to 0. Defaults to 95.
231 | 
232 |         clip_max:
233 |           type: float?
234 |           inputBinding:
235 |             prefix: --clip-max
236 |           doc: Pixels above this percentile are set to 1. Defaults to 99.9.
237 | 
238 |         level_method:
239 |           type: string?
240 |           inputBinding:
241 |             prefix: --level-method
242 |           doc: Levelling method for clip and scale application. Defaults to SCALE_BY_CHUNK.
243 | 
244 |         is_volume:
245 |           type: boolean?
246 |           inputBinding:
247 |             prefix: --is-volume
248 |           doc: Whether to treat the zplanes as a 3D image.
249 | 
250 |         rescale:
251 |           type: boolean?
252 |           inputBinding:
253 |             prefix: --rescale
254 | 
255 |         register_aux_view:
256 |           type: string?
257 |           inputBinding:
258 |             prefix: --register-aux-view
259 |           doc: The name of the auxiliary view to be used for image registration. Registration will not be performed if not provided.
260 | 
261 |         register_to_primary:
262 |           type: boolean?
263 |           inputBinding:
264 |             prefix: --register-to-primary
265 | 
266 |         channels_per_reg:
267 |           type: int?
268 |           inputBinding:
269 |             prefix: --ch-per-reg
270 |           doc: The number of images associated with each channel of the registration image.  Defaults to 1.
271 | 
272 |         background_view:
273 |           type: string?
274 |           inputBinding:
275 |             prefix: --background-view
276 |           doc: The name of the auxiliary view to be used for background subtraction.  Background will be estimated if not provided.
277 | 
278 |         register_background:
279 |           type: boolean?
280 |           inputBinding:
281 |             prefix: --register-background
282 |           doc: If true, the `background_view` will be aligned to the `aux_name`.
283 | 
284 |         anchor_view:
285 |           type: string?
286 |           inputBinding:
287 |             prefix: --anchor-view
288 |           doc: The name of the auxiliary view to be processed in parallel with primary view, such as for anchor round in ISS processing. Will not be included if not provided.
289 | 
290 |         high_sigma:
291 |           type: int?
292 |           inputBinding:
293 |             prefix: --high-sigma
294 |           doc: Sigma value for high pass gaussian filter. Will not be run if not provided.
295 | 
296 |         deconvolve_iter:
297 |           type: int?
298 |           inputBinding:
299 |             prefix: --decon-iter
300 |           doc: Number of iterations to perform for deconvolution. High values remove more noise while lower values remove less. The value 15 will work for most datasets unless image is very noisy. Will not be run if not provided.
301 | 
302 |         deconvolve_sigma:
303 |           type: int?
304 |           inputBinding:
305 |             prefix: --decon-sigma
306 |           doc: Sigma value for deconvolution. Should be approximately the expected spot size.
307 | 
308 |         low_sigma:
309 |           type: int?
310 |           inputBinding:
311 |             prefix: --low-sigma
312 |           doc: Sigma value for low pass gaussian filter. Will not be run if not provided.
313 | 
314 |         rolling_radius:
315 |           type: int?
316 |           inputBinding:
317 |             prefix: --rolling-radius
318 |           doc: Radius for rolling ball background subtraction. Larger values lead to increased intensity evening effect. The value of 3 will work for most datasets. Will not be run if not provided.
319 | 
320 |         match_histogram:
321 |           type: boolean?
322 |           inputBinding:
323 |             prefix: --match-histogram
324 |           doc: If true, histograms will be equalized.
325 | 
326 |         tophat_radius:
327 |           type: int?
328 |           inputBinding:
329 |             prefix: --tophat-radius
330 |           doc: Radius for white top hat filter. Should be slightly larger than the expected spot radius. Will not be run if not provided.
331 | 
332 |         n_processes:
333 |           type: int?
334 |           inputBinding:
335 |             prefix: --n-processes
336 |           doc: If provided, the number of processes that will be spawned for processing. Otherwise, the maximum number of available CPUs will be used.
337 | 
338 |       outputs:
339 |         processed_exp:
340 |           type: Directory
341 |           outputBinding:
342 |             glob: $("tmp/" + inputs.tmp_prefix + "/3_processed/")
343 |     in:
344 |       dir_size: dir_size
345 |       tmp_prefix: tmpname/tmp
346 |       input_files: input_dir
347 |       input_dir:
348 |         valueFrom: $("input_dir_" + inputs.tmp_prefix)
349 |       selected_fovs: selected_fovs
350 |       clip_min:
351 |         source: [stage_processing/clip_min, clip_min]
352 |         valueFrom: |
353 |           ${
354 |             if(!(self[0] === null)){
355 |               return self[0];
356 |             } else if(!(self[1] === null)) {
357 |               return self[1];
358 |             } else {
359 |               return null;
360 |             }
361 |           }
362 |       clip_max:
363 |         source: [stage_processing/clip_max, clip_max]
364 |         valueFrom: |
365 |           ${
366 |             if(!(self[0] === null)){
367 |               return self[0];
368 |             } else if(!(self[1] === null)) {
369 |               return self[1];
370 |             } else {
371 |               return null;
372 |             }
373 |           }
374 |       level_method:
375 |         source: [stage_processing/level_method, level_method]
376 |         valueFrom: |
377 |           ${
378 |             if(self[0]){
379 |               return self[0];
380 |             } else if(self[1]) {
381 |               return self[1];
382 |             } else {
383 |               return null;
384 |             }
385 |           }
386 |       is_volume:
387 |         source: [stage_processing/is_volume, is_volume]
388 |         valueFrom: |
389 |           ${
390 |             if(self[0]){
391 |               return self[0];
392 |             } else if(self[1]) {
393 |               return self[1];
394 |             } else {
395 |               return null;
396 |             }
397 |           }
398 |       rescale:
399 |         source: [stage_processing/rescale, rescale]
400 |         valueFrom: |
401 |           ${
402 |             // Resolve rescale: the stage_processing output is used when
403 |             // truthy, else the workflow-level input, else null.
404 |             // Falsy values (false, 0, "") are treated as unset.
405 |             var staged = self[0];
406 |             var direct = self[1];
407 |             var chosen = staged || direct;
408 |             return chosen ? chosen : null;
409 |           }
410 |       register_aux_view:
411 |         source: [stage_processing/register_aux_view, register_aux_view]
412 |         valueFrom: |
413 |           ${
414 |             // Resolve register_aux_view: prefer the stage_processing
415 |             // output, fall back to the workflow-level input, and give
416 |             // null when both are falsy.
417 |             var staged = self[0];
418 |             if (staged) { return staged; }
419 |             var direct = self[1];
420 |             return direct ? direct : null;
421 |           }
422 |       register_to_primary:
423 |         source: [stage_processing/register_to_primary, register_to_primary]
424 |         valueFrom: |
425 |           ${
426 |             // Resolve register_to_primary: the stage_processing output
427 |             // is used when truthy, else the workflow-level input, else
428 |             // null. Falsy values (false, 0, "") are treated as unset.
429 |             var staged = self[0];
430 |             var direct = self[1];
431 |             var chosen = staged || direct;
432 |             return chosen ? chosen : null;
433 |           }
434 |       channels_per_reg:
435 |         source: [stage_processing/channels_per_reg, channels_per_reg, stage_processing/channel_count, stage_processing/register_aux_view, register_aux_view, stage_processing/aux_tilesets_aux_names, stage_processing/aux_tilesets_aux_channel_count]
436 |         valueFrom: |
437 |           ${
438 |             // self = [staged channels_per_reg, input channels_per_reg, staged channel_count,
439 |             //         staged register_aux_view, input register_aux_view,
440 |             //         staged aux names, staged aux channel counts]
441 |             if (self[1]) {
442 |               return self[1];
443 |             }
444 |             if (self[2] && self[5] && self[6]) {
445 |               // Ratio of the staged channel count to the channel count of the registration view.
446 |               var name = self[3] ? self[3] : self[4];
447 |               var aux_count = self[6][self[5].indexOf(name)];
448 |               // An unknown view name (indexOf -> -1) or a zero count would give
449 |               // NaN/Infinity, so only divide when the count is a positive number.
450 |               if (aux_count > 0) {
451 |                 return Math.round(self[2] / aux_count);
452 |               }
453 |             }
454 |             return self[0] ? self[0] : null;
455 |           }
456 |       background_view:
457 |         source: [stage_processing/background_view, background_view]
458 |         valueFrom: |
459 |           ${
460 |             // Resolve background_view: prefer the stage_processing
461 |             // output, fall back to the workflow-level input, and give
462 |             // null when both are falsy.
463 |             var staged = self[0];
464 |             if (staged) { return staged; }
465 |             var direct = self[1];
466 |             return direct ? direct : null;
467 |           }
468 |       register_background:
469 |         source: [stage_processing/register_background, register_background]
470 |         valueFrom: |
471 |           ${
472 |             // Resolve register_background: the stage_processing output
473 |             // is used when truthy, else the workflow-level input, else
474 |             // null. Falsy values (false, 0, "") are treated as unset.
475 |             var staged = self[0];
476 |             var direct = self[1];
477 |             var chosen = staged || direct;
478 |             return chosen ? chosen : null;
479 |           }
480 |       anchor_view:
481 |         source: [stage_processing/anchor_view, anchor_view]
482 |         valueFrom: |
483 |           ${
484 |             // Resolve anchor_view: prefer the stage_processing output,
485 |             // fall back to the workflow-level input, and give null
486 |             // when both are falsy.
487 |             var staged = self[0];
488 |             if (staged) { return staged; }
489 |             var direct = self[1];
490 |             return direct ? direct : null;
491 |           }
492 |       high_sigma:
493 |         source: [stage_processing/high_sigma, high_sigma]
494 |         valueFrom: |
495 |           ${
496 |             // Resolve high_sigma: the stage_processing output is used
497 |             // when truthy, else the workflow-level input, else null.
498 |             // A value of 0 is falsy and therefore treated as unset.
499 |             var staged = self[0];
500 |             var direct = self[1];
501 |             var chosen = staged || direct;
502 |             return chosen ? chosen : null;
503 |           }
504 |       deconvolve_iter:
505 |         source: [stage_processing/deconvolve_iter, deconvolve_iter]
506 |         valueFrom: |
507 |           ${
508 |             // Resolve deconvolve_iter: prefer the stage_processing
509 |             // output, fall back to the workflow-level input, and give
510 |             // null when both are falsy (0 counts as unset).
511 |             var staged = self[0];
512 |             if (staged) { return staged; }
513 |             var direct = self[1];
514 |             return direct ? direct : null;
515 |           }
516 |       deconvolve_sigma:
517 |         source: [stage_processing/deconvolve_sigma, deconvolve_sigma]
518 |         valueFrom: |
519 |           ${
520 |             // Resolve deconvolve_sigma: the stage_processing output is
521 |             // used when truthy, else the workflow-level input, else
522 |             // null. A value of 0 is falsy and treated as unset.
523 |             var staged = self[0];
524 |             var direct = self[1];
525 |             var chosen = staged || direct;
526 |             return chosen ? chosen : null;
527 |           }
528 |       low_sigma:
529 |         source: [stage_processing/low_sigma, low_sigma]
530 |         valueFrom: |
531 |           ${
532 |             // Resolve low_sigma: prefer the stage_processing output,
533 |             // fall back to the workflow-level input, and give null
534 |             // when both are falsy (0 counts as unset).
535 |             var staged = self[0];
536 |             if (staged) { return staged; }
537 |             var direct = self[1];
538 |             return direct ? direct : null;
539 |           }
540 |       rolling_radius:
541 |         source: [stage_processing/rolling_radius, rolling_radius]
542 |         valueFrom: |
543 |           ${
544 |             // Resolve rolling_radius: the stage_processing output is
545 |             // used when truthy, else the workflow-level input, else
546 |             // null. A value of 0 is falsy and treated as unset.
547 |             var staged = self[0];
548 |             var direct = self[1];
549 |             var chosen = staged || direct;
550 |             return chosen ? chosen : null;
551 |           }
552 |       match_histogram:
553 |         source: [stage_processing/match_histogram, match_histogram]
554 |         valueFrom: |
555 |           ${
556 |             // Resolve match_histogram: prefer the stage_processing
557 |             // output, fall back to the workflow-level input, and give
558 |             // null when both are falsy (an explicit false is unset).
559 |             var staged = self[0];
560 |             if (staged) { return staged; }
561 |             var direct = self[1];
562 |             return direct ? direct : null;
563 |           }
564 |       tophat_radius:
565 |         source: [stage_processing/tophat_radius, tophat_radius]
566 |         valueFrom: |
567 |           ${
568 |             // Resolve tophat_radius: the stage_processing output is
569 |             // used when truthy, else the workflow-level input, else
570 |             // null. A value of 0 is falsy and treated as unset.
571 |             var staged = self[0];
572 |             var direct = self[1];
573 |             var chosen = staged || direct;
574 |             return chosen ? chosen : null;
575 |           }
576 |       n_processes:
577 |         source: [stage_processing/n_processes, n_processes]
578 |         valueFrom: |
579 |           ${
580 |             // Resolve n_processes: prefer the stage_processing output,
581 |             // fall back to the workflow-level input, and give null
582 |             // when both are falsy (0 counts as unset).
583 |             var staged = self[0];
584 |             if (staged) { return staged; }
585 |             var direct = self[1];
586 |             return direct ? direct : null;
587 |           }
588 |     out: [processed_exp]
589 | 


--------------------------------------------------------------------------------
/steps/psortedDefaultParams.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 | 
 12 | inputs:
 13 |   exp_dir:  # its shallow listing is searched for pround_codebook.json by execute_defaults
 14 |     type: Directory
 15 |     doc: Converted experiment with converted codebook from prior step.
 16 |   parameter_json:  # when null, the stage_defaults step is skipped by its `when` guard
 17 |     type: File?
 18 |     doc: Json containing information for the dataset
 19 |   aux_names:  # fallback: stage_defaults/aux_tilesets_aux_names is preferred when truthy
 20 |     type: string[]?
 21 |     doc: list of the aux view names.  Assumed none if blank.
 22 |   channel_count:  # fallback behind stage_defaults/channel_count (pickValue first_non_null)
 23 |     type: int?
 24 |     doc: the number of channel expected for this experiment.
 25 |   cache_read_order:  # fallback behind stage_defaults/cache_read_order (pickValue first_non_null)
 26 |     type: string[]?
 27 |     doc: Cache read order for files. Will strip any CH dimensions.
 28 |   aux_cache_read_order:  # one ";"-separated order string per aux view (split on ";" downstream)
 29 |     type: string[]?
 30 |     doc: Cache read order for aux views.  Will strip any CH dimensions.
 31 | 
 32 | outputs:  # the *_count outputs come from stage_defaults; all others from execute_defaults
 33 |   codebook:  # the pround_codebook.json entry found in exp_dir
 34 |     type: File
 35 |     outputSource: execute_defaults/codebook
 36 |   round_count:  # NOTE(review): typed int, but stage_defaults is conditional (`when`) - confirm it cannot be null here
 37 |     type: int
 38 |     outputSource: stage_defaults/round_count
 39 |   fov_count:
 40 |     type: int
 41 |     outputSource: stage_defaults/fov_count
 42 |   channel_count:
 43 |     type: int
 44 |     outputSource: stage_defaults/channel_count
 45 |   zplane_count:
 46 |     type: int
 47 |     outputSource: stage_defaults/zplane_count
 48 |   round_offset:  # the four *_offset outputs are the constant 0 in execute_defaults
 49 |     type: int
 50 |     outputSource: execute_defaults/round_offset
 51 |   fov_offset:
 52 |     type: int
 53 |     outputSource: execute_defaults/fov_offset
 54 |   channel_offset:
 55 |     type: int
 56 |     outputSource: execute_defaults/channel_offset
 57 |   zplane_offset:
 58 |     type: int
 59 |     outputSource: execute_defaults/zplane_offset
 60 |   file_format:  # constant "PseudoCycle{}/MMStack_Pos{}_ch{}.ome.tif"
 61 |     type: string
 62 |     outputSource: execute_defaults/file_format
 63 |   file_vars:  # constant ["round", "fov", "channel"]
 64 |     type: string[]
 65 |     outputSource: execute_defaults/file_vars
 66 |   cache_read_order:  # the resolved read order with any "CH" entry removed
 67 |     type: string[]
 68 |     outputSource: execute_defaults/cache_read_order
 69 |   aux_names:  # the aux_* arrays below hold one element per aux view, in aux_names order
 70 |     type: string[]
 71 |     outputSource: execute_defaults/aux_names
 72 |   aux_file_formats:
 73 |     type: string[]
 74 |     outputSource: execute_defaults/aux_file_formats
 75 |   aux_file_vars:  # each element is the string "round;fov;channel"
 76 |     type: string[]
 77 |     outputSource: execute_defaults/aux_file_vars
 78 |   aux_cache_read_order:  # each element is a ";"-joined order with "CH" removed
 79 |     type: string[]
 80 |     outputSource: execute_defaults/aux_cache_read_order
 81 |   aux_channel_count:  # every element repeats the resolved channel_count
 82 |     type: int[]
 83 |     outputSource: execute_defaults/aux_channel_count
 84 |   aux_channel_slope:  # NOTE(review): declared string[], but execute_defaults pushes the number 1
 85 |     type: string[]
 86 |     outputSource: execute_defaults/aux_channel_slope
 87 |   aux_channel_intercept:  # NOTE(review): declared string[], but execute_defaults pushes the number 0
 88 |     type: string[]
 89 |     outputSource: execute_defaults/aux_channel_intercept
 90 | 
 91 | steps:
 92 |   read_schema:
 93 |     run:
 94 |       class: CommandLineTool
 95 |       baseCommand: [cat]
 96 |       # Prints the file named by `schema` inside the container; stdout becomes `data`.
 97 |       requirements:
 98 |         - class: DockerRequirement
 99 |           dockerPull: hubmap/starfish-custom:latest
100 |         - class: ResourceRequirement
101 |           ramMin: 1000
102 |           tmpdirMin: 1000
103 |           outdirMin: 1000
104 |       # Single positional argument: the path handed to cat.
105 |       inputs:
106 |         schema:
107 |           type: string
108 |           inputBinding: {position: 1}
109 | 
110 |       # Captured standard output of the command.
111 |       outputs:
112 |         data:
113 |           type: stdout
114 | 
115 |     in:
116 |       schema: {valueFrom: "/opt/psortedDefaultParams.json"}
117 | 
118 |     out: [data]
119 | 
120 |   stage_defaults:  # runs inputParser.cwl on parameter_json; skipped (outputs null) when no json is given
121 |     run: inputParser.cwl
122 |     in:
123 |       datafile: parameter_json
124 |       schema: read_schema/data  # stdout of the read_schema step
125 |     out: [round_count, fov_count, channel_count, zplane_count, aux_tilesets_aux_names, cache_read_order, aux_tilesets_aux_cache_read_order, aux_tilesets_aux_channel_count]
126 |     when: $(inputs.datafile != null)
127 | 
128 |   execute_defaults:
129 |     run:
130 |       cwlVersion: v1.2
131 |       class: ExpressionTool
132 |       # Builds the fixed pseudosort file-layout parameters plus one entry per aux view.
133 |       requirements:
134 |         InlineJavascriptRequirement: {}
135 |         LoadListingRequirement:
136 |           loadListing: shallow_listing
137 |         InitialWorkDirRequirement:
138 |           listing:
139 |             - $(inputs.exp_dir)
140 |         ResourceRequirement:
141 |           ramMin: 1000
142 |           tmpdirMin: 1000
143 |           outdirMin: 1000
144 | 
145 |       expression: |
146 |         ${
147 |           // Optional inputs are null when neither parameter_json nor the
148 |           // workflow input supplied them; treat that as "no aux views".
149 |           var names = inputs.aux_names || [];
150 |           var orders = inputs.aux_cache_read_order || [];
151 | 
152 |           // Return a copy of a read-order list without its "CH" entry, if any.
153 |           function withoutChannel(order){
154 |             var kept = order.slice();
155 |             var at = kept.indexOf("CH");
156 |             if(at > -1){
157 |               kept.splice(at, 1);
158 |             }
159 |             return kept;
160 |           }
161 | 
162 |           // Pick pround_codebook.json out of the shallow listing of exp_dir;
163 |           // the placeholder "BLANK" is kept when no such file exists.
164 |           var cb = "BLANK";
165 |           for(var i=0; i<inputs.exp_dir.listing.length; i++){
166 |             if(inputs.exp_dir.listing[i].basename=="pround_codebook.json"){
167 |               cb = inputs.exp_dir.listing[i];
168 |             }
169 |           }
170 | 
171 |           var aux_names = [];
172 |           var aux_file_formats = [];
173 |           var aux_file_vars = [];
174 |           var aux_cache_read_order = [];
175 |           var aux_channel_count = [];
176 |           var aux_channel_slope = [];
177 |           var aux_channel_intercept = [];
178 |           for(var j=0; j<names.length; j++){
179 |             // Read orders are ";"-joined; a missing entry becomes an empty order.
180 |             var order = (orders[j] || "").split(";");
181 |             aux_names.push(names[j]);
182 |             aux_file_formats.push("PseudoCycle{}/MMStack_Pos{}_"+names[j]+"ch{}.ome.tif");
183 |             aux_file_vars.push("round;fov;channel");
184 |             aux_cache_read_order.push(withoutChannel(order).join(";"));
185 |             aux_channel_count.push(inputs.channel_count);
186 |             aux_channel_slope.push(1);
187 |             aux_channel_intercept.push(0);
188 |           }
189 |           return {"codebook":              cb,
190 |                   "round_offset": 0, "fov_offset": 0,
191 |                   "channel_offset": 0, "zplane_offset": 0,
192 |                   "file_format":           "PseudoCycle{}/MMStack_Pos{}_ch{}.ome.tif",
193 |                   "file_vars":             ["round", "fov", "channel"],
194 |                   "cache_read_order":      withoutChannel(inputs.cache_read_order),
195 |                   "aux_names": aux_names, "aux_file_formats": aux_file_formats,
196 |                   "aux_file_vars": aux_file_vars, "aux_cache_read_order": aux_cache_read_order,
197 |                   "aux_channel_slope": aux_channel_slope, "aux_channel_intercept": aux_channel_intercept, "aux_channel_count": aux_channel_count};
198 |         }
199 | 
200 |       inputs:
201 |         exp_dir:
202 |           type: Directory
203 |         aux_names:
204 |           type: string[]?
205 |         cache_read_order:
206 |           type: string[]
207 |         aux_cache_read_order:
208 |           type: string[]?
209 |         channel_count:
210 |           type: int?
211 | 
212 |       outputs:
213 |         codebook:
214 |           type: File
215 |         round_offset:
216 |           type: int
217 |         fov_offset:
218 |           type: int
219 |         channel_offset:
220 |           type: int
221 |         zplane_offset:
222 |           type: int
223 |         file_format:
224 |           type: string
225 |         file_vars:
226 |           type: string[]
227 |         cache_read_order:
228 |           type: string[]
229 |         aux_names:
230 |           type: string[]
231 |         aux_file_formats:
232 |           type: string[]
233 |         aux_file_vars:
234 |           type: string[]
235 |         aux_cache_read_order:
236 |           type: string[]
237 |         aux_channel_slope:
238 |           type: string[]
239 |         aux_channel_intercept:
240 |           type: string[]
241 |         aux_channel_count:
242 |           type: int[]
243 |     in:
244 |       exp_dir: exp_dir
245 |       aux_names:
246 |         source: [stage_defaults/aux_tilesets_aux_names, aux_names]
247 |         valueFrom: |
248 |           ${
249 |             // The names reported by stage_defaults win when truthy,
250 |             // then the workflow-level aux_names input; null when
251 |             // neither is set (the tool then emits empty aux arrays).
252 |             var staged = self[0];
253 |             if (staged) { return staged; }
254 |             var direct = self[1];
255 |             return direct ? direct : null;
256 |           }
257 |       cache_read_order:
258 |         source: [stage_defaults/cache_read_order, cache_read_order]
259 |         pickValue: first_non_null
260 |       channel_count:
261 |         source: [stage_defaults/channel_count, channel_count]
262 |         pickValue: first_non_null
263 |       aux_cache_read_order:
264 |         source: [stage_defaults/aux_tilesets_aux_cache_read_order, aux_cache_read_order]
265 |         valueFrom: |
266 |           ${
267 |             // Same precedence as aux_names: the stage_defaults output
268 |             // when truthy, then the workflow-level input, else null.
269 |             var staged = self[0];
270 |             var direct = self[1];
271 |             var chosen = staged || direct;
272 |             return chosen ? chosen : null;
273 |             // (end of aux_cache_read_order resolution)
274 |           }
275 | 
276 |     out: [codebook, round_offset, fov_offset, channel_offset, zplane_offset, file_format, file_vars, cache_read_order, aux_names, aux_file_formats, aux_file_vars, aux_cache_read_order, aux_channel_slope, aux_channel_intercept, aux_channel_count]
277 | 


--------------------------------------------------------------------------------
/steps/qc.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 | 
 12 | inputs:
 13 |   # Flattened form of codebook.exp; codebook_grabber checks it before the record.
 14 |   codebook_exp:
 15 |     type: Directory?
 16 |     doc: Flattened codebook input, refer to record entry.
 17 |   # Flattened form of codebook.pkl; execute_qc uses it only as the last fallback.
 18 |   codebook_pkl:
 19 |     type: File?
 20 |     doc: Flattened codebook input, refer to record entry.
 21 |   # Flattened form of imagesize.locs.
 22 |   locs_json:
 23 |     type: File?
 24 |     doc: Flattened json input, refer to record entry.
 25 |   # Record form: either a pickled codebook (pkl) or an experiment directory (exp).
 26 |   codebook:
 27 |     type:
 28 |       - 'null'
 29 |       - type: record
 30 |         name: pkl
 31 |         fields:
 32 |           pkl:
 33 |             type: File
 34 |             doc: A codebook for this experiment, saved in a python pickle.
 35 |       - type: record
 36 |         name: exp
 37 |         fields:
 38 |           exp:
 39 |             type: Directory
 40 |             doc: The location of an experiment.json file, which has the corresponding codebook for this experiment.
 41 |   segmentation_loc:
 42 |     type: Directory?
 43 |     doc: The location of the output from the segmentation step, if it was performed.
 44 |   # Flattened forms of the fields of the data record declared further down.
 45 |   data_pkl_spots:
 46 |     type: File?
 47 |     doc: Flattened data input, refer to record entry.
 48 | 
 49 |   data_pkl_transcripts:
 50 |     type: File?
 51 |     doc: Flattened data input, refer to record entry.
 52 | 
 53 |   data_exp:
 54 |     type: Directory?
 55 |     doc: Flattened data input, refer to record entry.
 56 |   # Record form: pickles (spots optional, transcripts required) or an experiment directory.
 57 |   data:
 58 |     type:
 59 |     - 'null'
 60 |     - type: record
 61 |       name: pkl
 62 |       fields:
 63 |         spots:
 64 |           type: File?
 65 |           doc: Spots found in this experiment, saved in a python pickle.
 66 |         transcripts:
 67 |           type: File
 68 |           doc: The output DecodedIntensityTable, saved in a python pickle.
 69 |     - type: record
 70 |       name: exp
 71 |       fields:
 72 |         exp:
 73 |           type: Directory
 74 |           doc: The location of output of starfish runner step, 4_Decoded. Contains spots (if applicable) and netcdfs containing the DecodedIntensityTable.
 75 |   # Fallback only: stage_qc/selected_fovs is preferred when truthy.
 76 |   selected_fovs:
 77 |     type: int[]?
 78 |     doc: If provided, QC will only be run on FOVs with these indices.
 79 |   # OR-ed in execute_qc with whether stage_qc reports a non-empty decode method.
 80 |   has_spots:
 81 |     type: boolean?
 82 |     doc: If true, will look for spots within the experiment field.
 83 |   # Passed straight through to execute_qc.
 84 |   roi:
 85 |     type: File?
 86 |     doc: The location of the RoiSet.zip, if applicable.
 87 |   # When absent, the stage_qc step is skipped by its `when` guard.
 88 |   parameter_json:
 89 |     type: File?
 90 |     doc: The json with parameters to be read in for the following variables.
 91 |   # A truthy x shape from stage_qc takes precedence over this input in execute_qc.
 92 |   imagesize:
 93 |     type:
 94 |       - 'null'
 95 |       - type: record
 96 |         name: locs
 97 |         fields:
 98 |           locs:
 99 |             type: File?
100 |             doc: Input locations as a json file, using the same records as below.
101 |       - type: record
102 |         name: fov_positioning
103 |         fields:
104 |           - name: x_size
105 |             type: int
106 |             doc: x-dimension of image
107 |           - name: y_size
108 |             type: int
109 |             doc: y-dimension of image
110 |           - name: z_size
111 |             type: int
112 |             doc: number of z-stacks
113 |   # Lowest-priority source: the stage_qc decoding thresholds are tried first.
114 |   spot_threshold:
115 |     type: float?
116 |     doc: If has_spots is true and this is provided, spots with an intensity lower than this will not be included in qc metrics
117 |   # stage_qc/find_ripley is picked first when non-null (pickValue first_non_null).
118 |   find_ripley:
119 |     type: boolean?
120 |     doc: If true, will run ripley K estimates to find spatial density measures.  Can be slow.
121 |     default: False
122 |   # stage_qc/save_pdf is picked first when non-null (pickValue first_non_null).
123 |   save_pdf:
124 |     type: boolean?
125 |     doc: If true, will save graphical output to a pdf.
126 |     default: True
127 | 
128 | outputs:
129 |   qc_metrics:  # the tmp/<tmp_prefix>/7_QC/ directory globbed by execute_qc
130 |     type: Directory
131 |     outputSource: execute_qc/qc_metrics
132 | 
133 | steps:
134 | 
135 |   tmpname:  # takes no inputs; its `tmp` output is bound to execute_qc's tmp_prefix
136 |     run: tmpdir.cwl
137 |     in: []
138 |     out: [tmp]
139 | 
140 |   read_schema:
141 |     run:
142 |       class: CommandLineTool
143 |       baseCommand: [cat]
144 |       # Prints the file named by `schema` inside the container; stdout becomes `data`.
145 |       requirements:
146 |         - class: DockerRequirement
147 |           dockerPull: hubmap/starfish-custom:latest
148 |         - class: ResourceRequirement
149 |           ramMin: 1000
150 |           tmpdirMin: 1000
151 |           outdirMin: 1000
152 |       # Single positional argument: the path handed to cat.
153 |       inputs:
154 |         schema:
155 |           type: string
156 |           inputBinding: {position: 1}
157 | 
158 |       # Captured standard output of the command.
159 |       outputs:
160 |         data:
161 |           type: stdout
162 | 
163 |     in:
164 |       schema: {valueFrom: "/opt/qc.json"}
165 | 
166 |     out: [data]
167 | 
168 |   stage_qc:  # runs inputParser.cwl on parameter_json; skipped (outputs null) when no json is given
169 |     run: inputParser.cwl
170 |     in:
171 |       datafile: parameter_json
172 |       schema: read_schema/data  # stdout of the read_schema step
173 |     out: [selected_fovs, find_ripley, save_pdf, fov_positioning_x_shape, fov_positioning_y_shape, fov_positioning_z_shape, decoding_decode_method, decoding_magnitude_threshold, decoding_decoder_min_intensity]
174 |     when: $(inputs.datafile != null)
175 | 
176 |   codebook_grabber:
177 |     run:
178 |       class: ExpressionTool
179 |       requirements:
180 |         - class: InlineJavascriptRequirement
181 |         - class: LoadListingRequirement
182 |           loadListing: shallow_listing  # the expression reads experiment.listing
183 |       inputs:
184 |         experiment:
185 |           type: Directory?
186 |           doc: A directory containing a spaceTx-formatted experiment
187 |       # Output: the first listing entry whose basename contains "codebook.json", else null.
188 |       outputs:
189 |         codebook:
190 |           type: File?
191 |       # An ExpressionTool must return an object keyed by output id, even when nothing is found.
192 |       expression: |
193 |         ${
194 |           var entries = inputs.experiment.listing || [];
195 |           for(var i=0; i<entries.length; i++){
196 |             // indexOf rather than ES6 String.includes: CWL expressions are ECMAScript 5.1.
197 |             if(entries[i].basename.indexOf("codebook.json") !== -1){ return {"codebook": entries[i]}; }
198 |           }
199 |           return {"codebook": null};
200 |         }
201 |     in:
202 |       experiment:
203 |         source: [codebook, codebook_exp]
204 |         valueFrom: |
205 |           ${
206 |             // Directory to search: the flattened codebook_exp input when
207 |             // given, otherwise the `exp` field of the codebook record;
208 |             // null (which makes the `when` guard skip the step) otherwise.
209 |             var flat = self[1];
210 |             if (flat) { return flat; }
211 |             var record = self[0];
212 |             return (record && "exp" in record) ? record.exp : null;
213 |           }
214 |     out:
215 |       [codebook]
216 |     when: $(inputs.experiment != null)
217 | 
218 | 
219 |   execute_qc:
220 |     run:
221 |       class: CommandLineTool
222 |       baseCommand: /opt/qcDriver.py
223 |       # data_exp_dir is staged, writable, into the working directory as input_dir_<tmp_prefix>.
224 |       requirements:
225 |         DockerRequirement:
226 |           dockerPull: hubmap/starfish-custom:latest
227 |         InitialWorkDirRequirement:
228 |           listing:
229 |             - entryname: "$('input_dir_' + inputs.tmp_prefix)"
230 |               writable: true
231 |               entry: "$(inputs.data_exp_dir)"
232 |       # Inputs that carry an inputBinding are passed on the command line with the given prefix.
233 |       inputs:
234 |         tmp_prefix:  # also used to build the staged directory name and the output glob
235 |           type: string
236 |           inputBinding:
237 |             prefix: --tmp-prefix
238 |         codebook:  # required union: a pickle (--codebook-pkl) or a codebook file (--codebook-file)
239 |           type:
240 |             - type: record
241 |               name: pkl
242 |               fields:
243 |                 pkl:
244 |                   type: File
245 |                   inputBinding:
246 |                     prefix: --codebook-pkl
247 |             - type: record
248 |               name: exp
249 |               fields:
250 |                 exp:
251 |                   type: File
252 |                   inputBinding:
253 |                     prefix: --codebook-file
254 | 
255 |         segmentation_loc:
256 |           type: Directory?
257 |           inputBinding:
258 |             prefix: --segmentation-loc
259 |         # No inputBinding: only staged via InitialWorkDirRequirement. NOTE(review): non-optional, yet the step binding can evaluate to null - confirm.
260 |         data_exp_dir:
261 |           type: Directory
262 |         # Only the pickle variant of the data record exists at tool level.
263 |         data:
264 |           type:
265 |           - 'null'
266 |           - type: record
267 |             name: pkl
268 |             fields:
269 |               spots:
270 |                 type: File?
271 |                 inputBinding:
272 |                   prefix: --spots-pkl
273 |               transcripts:
274 |                 type: File
275 |                 inputBinding:
276 |                   prefix: --transcript-pkl
277 |         # A string (the step passes the staged directory name), given as --exp-output.
278 |         data_exp_staged:
279 |           type: string
280 |           inputBinding:
281 |             prefix: --exp-output
282 | 
283 |         selected_fovs:
284 |           type: int[]?
285 |           inputBinding:
286 |             prefix: --selected-fovs
287 |           doc: If provided, processing will only be run on FOVs with these indices.
288 | 
289 |         has_spots:
290 |           type: boolean?
291 |           inputBinding:
292 |             prefix: --has-spots
293 | 
294 |         roi:
295 |           type: File?
296 |           inputBinding: 
297 |             prefix: --roi
298 |         # Union written directly as the parameter value (no `type:` key): null, a locs file, or explicit sizes.
299 |         imagesize:
300 |           - 'null'
301 |           - type: record
302 |             name: locs
303 |             fields:
304 |               locs:
305 |                 type: File?
306 |                 inputBinding:
307 |                   prefix: --loc-json
308 |           - type: record
309 |             fields:
310 |               - name: x_size
311 |                 type: int
312 |                 inputBinding:
313 |                   prefix: --x-size
314 |               - name: y_size
315 |                 type: int
316 |                 inputBinding:
317 |                   prefix: --y-size
318 |               - name: z_size
319 |                 type: int
320 |                 inputBinding:
321 |                   prefix: --z-size
322 | 
323 |         spot_threshold:
324 |           type: float?
325 |           inputBinding:
326 |             prefix: --spot-threshold
327 | 
328 |         find_ripley:
329 |           type: boolean?
330 |           inputBinding:
331 |             prefix: --run-ripley
332 |           default: False
333 | 
334 |         save_pdf:
335 |           type: boolean?
336 |           inputBinding:
337 |             prefix: --save-pdf
338 |           default: True
339 |       # The tool's only output: the directory tmp/<tmp_prefix>/7_QC/.
340 |       outputs:
341 |         qc_metrics:
342 |           type: Directory
343 |           outputBinding:
344 |             glob: $("tmp/" + inputs.tmp_prefix + "/7_QC/")
345 |     in:
346 |       tmp_prefix: tmpname/tmp
347 |       codebook:
348 |         source: [codebook, codebook_grabber/codebook, codebook_pkl]
349 |         valueFrom: |
350 |           ${
351 |             // Precedence: the codebook file found by codebook_grabber, then
352 |             // the codebook record input as given, then the flattened pickle.
353 |             var grabbed = self[1];
354 |             var record = self[0];
355 |             if (grabbed) { return {exp: grabbed}; }
356 |             if (record) { return record; }
357 |             return {pkl: self[2]};
358 |           }
359 |       segmentation_loc: segmentation_loc
360 |       selected_fovs:
361 |         source: [stage_qc/selected_fovs, selected_fovs]
362 |         valueFrom: |
363 |           ${
364 |             // Resolve selected_fovs: the stage_qc output is used when
365 |             // truthy, else the workflow-level input, else null.
366 |             // (An empty array is truthy in JavaScript and is kept.)
367 |             var staged = self[0];
368 |             var direct = self[1];
369 |             var chosen = staged || direct;
370 |             return chosen ? chosen : null;
371 |           }
372 |       has_spots:
373 |         source: [stage_qc/decoding_decode_method, has_spots]
374 |         valueFrom: |
375 |           ${
376 |              // True when stage_qc reported a non-empty decode method or the
377 |              // has_spots workflow input is truthy; false otherwise.
378 |              var method = self[0];
379 |              var staged_hit = Boolean(method && method.length);
380 |              return staged_hit || Boolean(self[1]);
381 |           }
382 |       data:
383 |         source: [data, data_pkl_spots, data_pkl_transcripts]
384 |         valueFrom: |
385 |           ${
386 |             // The tool's `data` record has spots/transcripts as direct fields
387 |             // (pkl is only the record's name), so the flattened pickles are
388 |             // returned unwrapped to match that schema and reach --transcript-pkl.
389 |             var record = self[0];
390 |             if (record && !("exp" in record)) { return record; }
391 |             if (self[2]) { return {spots: self[1], transcripts: self[2]}; }
392 |             return null;
393 |           }
394 |       data_exp_dir:
395 |         source: [data, data_exp]
396 |         valueFrom: |
397 |           ${
398 |             // Directory to stage: the `exp` field of the data record when
399 |             // that variant was supplied, otherwise the flattened data_exp
400 |             // input; null when neither is available.
401 |             var record = self[0];
402 |             if (record && "exp" in record) { return record.exp; }
403 |             var flat = self[1];
404 |             return flat ? flat : null;
405 |           }
406 |       data_exp_staged:
407 |         valueFrom: $("input_dir_" + inputs.tmp_prefix)
408 |       roi: roi
409 |       imagesize:
410 |         source: [imagesize, stage_qc/fov_positioning_x_shape, stage_qc/fov_positioning_y_shape, stage_qc/fov_positioning_z_shape, locs_json]
411 |         valueFrom: |
412 |           ${
413 |             // self = [imagesize, staged x, staged y, staged z, locs_json].
414 |             // A truthy staged x shape selects the explicit-size record built
415 |             // from the stage_qc outputs; otherwise fall back to the imagesize
416 |             // input as given, then to the flattened locs_json file.
417 |             var staged_x = self[1];
418 |             if (staged_x) {
419 |               return {
420 |                 "x_size": staged_x,
421 |                 "y_size": self[2],
422 |                 "z_size": self[3]
423 |               };
424 |             }
425 |             if (self[0]) { return self[0]; }
426 |             if (self[4]) { return {"locs": self[4]}; }
427 |             return null;
428 |           }
429 |       spot_threshold:
430 |         source: [stage_qc/decoding_decoder_min_intensity, stage_qc/decoding_magnitude_threshold, spot_threshold]
431 |         valueFrom: |
432 |           ${
433 |              // First truthy value wins, in this order: stage_qc's decoder
434 |              // min intensity, stage_qc's magnitude threshold, then the
435 |              // spot_threshold workflow input. A threshold of 0 is falsy
436 |              // and is therefore skipped.
437 |              for (var k = 0; k < self.length; k++) {
438 |                if (self[k]) {
439 |                  return self[k];
440 |                }
441 |              }
442 |              return null;
443 |           }
443 |       find_ripley:
444 |         source: [stage_qc/find_ripley, find_ripley]
445 |         pickValue: first_non_null
446 |       save_pdf:
447 |         source: [stage_qc/save_pdf, save_pdf]
448 |         pickValue: first_non_null
449 | 
450 |     out: [qc_metrics]
451 | 


--------------------------------------------------------------------------------
/steps/segmentation.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 | 
 12 | inputs:
 13 |   decoded_loc:
 14 |     type: Directory
 15 |     doc: Location of the directory that is the output from the starfishRunner step.
 16 | 
 17 |   exp_loc:
 18 |     type: Directory
 19 |     doc: Location of directory containing the 'experiment.json' file
 20 | 
 21 |   parameter_json:
 22 |     type: File?
 23 |     doc: File containing parameters to run this step.
 24 | 
 25 |   selected_fovs:
 26 |     type: int[]?
 27 |     doc: If provided, segmentation will only be run on FOVs with these indices.
 28 | 
 29 |   aux_name:
 30 |     type: string?
 31 |     doc: The name of the aux view to look at in the experiment file.
 32 | 
 33 |   mask_roi_files:
 34 |     type: Directory?
 35 |     doc: Flattened directory input, refer to record entry "binary_mask"
 36 | 
 37 |   mask_roi_formats:
 38 |     type: string?
 39 |     doc: Flattened record input, refer to record entry "binary_mask"
 40 | 
 41 |   mask_labeled_files:
 42 |     type: Directory?
 43 |     doc: Flattened directory input, refer to record entry "binary_mask"
 44 | 
 45 |   mask_labeled_formats:
 46 |     type: string?
 47 |     doc: Flattened record input, refer to record entry "binary_mask"
 48 | 
 49 |   binary_mask:
 50 |     - 'null'
 51 |     - type: record
 52 |       name: roi_set
 53 |       fields:
 54 |         roi_set:
 55 |           type: Directory
 56 |           doc: Directory of RoiSet.zip for each fov, from fiji segmentation
 57 |         file_formats:
 58 |           type: string
 59 |           doc: Layout for name of each RoiSet.zip, per fov. Will be formatted with String.format([fov index]).
 60 |     - type: record
 61 |       name: labeled_image
 62 |       fields:
 63 |         labeled_image:
 64 |           type: Directory
 65 |           doc: Directory of labeled images with image segmentation data, such as from ilastik classification.
 66 |         file_formats_labeled:
 67 |           type: string
 68 |           doc: Layout for name of each labelled image. Will be formatted with String.format([fov index])
 69 |     - type: record
 70 |       name: basic_watershed
 71 |       fields:
 72 |         img_threshold:
 73 |           type: float
 74 |           doc: Global threshold value for images
 75 |         min_dist:
 76 |           type: int
 77 |           doc: minimum distance (pixels) between distance transformed peaks
 78 |         min_allowed_size:
 79 |           type: int
 80 |           doc: minimum size for a cell (in pixels)
 81 |         max_allowed_size:
 82 |           type: int
 83 |           doc: maximum size for a cell (in pixels)
 84 |         masking_radius:
 85 |           type: int
 86 |           doc: Radius for white tophat noise filter
 87 |     - type: record
 88 |       name: density_based
 89 |       fields:
 90 |         nuclei_view:
 91 |           type: string
 92 |           doc: Name of the auxiliary view with nuclei data
 93 |         cyto_seg:
 94 |           type: boolean
 95 |           doc: If true, the cytoplasm will be segmented
 96 |         correct_seg:
 97 |           type: boolean
 98 |           doc: If true, suspected nuclei/cytoplasms that overlap will be removed.
 99 |         border_buffer:
100 |           type: int
101 |           doc: If not None, removes cytoplasms whose nuclei lie within the given distance from the border.
102 |         area_thresh:
103 |           type: float
104 |           doc: Threshold used when determining if an object is one nucleus or two or more overlapping nuclei. Objects whose ratio of convex hull area to normal area are above this threshold are removed if the option to remove overlapping nuclei is set.
105 |         thresh_block_size:
106 |           type: int
107 |           doc: Size of structuring element for local thresholding of nuclei. If nuclei interiors aren't passing threshold, increase this value, if too much non-nuclei is passing threshold, lower it.
108 |         watershed_footprint_size:
109 |           type: int
110 |           doc: Size of structuring element for watershed segmentation. Larger values will segment the nuclei into larger objects and smaller values will result in smaller objects. Adjust according to nucleus size.
111 |         label_exp_size:
112 |           type: int
113 |           doc:  Pixel size labels are dilated by in final step. Helpful for closing small holes that are common from thresholding but can also cause cell boundaries to exceed their true boundaries if set too high. Label dilation respects label borders and does not mix labels.
114 | 
115 | outputs:
116 |   segmented:
117 |     type: Directory
118 |     outputSource: execute_segmentation/segmented
119 | 
120 | steps:
121 | 
122 |   tmpname:  # Supplies the `tmp` string that execute_segmentation receives as tmp_prefix.
123 |     run: tmpdir.cwl
124 |     in: []
125 |     out: [tmp]
126 | 
127 |   read_schema:  # Emits the contents of the segmentation schema file for stage_segmentation.
128 |     run:
129 |       class: CommandLineTool
130 |       baseCommand: cat  # Prints the file named by the `schema` argument.
131 | 
132 |       requirements:
133 |         DockerRequirement:
134 |           dockerPull: hubmap/starfish-custom:latest  # `cat` runs in this image, so the schema path is resolved there.
135 |         ResourceRequirement:
136 |           ramMin: 1000
137 |           tmpdirMin: 1000
138 |           outdirMin: 1000
139 | 
140 |       inputs:
141 |         schema:
142 |           type: string  # A plain string path, not a File object.
143 |           inputBinding:
144 |             position: 1
145 | 
146 |       outputs:
147 |         data:
148 |           type: stdout  # Captured standard output of `cat`.
149 | 
150 |     in:
151 |       schema:
152 |         valueFrom: "/opt/segmentation.json"  # Fixed path; there is no workflow-level override.
153 |     out: [data]
154 | 
155 |   stage_segmentation:  # Runs inputParser.cwl on parameter_json using the schema text from read_schema.
156 |     run: inputParser.cwl
157 |     in:
158 |       datafile: parameter_json
159 |       schema: read_schema/data
160 |     out: [selected_fovs, aux_name, binary_mask_img_threshold, binary_mask_min_dist, binary_mask_min_allowed_size, binary_mask_max_allowed_size, binary_mask_masking_radius, binary_mask_nuclei_view, binary_mask_cyto_seg, binary_mask_correct_seg, binary_mask_border_buffer, binary_mask_area_thresh, binary_mask_thresh_block_size, binary_mask_watershed_footprint_size, binary_mask_label_exp_size]
161 |     when: $(inputs.datafile != null)  # Skipped when parameter_json is absent; every output above is then null.
162 |   execute_segmentation:
163 |     run:
164 |       class: CommandLineTool
165 |       baseCommand: /opt/segmentationDriver.py
166 | 
167 |       requirements:
168 |         DockerRequirement:
169 |           dockerPull: hubmap/starfish-custom:latest
170 |         InitialWorkDirRequirement:
171 |           listing:
172 |             - entryname: "$('input_dir_'+inputs.tmp_prefix)"
173 |               writable: true
174 |               entry: "$(inputs.exp_loc)"
175 | 
176 |       inputs:
177 |         tmp_prefix:
178 |           type: string
179 |           inputBinding:
180 |             prefix: --tmp-prefix
181 | 
182 |         decoded_loc:
183 |           type: Directory
184 |           inputBinding:
185 |             prefix: --decoded-loc
186 | 
187 |         exp_loc:
188 |           type: Directory
189 | 
190 |         exp_loc_staged:
191 |           type: string
192 |           inputBinding:
193 |             prefix: --exp-loc
194 | 
195 |         selected_fovs:
196 |           type: int[]?
197 |           inputBinding:
198 |             prefix: --selected-fovs
199 |           doc: If provided, segmentation will only be run on FOVs with these indices.
200 | 
201 |         aux_name:
202 |           type: string?
203 |           inputBinding:
204 |             prefix: --aux-name
205 | 
206 |         binary_mask:
207 |           type:
208 |             - type: record
209 |               name: roi_set
210 |               fields:
211 |                 roi_set:
212 |                   type: Directory
213 |                   inputBinding:
214 |                     prefix: --roi-set
215 |                 file_formats:
216 |                   type: string
217 |                   inputBinding:
218 |                     prefix: --file-formats
219 |             - type: record
220 |               name: labeled_image
221 |               fields:
222 |                 labeled_image:
223 |                   type: Directory
224 |                   inputBinding:
225 |                     prefix: --labeled-image
226 |                 file_formats_labeled:
227 |                   type: string
228 |                   inputBinding:
229 |                     prefix: --file-formats-labeled
230 |             - type: record
231 |               name: basic_watershed
232 |               fields:
233 |                 img_threshold:
234 |                   type: float
235 |                   inputBinding:
236 |                     prefix: --img-threshold
237 |                 min_dist:
238 |                   type: int
239 |                   inputBinding:
240 |                     prefix: --min-dist
241 |                 min_allowed_size:
242 |                   type: int
243 |                   inputBinding:
244 |                     prefix: --min-size
245 |                 max_allowed_size:
246 |                   type: int
247 |                   inputBinding:
248 |                     prefix: --max-size
249 |                 masking_radius:
250 |                   type: int
251 |                   inputBinding:
252 |                     prefix: --masking-radius
253 |             - type: record
254 |               name: density_based
255 |               fields:
256 |                 nuclei_view:
257 |                   type: string
258 |                   inputBinding:
259 |                     prefix: --nuclei-view
260 |                 cyto_seg:
261 |                   type: boolean
262 |                   inputBinding:
263 |                     prefix: --cyto-seg
264 |                 correct_seg:
265 |                   type: boolean
266 |                   inputBinding:
267 |                     prefix: --correct-seg
268 |                 border_buffer:
269 |                   type: int
270 |                   inputBinding:
271 |                     prefix: --border-buffer
272 |                 area_thresh:
273 |                   type: float
274 |                   inputBinding:
275 |                     prefix: --area-thresh
276 |                 thresh_block_size:
277 |                   type: int
278 |                   inputBinding:
279 |                     prefix: --thresh-block-size
280 |                 watershed_footprint_size:
281 |                   type: int
282 |                   inputBinding:
283 |                     prefix: --watershed-footprint-size
284 |                 label_exp_size:
285 |                   type: int
286 |                   inputBinding:
287 |                     prefix: --label-exp-size
288 | 
289 |       outputs:
290 |         segmented:
291 |           type: Directory
292 |           outputBinding:
293 |             glob: $("tmp/" + inputs.tmp_prefix + "/5_Segmented/")
294 | 
295 |     in:
296 |       tmp_prefix: tmpname/tmp
297 |       decoded_loc: decoded_loc
298 |       exp_loc: exp_loc
299 |       exp_loc_staged:
300 |         valueFrom: $("input_dir_" + inputs.tmp_prefix)
301 |       selected_fovs:
302 |         source: [stage_segmentation/selected_fovs, selected_fovs]
303 |         valueFrom: |
304 |           ${
305 |             /* The stage_segmentation output is checked before the direct workflow input. */
306 |             var chosen = self[0] || self[1];
307 |             if(!chosen){
308 |               /* Neither source held a truthy value. */
309 |               return null;
310 |             }
311 |             return chosen;
312 |           }
313 |       aux_name:
314 |         source: [stage_segmentation/aux_name, aux_name]
315 |         valueFrom: |
316 |           ${
317 |             /* Walk both sources in priority order and keep the first truthy one. */
318 |             for(var i = 0; i < 2; i++){
319 |               if(self[i]){
320 |                 return self[i];
321 |               }
322 |             }
323 |             return null;
324 |           }
325 |       binary_mask:
326 |         source: [binary_mask, stage_segmentation/binary_mask_img_threshold, stage_segmentation/binary_mask_min_dist, stage_segmentation/binary_mask_min_allowed_size, stage_segmentation/binary_mask_max_allowed_size, stage_segmentation/binary_mask_masking_radius, stage_segmentation/binary_mask_nuclei_view, stage_segmentation/binary_mask_cyto_seg, stage_segmentation/binary_mask_correct_seg, stage_segmentation/binary_mask_border_buffer, stage_segmentation/binary_mask_area_thresh, stage_segmentation/binary_mask_thresh_block_size, stage_segmentation/binary_mask_watershed_footprint_size, stage_segmentation/binary_mask_label_exp_size, mask_roi_files, mask_roi_formats, mask_labeled_files, mask_labeled_formats]
327 |         valueFrom: |
328 |           ${
329 |             /* Index map: 0 workflow record, 1-5 staged watershed fields, 6-13 staged density fields, 14-17 flattened mask inputs. */
330 |             var roiDir = self[14], roiFormat = self[15];
331 |             var labeledDir = self[16], labeledFormat = self[17];
332 |             var threshold = self[1], nucleiView = self[6];
333 |             if(roiDir && roiFormat){
334 |               return {"roi_set": roiDir, "file_formats": roiFormat};
335 |             }
336 |             if(labeledDir && labeledFormat){
337 |               return {"labeled_image": labeledDir, "file_formats_labeled": labeledFormat};
338 |             }
339 |             if(!(threshold || nucleiView)){
340 |               return self[0]; /* nothing staged: pass the workflow-level record through */
341 |             }
342 |             if(threshold){
343 |               return {
344 |                 "img_threshold": threshold,
345 |                 "min_dist": self[2],
346 |                 "min_allowed_size": self[3],
347 |                 "max_allowed_size": self[4],
348 |                 "masking_radius": self[5]
349 |               };
350 |             }
351 |             return {
352 |               "nuclei_view": nucleiView,
353 |               "cyto_seg": self[7],
354 |               "correct_seg": self[8],
355 |               "border_buffer": self[9],
356 |               "area_thresh": self[10],
357 |               "thresh_block_size": self[11],
358 |               "watershed_footprint_size": self[12],
359 |               "label_exp_size": self[13]
360 |             };
361 |           }
362 |     out: [segmented]
363 | 


--------------------------------------------------------------------------------
/steps/sorter.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 | 
 12 | inputs:
 13 |   input_dir:
 14 |     type: Directory
 15 |     doc: The root directory containing all images.
 16 | 
 17 |   dir_size:
 18 |     type: long?
 19 |     doc: Size of input_dir, in MiB. If provided, will be used to calculate ResourceRequirement.
 20 | 
 21 |   codebook_csv:
 22 |     type: File?
 23 |     doc: Flattened csv input, refer to record entry.
 24 | 
 25 |   codebook_json:
 26 |     type: File?
 27 |     doc: Flattened json input, refer to record entry.
 28 | 
 29 |   codebook:
 30 |     type:
 31 |       - 'null'
 32 |       - type: record
 33 |         name: csv
 34 |         fields:
 35 |           csv:
 36 |             type: File
 37 |             doc: The codebook for this experiment in .csv format, where the rows are barcodes and the columns are imaging rounds. Column IDs are expected to be sequential, and round identifiers are expected to be integers (not roman numerals).
 38 |       - type: record
 39 |         name: json
 40 |         fields:
 41 |           json:
 42 |             type: File
 43 |             doc: The codebook for this experiment, already formatted in the spaceTx defined .json format.
 44 | 
 45 |   channel_yml:
 46 |     type: File
 47 |     doc: PyYML-formatted list containing a dictionary outlining how the truechannels in imaging relate to the pseudochannels in the decoding codebook. The index of each dict within the list is the trueround % (count of pseudorounds). The keys of the dict are the channels within the image and the values are the pseudochannels in the converted notebook.
 48 | 
 49 |   cycle_yml:
 50 |     type: File
 51 |     doc: PyYML-formatted dictionary outlining how the truerounds in imaging relate to the pseudorounds in the decoding codebook. The keys are truerounds and the values are the corresponding pseudorounds.
 52 | 
 53 |   parameter_json:
 54 |     type: File?
 55 |     doc: json file containing parameters for conversion
 56 | 
 57 |   file_format:
 58 |     type: string?
 59 |     doc: String with layout for .tiff files. Will be formatted via str.format().
 60 | 
 61 |   file_vars:
 62 |     type: string[]?
 63 |     doc: Variables to get substituted into the file_format string.
 64 | 
 65 |   cache_read_order:
 66 |     type: string[]?
 67 |     doc: Order of x,y,z,ch dimensions within each image.
 68 | 
 69 |   fov_count:
 70 |     type: int?
 71 |     doc: The number of FOVs that are included in this experiment
 72 | 
 73 |   round_offset:
 74 |     type: int?
 75 |     doc: The index of the first round (for file names).
 76 |     default: 0
 77 | 
 78 |   fov_offset:
 79 |     type: int?
 80 |     doc: The index of the first FOV (for file names).
 81 |     default: 0
 82 | 
 83 |   channel_offset:
 84 |     type: int?
 85 |     doc: The index of the first channel (for file names).
 86 |     default: 0
 87 | 
 88 |   channel_slope:
 89 |     type: float?
 90 |     default: 1
 91 | 
 92 |   aux_tilesets:  # Optional record; execute_sort falls back to it when no aux_names are staged from parameter_json.
 93 |     - 'null'
 94 |     - type: record
 95 |       name: aux_tilesets
 96 |       fields:
 97 |         aux_names:
 98 |           type: string[]?
 99 |           doc: Names of the Auxiliary tiles.
100 |         aux_file_formats:
101 |           type: string[]?
102 |           doc: String layout for .tiff files of aux views.
103 |         aux_file_vars:
104 |           type: string[]?
105 |           doc: Variables to be substituted into aux_file_formats. One entry per aux_name, with semicolon-delimited vars.
106 |         aux_cache_read_order:
107 |           type: string[]?
108 |           doc: Order of non x,y dimensions within each image. One entry per aux_name, with semicolon-delimited vars.
109 |         aux_channel_count:
110 |           type: int[]?  # Integer counts, matching the int[]? field that the execute_sort tool declares for --aux-channel-count.
111 |           doc: Count of channels in each aux image.
112 |         aux_channel_slope:
113 |           type: float[]?
114 |           doc: Used to convert 0-indexed channel IDs to the channel index within the image.  Calculated as (image index) = int(index*slope) + intercept
115 |         aux_channel_intercept:
116 |           type: int[]?
117 |           doc: Used to convert 0-indexed channel IDs to the channel index within the image.  Calculated as (image index) = int(index*slope) + intercept
118 | 
119 | 
120 | outputs:
121 |   pseudosorted_dir:
122 |     type: Directory
123 |     outputSource: execute_sort/pseudosorted_dir
124 | 
125 | steps:
126 | 
127 |   read_schema:  # Emits the contents of the sorter schema file for stage_sort.
128 |     run:
129 |       class: CommandLineTool
130 |       baseCommand: cat  # Prints the file named by the `schema` argument.
131 | 
132 |       requirements:
133 |         DockerRequirement:
134 |           dockerPull: hubmap/starfish-custom:latest  # `cat` runs in this image, so the schema path is resolved there.
135 |         ResourceRequirement:
136 |           ramMin: 1000
137 |           tmpdirMin: 1000
138 |           outdirMin: 1000
139 | 
140 |       inputs:
141 |         schema:
142 |           type: string  # A plain string path, not a File object.
143 |           inputBinding:
144 |             position: 1
145 | 
146 |       outputs:
147 |         data:
148 |           type: stdout  # Captured standard output of `cat`.
149 | 
150 |     in:
151 |       schema:
152 |         valueFrom: "/opt/sorter.json"  # Fixed path; there is no workflow-level override.
153 |     out: [data]
154 | 
155 |   tmpname:  # Supplies the `tmp` string that execute_sort receives as tmp_prefix.
156 |     run: tmpdir.cwl
157 |     in: []
158 |     out: [tmp]
159 | 
160 |   stage_sort:  # Runs inputParser.cwl on parameter_json using the schema text from read_schema.
161 |     run: inputParser.cwl
162 |     in:
163 |       datafile: parameter_json
164 |       schema: read_schema/data
165 |     out: [round_count, fov_count, round_offset, fov_offset, channel_offset, channel_slope, file_format, file_vars, cache_read_order, aux_tilesets_aux_names, aux_tilesets_aux_file_formats, aux_tilesets_aux_file_vars, aux_tilesets_aux_cache_read_order, aux_tilesets_aux_channel_count, aux_tilesets_aux_channel_slope, aux_tilesets_aux_channel_intercept]
166 |     when: $(inputs.datafile != null)  # Skipped when parameter_json is absent; outputs are then null. NOTE(review): round_count is not wired into execute_sort.
167 | 
168 |   execute_sort:
169 |     run:
170 |       class: CommandLineTool
171 |       baseCommand: /opt/pseudoSort.py
172 | 
173 |       requirements:
174 |         DockerRequirement:
175 |           dockerPull: hubmap/starfish-custom:latest
176 |         ResourceRequirement:
177 |           tmpdirMin: |
178 |             ${
179 |               /* dir_size is optional; with no hint the expression yields null. */
180 |               var hint = inputs.dir_size;
181 |               var noHint = (hint === null);
182 |               /* Otherwise ask for 1.2 times the hinted size. */
183 |               return noHint ? null : hint * 1.2;
184 |             }
185 |           outdirMin: |
186 |             ${
187 |               var hint = inputs.dir_size;
188 |               if(hint !== null) {
189 |                 return hint * 1.2;
190 |               }
191 |               return null; /* no hint supplied */
192 |             }
193 | 
194 |       inputs:
195 | 
196 |         dir_size:
197 |           type: long?
198 | 
199 |         tmp_prefix:
200 |           type: string
201 |           inputBinding: 
202 |             prefix: --tmp-prefix
203 | 
204 |         input_dir:
205 |           type: Directory
206 |           inputBinding:
207 |             prefix: --input-dir
208 | 
209 |         codebook:
210 |           type:
211 |             - type: record
212 |               name: csv
213 |               fields:
214 |                 csv:
215 |                   type: File
216 |                   inputBinding:
217 |                     prefix: --codebook-csv
218 |             - type: record
219 |               name: json
220 |               fields:
221 |                 json:
222 |                   type: File
223 |                   inputBinding:
224 |                     prefix: --codebook-json
225 | 
226 |         channel_yml:
227 |           type: File
228 |           inputBinding:
229 |             prefix: --channel-yml
230 | 
231 |         cycle_yml:
232 |           type: File
233 |           inputBinding:
234 |             prefix: --cycle-yml
235 | 
236 |         file_format:
237 |           type: string
238 |           inputBinding:
239 |             prefix: --file-format
240 | 
241 |         file_vars:
242 |           type: string[]
243 |           inputBinding:
244 |             prefix: --file-vars
245 | 
246 |         cache_read_order:
247 |           type: string[]
248 |           inputBinding:
249 |             prefix: --cache-read-order
250 | 
251 |         fov_count:
252 |           type: int
253 |           inputBinding:
254 |             prefix: --fov-count
255 | 
256 |         round_offset:
257 |           type: int?
258 |           inputBinding:
259 |             prefix: --round-offset
260 | 
261 |         fov_offset:
262 |           type: int?
263 |           inputBinding:
264 |             prefix: --fov-offset
265 | 
266 |         channel_offset:
267 |           type: int?
268 |           inputBinding:
269 |             prefix: --channel-offset
270 | 
271 |         channel_slope:
272 |           type: float?
273 |           inputBinding:
274 |             prefix: --channel-slope
275 | 
276 |         aux_tilesets:
277 |           type:
278 |             type: record
279 |             name: aux_tilesets
280 |             fields:
281 |               aux_names:
282 |                 type: string[]?
283 |                 inputBinding:
284 |                   prefix: --aux-names
285 |               aux_file_formats:
286 |                 type: string[]?
287 |                 inputBinding:
288 |                   prefix: --aux-file-formats
289 |               aux_file_vars:
290 |                 type: string[]?
291 |                 inputBinding:
292 |                   prefix: --aux-file-vars
293 |               aux_cache_read_order:
294 |                 type: string[]?
295 |                 inputBinding:
296 |                   prefix: --aux-cache-read-order
297 |               aux_channel_count:
298 |                 type: int[]?
299 |                 inputBinding:
300 |                   prefix: --aux-channel-count
301 |               aux_channel_slope:
302 |                 type: float[]?
303 |                 inputBinding:
304 |                   prefix: --aux-channel-slope
305 |               aux_channel_intercept:
306 |                 type: int[]?
307 |                 inputBinding:
308 |                   prefix: --aux-channel-intercept
309 | 
310 |       outputs:
311 |         pseudosorted_dir:
312 |           type: Directory
313 |           outputBinding:
314 |             glob: $("tmp/" + inputs.tmp_prefix + "/1_pseudosort/")
315 | 
316 |         log:
317 |           type: stdout
318 |     in:
319 |       dir_size: dir_size
320 |       tmp_prefix: tmpname/tmp
321 |       input_dir: input_dir
322 |       codebook:
323 |         source: [codebook, codebook_csv, codebook_json]
324 |         linkMerge: merge_flattened
325 |         valueFrom: |
326 |           ${
327 |             /* Prefer the full record, then the flattened csv, then the flattened json. */
328 |             var record = self[0], csvFile = self[1], jsonFile = self[2];
329 |             if(record){
330 |               return record;
331 |             }
332 |             /* The json variant is the fallback even when jsonFile is null. */
333 |             return csvFile ? {csv: csvFile} : {json: jsonFile};
334 |           }
335 |       channel_yml: channel_yml
336 |       cycle_yml: cycle_yml
337 |       file_format:
338 |         source: [stage_sort/file_format, file_format]
339 |         pickValue: first_non_null
340 |       file_vars:
341 |         source: [stage_sort/file_vars, file_vars]
342 |         pickValue: first_non_null
343 |       cache_read_order:
344 |         source: [stage_sort/cache_read_order, cache_read_order]
345 |         pickValue: first_non_null
346 |       fov_count:
347 |         source: [stage_sort/fov_count, fov_count]
348 |         pickValue: first_non_null
349 |       round_offset:
350 |         source: [stage_sort/round_offset, round_offset]
351 |         pickValue: first_non_null
352 |       fov_offset:
353 |         source: [stage_sort/fov_offset, fov_offset]
354 |         pickValue: first_non_null
355 |       channel_offset:
356 |         source: [stage_sort/channel_offset, channel_offset]
357 |         pickValue: first_non_null
358 |       channel_slope:
359 |         source: [stage_sort/channel_slope, channel_slope]
360 |         pickValue: first_non_null
361 |       aux_tilesets:
362 |         source: [aux_tilesets, stage_sort/aux_tilesets_aux_names, stage_sort/aux_tilesets_aux_file_formats, stage_sort/aux_tilesets_aux_file_vars, stage_sort/aux_tilesets_aux_cache_read_order, stage_sort/aux_tilesets_aux_channel_count, stage_sort/aux_tilesets_aux_channel_slope, stage_sort/aux_tilesets_aux_channel_intercept]
363 |         valueFrom: |
364 |           ${
365 |             var stagedNames = self[1]; /* staged aux_names decide which variant is used */
366 |             if(stagedNames){
367 |               return {
368 |                 aux_names: stagedNames,
369 |                 aux_file_formats: self[2],
370 |                 aux_file_vars: self[3],
371 |                 aux_cache_read_order: self[4],
372 |                 aux_channel_count: self[5],
373 |                 aux_channel_slope: self[6],
374 |                 aux_channel_intercept: self[7]
375 |               };
376 |             }
377 |             return self[0]; /* no staged names: pass the workflow-level record through */
378 |           }
379 |     out:
380 |       [pseudosorted_dir]
381 | 


--------------------------------------------------------------------------------
/steps/spaceTxConversion.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 | 
 12 | inputs:
 13 |   tiffs:
 14 |     type: Directory
 15 |     doc: The directory containing all .tiff files
 16 | 
 17 |   dir_size:
 18 |     type: long?
 19 |     doc: Size of tiffs, in MiB. If provided, will be used to calculate ResourceRequirement.
 20 | 
 21 |   codebook_csv:
 22 |     type: File?
 23 |     doc: Flattened csv input, refer to record entry.
 24 | 
 25 |   codebook_json:
 26 |     type: File?
 27 |     doc: Flattened json input, refer to record entry.
 28 | 
 29 |   locs_json:
 30 |     type: File?
 31 |     doc: Flattened json input, refer to record entry.
 32 | 
 33 |   data_org_file:
 34 |     type: File?
 35 |     doc: The data org file used to describe .dax formatted images.
 36 | 
 37 |   codebook:
 38 |     type:
 39 |       - 'null'
 40 |       - type: record
 41 |         name: csv
 42 |         fields:
 43 |           csv:
 44 |             type: File
 45 |             doc: The codebook for this experiment in .csv format, where the rows are barcodes and the columns are imaging rounds. Column IDs are expected to be sequential, and round identifiers are expected to be integers (not roman numerals).
 46 |       - type: record
 47 |         name: json
 48 |         fields:
 49 |           json:
 50 |             type: File
 51 |             doc: The codebook for this experiment, already formatted in the spaceTx defined .json format.
 52 | 
 53 |   parameter_json:
 54 |     type: File?
 55 |     doc: json file with values to be read into other input variables.
 56 | 
 57 |   round_count:
 58 |     type: int?
 59 |     doc: The number of imaging rounds in the experiment
 60 | 
 61 |   zplane_count:
 62 |     type: int?
 63 |     doc: The number of z-planes in each image
 64 | 
 65 |   channel_count:
 66 |     type: int?
 67 |     doc: The number of total channels per imaging round
 68 | 
 69 |   fov_count:
 70 |     type: int?
 71 |     doc: The number of FOVs that are included in this experiment
 72 | 
 73 |   round_offset:
 74 |     type: int?
 75 |     doc: The index of the first round (for file names).
 76 |     default: 0
 77 | 
 78 |   fov_offset:
 79 |     type: int?
 80 |     doc: The index of the first FOV (for file names).
 81 |     default: 0
 82 | 
 83 |   channel_offset:
 84 |     type: int?
 85 |     doc: The index of the first channel (for file names).
 86 |     default: 0
 87 | 
 88 |   zplane_offset:
 89 |     type: int?
 90 |     doc: The index of the first zplane (for file names).
 91 |     default: 0
 92 | 
 93 |   file_format:
 94 |     type: string?
 95 |     doc: String with layout for .tiff files
 96 | 
 97 |   file_vars:
 98 |     type: string[]?
 99 |     doc: Variables to get substituted into the file_format string.
100 | 
101 |   cache_read_order:
102 |     type: string[]?
103 |     doc: Order of non x,y dimensions within each image.
104 | 
105 |   aux_tilesets:
106 |     - 'null'
107 |     - type: record
108 |       name: aux_tilesets
109 |       fields:
110 |         aux_names:
111 |           type: string[]?
112 |           doc: Names of the Auxiliary tiles.
113 |         aux_file_formats:
114 |           type: string[]?
115 |           doc: String layout for .tiff files of aux views.
116 |         aux_file_vars:
117 |           type: string[]?
118 |           doc: Variables to be substituted into aux_file_formats. One entry per aux_name, with semicolon-delimited vars.
119 |         aux_cache_read_order:
120 |           type: string[]?
121 |           doc: Order of non x,y dimensions within each image. One entry per aux_name, with semicolon-delimited vars.
122 |         aux_single_round:
123 |           type: string[]?
124 |           doc: If True, aux view will only be a single round.
125 |         aux_channel_count:
126 |           type: int[]?
127 |           doc: Count of channels in each aux image
128 |         aux_channel_slope:
129 |           type: float[]?
130 |           doc: Used to convert 0-indexed channel IDs to the channel index within the image.  Calculated as (image index) = int(index*slope) + intercept
131 |         aux_channel_intercept:
132 |           type: int[]?
133 |           doc: Used to convert 0-indexed channel IDs to the channel index within the image.  Calculated as (image index) = int(index*slope) + intercept
134 | 
135 |   fov_positioning:
136 |     - 'null'
137 |     - type: record
138 |       name: locs
139 |       fields:
140 |         locs:
141 |           type: File?
142 |           doc: Input locations as a json file, using the same records as below.
143 |     - type: record
144 |       name: fov_positioning
145 |       fields:
146 |         - name: x_locs
147 |           type: string
148 |           doc: list of x-axis start locations per fov index
149 |         - name: x_shape
150 |           type: int
151 |           doc: shape of each fov item in the x-axis
152 |         - name: x_voxel
153 |           type: float
154 |           doc: size of voxels in the x-axis
155 |         - name: y_locs
156 |           type: string
157 |           doc: list of y-axis start locations per fov index
158 |         - name: y_shape
159 |           type: int
160 |           doc: shape of each fov item in the y-axis
161 |         - name: y_voxel
162 |           type: float
163 |           doc: size of voxels in the y-axis
164 |         - name: z_locs
165 |           type: string
166 |           doc: list of z-axis start locations per fov index
167 |         - name: z_shape
168 |           type: int
169 |           doc: shape of each fov item in the z-axis
170 |         - name: z_voxel
171 |           type: float
172 |           doc: size of voxels in the z-axis
173 | 
174 |   add_blanks:
175 |     type: boolean?
176 |     doc: If true, will add blanks with a hamming distance 1 from the existing codes.
177 |     default: False
178 | 
179 | outputs:
180 |   spaceTx_converted:
181 |     type: Directory
182 |     outputSource: execute_conversion/spaceTx_converted
183 | 
184 | steps:
185 | 
186 |   tmpname: # Produces the `tmp` string that execute_conversion passes as --tmp-prefix.
187 |     run: tmpdir.cwl
188 |     in: []
189 |     out: [tmp]
190 | 
191 |   read_schema: # Emits the schema file's text on stdout; stage_conversion receives it as `schema`.
192 |     run:
193 |       class: CommandLineTool
194 |       baseCommand: cat
195 | 
196 |       requirements:
197 |         DockerRequirement:
198 |           dockerPull: hubmap/starfish-custom:latest
199 |         ResourceRequirement:
200 |           ramMin: 1000
201 |           tmpdirMin: 1000
202 |           outdirMin: 1000
203 | 
204 |       inputs:
205 |         schema: # path handed to cat as its only positional argument
206 |           type: string
207 |           inputBinding:
208 |             position: 1
209 | 
210 |       outputs:
211 |         data:
212 |           type: stdout
213 | 
214 |     in:
215 |       schema:
216 |         valueFrom: "/opt/spaceTxConversion.json" # NOTE(review): presumably baked into the Docker image; confirm
217 |     out: [data]
218 | 
219 |   stage_conversion: # Runs inputParser.cwl on parameter_json with the schema text from read_schema.
220 |     run: inputParser.cwl
221 |     in:
222 |       datafile: parameter_json
223 |       schema: read_schema/data
224 |     out: [round_count, zplane_count, channel_count, fov_count, round_offset, fov_offset, zplane_offset, channel_offset, file_format, file_vars, cache_read_order, aux_tilesets_aux_names, aux_tilesets_aux_file_formats, aux_tilesets_aux_file_vars, aux_tilesets_aux_cache_read_order, aux_tilesets_aux_single_round, aux_tilesets_aux_channel_count, aux_tilesets_aux_channel_slope, aux_tilesets_aux_channel_intercept,  fov_positioning_x_locs, fov_positioning_x_shape, fov_positioning_x_voxel, fov_positioning_y_locs, fov_positioning_y_shape, fov_positioning_y_voxel, fov_positioning_z_locs, fov_positioning_z_shape, fov_positioning_z_voxel, add_blanks]
225 |     when: $(inputs.datafile != null) # step is skipped when no parameter_json is supplied
226 | 
227 |   execute_conversion:
228 |     run:
229 |       class: CommandLineTool
230 |       baseCommand: /opt/spaceTxConverter.py
231 | 
232 |       requirements:
233 |         DockerRequirement:
234 |             dockerPull: hubmap/starfish-custom:latest
235 |         ResourceRequirement:
236 |           tmpdirMin: |
237 |             ${
238 |               if(inputs.dir_size === null) {
239 |                 return null;
240 |               } else {
241 |                 return inputs.dir_size;
242 |               }
243 |             }
244 |           outdirMin: |
245 |             ${
246 |               return 1000;
247 |             }
248 | 
249 |       inputs:
250 |         dir_size:
251 |           type: long?
252 | 
253 |         tmp_prefix:
254 |           type: string
255 |           inputBinding:
256 |             prefix: --tmp-prefix
257 | 
258 |         tiffs:
259 |           type: Directory
260 |           inputBinding:
261 |             prefix: --input-dir
262 | 
263 |         codebook:
264 |           type:
265 |             - type: record
266 |               name: csv
267 |               fields:
268 |                 csv:
269 |                   type: File
270 |                   inputBinding:
271 |                     prefix: --codebook-csv
272 |             - type: record
273 |               name: json
274 |               fields:
275 |                 json:
276 |                   type: File
277 |                   inputBinding:
278 |                     prefix: --codebook-json
279 | 
280 |         data_org_file:
281 |           type: File?
282 |           inputBinding:
283 |             prefix: --data-org-file
284 | 
285 |         round_count:
286 |           type: int
287 |           inputBinding:
288 |             prefix: --round-count
289 | 
290 |         zplane_count:
291 |           type: int
292 |           inputBinding:
293 |             prefix: --zplane-count
294 | 
295 |         channel_count:
296 |           type: int
297 |           inputBinding:
298 |             prefix: --channel-count
299 | 
300 |         fov_count:
301 |           type: int
302 |           inputBinding:
303 |             prefix: --fov-count
304 | 
305 |         round_offset:
306 |           type: int?
307 |           inputBinding:
308 |             prefix: --round-offset
309 | 
310 |         fov_offset:
311 |           type: int?
312 |           inputBinding:
313 |             prefix: --fov-offset
314 | 
315 |         channel_offset:
316 |           type: int?
317 |           inputBinding:
318 |             prefix: --channel-offset
319 | 
320 |         zplane_offset:
321 |           type: int?
322 |           inputBinding:
323 |             prefix: --zplane-offset
324 | 
325 |         file_format:
326 |           type: string
327 |           inputBinding:
328 |             prefix: --file-format
329 | 
330 |         file_vars:
331 |           type: string[]
332 |           inputBinding:
333 |             prefix: --file-vars
334 | 
335 |         cache_read_order:
336 |           type: string[]
337 |           inputBinding:
338 |             prefix: --cache-read-order
339 | 
340 |         aux_tilesets:
341 |           - type: record
342 |             name: aux_tilesets
343 |             fields:
344 |               aux_names:
345 |                 type: string[]?
346 |                 inputBinding:
347 |                   prefix: --aux-names
348 |               aux_file_formats:
349 |                 type: string[]?
350 |                 inputBinding:
351 |                   prefix: --aux-file-formats
352 |               aux_file_vars:
353 |                 type: string[]?
354 |                 inputBinding:
355 |                   prefix: --aux-file-vars
356 |               aux_cache_read_order:
357 |                 type: string[]?
358 |                 inputBinding:
359 |                   prefix: --aux-cache-read-order
360 |               aux_single_round:
361 |                 type: string[]?
362 |                 inputBinding:
363 |                   prefix: --aux-single-round
364 |               aux_channel_count:
365 |                 type: int[]?
366 |                 inputBinding:
367 |                   prefix: --aux-channel-count
368 |               aux_channel_slope:
369 |                 type: float[]?
370 |                 inputBinding:
371 |                   prefix: --aux-channel-slope
372 |               aux_channel_intercept:
373 |                 type: int[]?
374 |                 inputBinding:
375 |                   prefix: --aux-channel-intercept
376 | 
377 |         fov_positioning_json:
378 |           - 'null'
379 |           - type: record
380 |             name: locs
381 |             fields:
382 |               locs:
383 |                 type: File?
384 |                 inputBinding:
385 |                   prefix: --loc-json
386 | 
387 |         fov_positioning_inline:
388 |           - 'null'
389 |           - type: record
390 |             name: fov_positioning
391 |             fields:
392 |               - name: x_locs
393 |                 type: string
394 |                 inputBinding:
395 |                   prefix: --x-pos-locs
396 |               - name: x_shape
397 |                 type: int
398 |                 inputBinding:
399 |                   prefix: --x-pos-shape
400 |               - name: x_voxel
401 |                 type: float
402 |                 inputBinding:
403 |                   prefix: --x-pos-voxel
404 |               - name: y_locs
405 |                 type: string
406 |                 inputBinding:
407 |                   prefix: --y-pos-locs
408 |               - name: y_shape
409 |                 type: int
410 |                 inputBinding:
411 |                   prefix: --y-pos-shape
412 |               - name: y_voxel
413 |                 type: float
414 |                 inputBinding:
415 |                   prefix: --y-pos-voxel
416 |               - name: z_locs
417 |                 type: string
418 |                 inputBinding:
419 |                   prefix: --z-pos-locs
420 |               - name: z_shape
421 |                 type: int
422 |                 inputBinding:
423 |                   prefix: --z-pos-shape
424 |               - name: z_voxel
425 |                 type: float
426 |                 inputBinding:
427 |                   prefix: --z-pos-voxel
428 | 
429 |         add_blanks:
430 |           type: boolean
431 |           inputBinding:
432 |             prefix: --add-blanks
433 | 
434 |       outputs:
435 |         spaceTx_converted:
436 |           type: Directory
437 |           outputBinding:
438 |             glob: $("tmp/" + inputs.tmp_prefix + "/2_tx_converted/")
439 |     in:
440 |       dir_size: dir_size
441 |       tmp_prefix: tmpname/tmp
442 |       tiffs: tiffs
443 |       codebook:
444 |         source: [codebook, codebook_csv, codebook_json]
445 |         linkMerge: merge_flattened
446 |         valueFrom: |
447 |           ${
448 |             if(self[0]){
449 |               return self[0];
450 |             } else if(self[1]){
451 |               return {csv: self[1]};
452 |             } else {
453 |               return {json: self[2]};
454 |             }
455 |           }
456 |       data_org_file: data_org_file
457 |       round_count:
458 |         source: [stage_conversion/round_count, round_count]
459 |         pickValue: first_non_null
460 |       zplane_count:
461 |         source: [stage_conversion/zplane_count, zplane_count]
462 |         pickValue: first_non_null
463 |       channel_count:
464 |         source: [stage_conversion/channel_count, channel_count]
465 |         pickValue: first_non_null
466 |       fov_count:
467 |         source: [stage_conversion/fov_count, fov_count]
468 |         pickValue: first_non_null
469 |       round_offset:
470 |         source: [stage_conversion/round_offset, round_offset]
471 |         pickValue: first_non_null
472 |       fov_offset:
473 |         source: [stage_conversion/fov_offset, fov_offset]
474 |         pickValue: first_non_null
475 |       channel_offset:
476 |         source: [stage_conversion/channel_offset, channel_offset]
477 |         pickValue: first_non_null
478 |       zplane_offset:
479 |         source: [stage_conversion/zplane_offset, zplane_offset]
480 |         pickValue: first_non_null
481 |       file_format:
482 |         source: [stage_conversion/file_format, file_format]
483 |         pickValue: first_non_null
484 |       file_vars:
485 |         source: [stage_conversion/file_vars, file_vars]
486 |         pickValue: first_non_null
487 |       cache_read_order:
488 |         source: [stage_conversion/cache_read_order, cache_read_order]
489 |         pickValue: first_non_null
490 |       aux_tilesets:
491 |         source: [aux_tilesets, stage_conversion/aux_tilesets_aux_names, stage_conversion/aux_tilesets_aux_file_formats, stage_conversion/aux_tilesets_aux_file_vars, stage_conversion/aux_tilesets_aux_cache_read_order, stage_conversion/aux_tilesets_aux_single_round, stage_conversion/aux_tilesets_aux_channel_count, stage_conversion/aux_tilesets_aux_channel_slope, stage_conversion/aux_tilesets_aux_channel_intercept]
492 |         valueFrom: |
493 |           ${
494 |             if(!self[1]){
495 |               return self[0];
496 |             } else {
497 |               return {
498 |                 aux_names: self[1],
499 |                 aux_file_formats: self[2],
500 |                 aux_file_vars: self[3],
501 |                 aux_cache_read_order: self[4],
502 |                 aux_single_round: self[5],
503 |                 aux_channel_count: self[6],
504 |                 aux_channel_slope: self[7],
505 |                 aux_channel_intercept: self[8]
506 |               };
507 |             };
508 |           }
509 |       fov_positioning_json: # File-based FOV positions: fov_positioning.locs first, then locs_json, else null.
510 |         source: [fov_positioning, locs_json]
511 |         valueFrom: |
512 |           ${
513 |             if(self[0] != null && self[0].locs != null) { // loose comparison so a missing locs field counts as absent
514 |               return self[0];
515 |             } else if(self[1] != null) {
516 |               return {"locs": self[1]};
517 |             } else {
518 |               return null;
519 |             }
520 |           }
521 |       fov_positioning_inline: # Inline FOV positions: stage_conversion values first, then the fov_positioning workflow input.
522 |         source: [fov_positioning, stage_conversion/fov_positioning_x_locs, stage_conversion/fov_positioning_x_shape, stage_conversion/fov_positioning_x_voxel, stage_conversion/fov_positioning_y_locs, stage_conversion/fov_positioning_y_shape, stage_conversion/fov_positioning_y_voxel, stage_conversion/fov_positioning_z_locs, stage_conversion/fov_positioning_z_shape, stage_conversion/fov_positioning_z_voxel]
523 |         valueFrom: |
524 |           ${
525 |             if(self[1] === null){ // nothing from stage_conversion, fall back to the workflow input
526 |               if(self[0] != null && self[0].x_locs != null && self[0].x_shape != null && self[0].x_voxel != null && self[0].locs == null){ // loose comparison so missing fields count as absent
527 |                 return self[0];
528 |               } else {
529 |                 return null;
530 |               }
531 |             } else {
532 |               return {
533 |                 x_locs: self[1],
534 |                 x_shape: self[2],
535 |                 x_voxel: self[3],
536 |                 y_locs: self[4],
537 |                 y_shape: self[5],
538 |                 y_voxel: self[6],
539 |                 z_locs: self[7],
540 |                 z_shape: self[8],
541 |                 z_voxel: self[9]
542 |               };
543 |             };
544 |           }
545 |       add_blanks:
546 |         source: [stage_conversion/add_blanks, add_blanks]
547 |         pickValue: first_non_null
548 |     out: [spaceTx_converted]
549 | 
550 | 


--------------------------------------------------------------------------------
/steps/starfishRunner.cwl:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env cwl-runner
  2 | 
  3 | class: Workflow
  4 | cwlVersion: v1.2
  5 | 
  6 | requirements:
  7 |    - class: SubworkflowFeatureRequirement
  8 |    - class: InlineJavascriptRequirement
  9 |    - class: StepInputExpressionRequirement
 10 |    - class: MultipleInputFeatureRequirement
 11 |    - class: ScatterFeatureRequirement
 12 | 
 13 | inputs:
 14 |   exp_loc:
 15 |     type: Directory
 16 |     doc: Location of directory containing starfish experiment.json file
 17 | 
 18 |   dir_size:
 19 |     type: long?
 20 |     doc: Size of exp_loc, in MiB. If provided, will be used to calculate ResourceRequirement.
 21 | 
 22 |   parameter_json:
 23 |     type: File?
 24 |     doc: JSON formatted input parameters.
 25 | 
 26 |   selected_fovs:
 27 |     type: int[]?
 28 |     doc: If provided, starfish will only be run on FOVs with these indices.
 29 | 
 30 |   fov_count:
 31 |     type: int?
 32 |     doc: The number of FOVs that are included in this experiment
 33 | 
 34 |   use_ref_img:
 35 |     type: boolean?
 36 |     doc: Whether to generate a reference image and use it alongside spot detection.
 37 |     default: False
 38 | 
 39 |   level_method:
 40 |     type: string?
 41 |     doc: Levelling method for clip and scale application. Defaults to SCALE_BY_IMAGE.
 42 | 
 43 |   anchor_view:
 44 |     type: string?
 45 |     doc: The name of the auxiliary view to be used as a reference view, such as for anchor round in ISS processing. Will not be included if not provided.
 46 | 
 47 |   is_volume:
 48 |     type: boolean?
 49 |     doc: Whether to treat the zplanes as a 3D image.
 50 |     default: False
 51 | 
 52 |   rescale:
 53 |     type: boolean?
 54 |     doc: Whether to iteratively rescale images before running the decoder.
 55 | 
 56 |   not_filtered_results:
 57 |     type: boolean?
 58 |     doc: Will not remove genes that do not match a target and do not meet criteria.
 59 | 
 60 |   n_processes:
 61 |     type: int?
 62 |     doc: If provided, the number of processes that will be spawned for processing. Otherwise, the maximum number of available CPUs will be used.
 63 | 
 64 |   scatter_into_n:
 65 |     type: int?
 66 |     doc: If provided, the step to run decoding will be split into n batches, where each batch is (FOV count/n) FOVs big.
 67 | 
 68 |   decoding_blob:
 69 |     - 'null'
 70 |     - type: record
 71 |       name: dummy
 72 |       fields:
 73 |         dummy:
 74 |           type: string?
 75 |           doc: Added to prevent cli parsing of the decoding_blob record.
 76 |     - type: record
 77 |       name: blob
 78 |       fields:
 79 |         min_sigma:
 80 |           type: float[]?
 81 |           doc: Minimum sigma tuple to be passed to blob detector
 82 |         max_sigma:
 83 |           type: float[]?
 84 |           doc: Maximum sigma tuple to be passed to blob detector
 85 |         num_sigma:
 86 |           type: int?
 87 |           doc: The number of sigma values to be tested, passed to blob detector
 88 |         threshold:
 89 |           type: float?
 90 |           doc: Threshold of blob detection
 91 |         overlap:
 92 |           type: float?
 93 |           doc: Amount of overlap allowed between blobs, passed to blob detector
 94 |         detector_method:
 95 |           type: string?
 96 |           doc: Name of the scikit-image spot detection method to use
 97 |         composite_decode:
 98 |           type: boolean?
 99 |           doc: Whether to composite all FOVs into one image, typically for PoSTcode decoding.
100 |         composite_pmin:
101 |           type: float?
102 |           doc: pmin value for clip and scale of composite image.
103 |         composite_pmax:
104 |           type: float?
105 |           doc: pmax value for clip and scale of composite image.
106 |         decode_method:
107 |           type: string
108 |           doc: Method name for spot decoding. Refer to starfish documentation.
109 |         decoder:
110 |           type:
111 |             - type: record
112 |               name: metric_distance
113 |               fields:
114 |                 trace_building_strategy:
115 |                   type: string
116 |                   doc: Which tracing strategy to use.  See starfish docs.
117 |                 max_distance:
118 |                   type: float
119 |                   doc: Maximum distance between spots.
120 |                 min_intensity:
121 |                   type: float
122 |                   doc: Minimum intensity of spots.
123 |                 pnorm:
124 |                   type: int?
125 |                   doc: Which Minkowski p-norm to use. 1 is the sum-of-absolute-values “Manhattan” distance, 2 is the usual Euclidean distance, and infinity is the maximum-coordinate-difference distance. A finite large p may cause a ValueError if overflow can occur.
126 |                 norm_order:
127 |                   type: int?
128 |                   doc: Refer to starfish documentation for metric_distance
129 |                 anchor_round:
130 |                   type: int?
131 |                   doc: Anchor round for comparison.
132 |                 search_radius:
133 |                   type: float?
134 |                   doc: Distance to search for matching spots.
135 |                 return_original_intensities:
136 |                   type: boolean?
137 |                   doc: Return original intensities instead of normalized ones.
138 |             - type: record
139 |               name: per_round_max
140 |               fields:
141 |                 trace_building_strategy:
142 |                   type: string
143 |                   doc: Which tracing strategy to use.  See starfish docs.
144 |                 anchor_round:
145 |                   type: int?
146 |                   doc: Round to refer to.  Required for nearest_neighbor.
147 |                 search_radius:
148 |                   type: float?
149 |                   doc: Distance to search for matching spots.
150 |             - type: record
151 |               name: check_all
152 |               fields:
153 |                 search_radius:
154 |                   type: float?
155 |                   doc: Distance to search for matching spots.
156 |                 error_rounds:
157 |                   type: int?
158 |                   doc: Maximum hamming distance a barcode can be from its target and still be uniquely identified.
159 |                 mode:
160 |                   type: string?
161 |                   doc: Accuracy mode to run in.  Can be 'high', 'med', or 'low'.
162 |                 physical_coords:
163 |                   type: boolean?
164 |                   doc: Whether to use physical coordinates or pixel coordinates 
165 | 
166 | 
167 |   decoding_pixel:
168 |     - 'null'
169 |     - type: record
170 |       name: dummy
171 |       fields:
172 |         dummy:
173 |           type: string?
174 |           doc: Added to prevent cli parsing of the decoding_pixel record.
175 |     - type: record
176 |       name: pixel
177 |       fields:
178 |         distance_threshold:
179 |           type: float
180 |           doc: Spots whose codewords are more than this metric distance from an expected code are filtered
181 |         magnitude_threshold:
182 |           type: float
183 |           doc: spots with intensity less than this value are filtered.
184 |         min_area:
185 |           type: int?
186 |           doc: Spots with total area less than this value are filtered. Defaults to 2.
187 |         max_area:
188 |           type: int?
189 |           doc: Spots with total area greater than this value are filtered. Defaults to `np.inf`.
190 |         pnorm:
191 |           type: int?
192 |           doc: Which Minkowski p-norm to use. 1 is the sum-of-absolute-values “Manhattan” distance, 2 is the usual Euclidean distance, and infinity is the maximum-coordinate-difference distance. A finite large p may cause a ValueError if overflow can occur.
193 |         norm_order:
194 |           type: int?
195 |           doc: Order of L_p norm to apply to intensities and codes when using metric_decode to pair each intensities to its closest target (default = 2)
196 | 
197 | outputs:
198 |   decoded:
199 |     type: Directory
200 |     outputSource: restage/pool_dir
201 | 
202 | steps:
203 | 
204 |   read_schema: # Emits the schema file's text on stdout; stage_runner receives it as `schema`.
205 |     run:
206 |       class: CommandLineTool
207 |       baseCommand: cat
208 | 
209 |       requirements:
210 |         DockerRequirement:
211 |           dockerPull: hubmap/starfish-custom:latest
212 |         ResourceRequirement:
213 |           ramMin: 1000
214 |           tmpdirMin: 1000
215 |           outdirMin: 1000
216 | 
217 |       inputs:
218 |         schema: # path handed to cat as its only positional argument
219 |           type: string
220 |           inputBinding:
221 |             position: 1
222 | 
223 |       outputs:
224 |         data:
225 |           type: stdout
226 | 
227 |     in:
228 |       schema:
229 |         valueFrom: "/opt/starfishRunner.json" # NOTE(review): presumably baked into the Docker image; confirm
230 |     out: [data]
231 | 
232 |   stage_runner: # Runs inputParser.cwl on parameter_json with the schema text from read_schema.
233 |     run: inputParser.cwl
234 |     in:
235 |       datafile: parameter_json
236 |       schema: read_schema/data
237 |     out: [fov_count, selected_fovs, level_method, use_ref_img, is_volume, anchor_view, rescale, not_filtered_results, n_processes, scatter_into_n, decoding_min_sigma, decoding_max_sigma, decoding_num_sigma, decoding_threshold, decoding_overlap, decoding_decode_method, decoding_decoder_trace_building_strategy, decoding_decoder_max_distance, decoding_decoder_min_intensity, decoding_decoder_pnorm, decoding_decoder_norm_order, decoding_decoder_anchor_round, decoding_decoder_search_radius, decoding_decoder_return_original_intensities, decoding_decoder_error_rounds, decoding_decoder_mode, decoding_decoder_physical_coords, decoding_pnorm, decoding_distance_threshold, decoding_magnitude_threshold, decoding_min_area, decoding_max_area, decoding_norm_order, decoding_composite_decode, decoding_composite_pmin, decoding_composite_pmax]
238 |     when: $(inputs.datafile != null) # step is skipped when no parameter_json is supplied
239 | 
240 |   scatter_generator: # Builds the list of FOV-index batches (int[][]) that later steps scatter over.
241 |     run:
242 |       class: ExpressionTool
243 |       expression: |
244 |         ${ var fovs = inputs.selected_fovs;
245 |            if(fovs === null){
246 |              fovs = [];
247 |              for (var i=0; i<inputs.fov_count; i++) {
248 |                fovs.push(Number(i));
249 |              }
250 |            }
251 |            if(inputs.scatter_into_n === null){
252 |              return {"scatter_out": [fovs]};
253 |            } else {
254 |              // Append batches as they are built. A pre-sized array kept empty slots
255 |              // when rounding up the chunk size produced fewer than n batches.
256 |              var scattered = [];
257 |              var chunkSize = Math.ceil(fovs.length / inputs.scatter_into_n);
258 |              for (var k = 0; k<fovs.length; k += chunkSize) {
259 |                var subs = [];
260 |                for (var j=k; j<k + chunkSize && j<fovs.length; j +=1) {
261 |                  subs.push(Number(fovs[j]));
262 |                }
263 |                scattered.push(subs);
264 |              }
265 |              return {"scatter_out": scattered};
266 |            }; }
267 |       inputs:
268 |         scatter_into_n: # requested number of batches; null means a single batch
269 |           type: int?
270 |         selected_fovs: # explicit FOV indices; null means 0 .. fov_count-1
271 |           type: int[]?
272 |         fov_count:
273 |           type: int
274 |       outputs:
275 |         scatter_out:
276 |           type:
277 |             type: array
278 |             items:
279 |               type: array
280 |               items: int
281 |     in:
282 |       scatter_into_n: # the stage_runner output takes precedence over the workflow input
283 |         source: [stage_runner/scatter_into_n, scatter_into_n]
284 |         valueFrom: |
285 |           ${
286 |             if(self[0]){
287 |               return self[0];
288 |             } else if(self[1]) {
289 |               return self[1];
290 |             } else {
291 |               return null;
292 |             }
293 |           }
294 |       selected_fovs: # the stage_runner output takes precedence over the workflow input
295 |         source: [stage_runner/selected_fovs, selected_fovs]
296 |         valueFrom: |
297 |           ${
298 |             if(self[0]){
299 |               return self[0];
300 |             } else if(self[1]) {
301 |               return self[1];
302 |             } else {
303 |               return null;
304 |             }
305 |           }
306 |       fov_count: # the stage_runner output takes precedence over the workflow input
307 |         source: [stage_runner/fov_count, fov_count]
308 |         valueFrom: |
309 |           ${
310 |             if(self[0]){
311 |               return self[0];
312 |             } else if(self[1]) {
313 |               return self[1];
314 |             } else {
315 |               return null;
316 |             }
317 |           }
318 |     out: [scatter_out]
319 | 
320 |   tmpname: # Scattered over the batch list, so one `tmp` value is produced per batch.
321 |     run: tmpdir.cwl
322 |     scatter: sc_count
323 |     in:
324 |       sc_count: scatter_generator/scatter_out
325 |     out: [tmp]
326 | 
327 |   fileDivider: # Selects the experiment files needed by each FOV batch; yields one File[] per batch.
328 |     scatter: scatter
329 |     run:
330 |       class: ExpressionTool
331 |       requirements:
332 |         - class: InlineJavascriptRequirement
333 |         - {class: LoadListingRequirement, loadListing: shallow_listing} # explicit because the expression reads experiment.listing
334 | 
335 |       inputs:
336 |         experiment:
337 |           type: Directory
338 |           doc: Directory containing spaceTx-formatted experiment
339 | 
340 |         scatter:
341 |           type:
342 |             type: array
343 |             items: int
344 |           doc: List describing the FOVs in this specific scatter.
345 | 
346 |       outputs:
347 |         out: File[]
348 | 
349 |       expression: |
350 |         ${
351 |           var listing = inputs.experiment.listing, dir_lis = [];
352 |           for(var i=0;i<listing.length; i++){
353 |             var id = listing[i].basename;
354 |             if(id.includes("json")){ // every entry with json in its name is kept for all batches
355 |               dir_lis.push(listing[i])
356 |             } else {
357 |               for(var j=0;j<inputs.scatter.length; j++) {
358 |                 if(id.includes("fov_"+String(inputs.scatter[j]).padStart(5,'0'))){
359 |                   dir_lis.push(listing[i]); break; // stop at the first match so a repeated index cannot add the file twice
360 |                 }
361 |               }
362 |             }
363 |           }
364 |           return {"out": dir_lis};
365 |         }
366 |     in:
367 |       experiment: exp_loc
368 |       scatter: scatter_generator/scatter_out
369 |     out:
370 |       [out]
371 | 
372 |   execute_runner:
373 |     scatter: [selected_fovs, tmp_prefix, exp_files]
374 |     scatterMethod: dotproduct
375 |     run:
376 |       class: CommandLineTool
377 |       baseCommand: /opt/starfishDriver.py
378 | 
379 |       requirements:
380 |         InitialWorkDirRequirement:
381 |           listing:
382 |             - entryname: "$('input_dir_'+inputs.tmp_prefix)"
383 |               writable: true
384 |               entry: "$({class: 'Directory', listing: inputs.exp_files})"
385 |         DockerRequirement:
386 |           dockerPull: hubmap/starfish-custom:latest
387 |         ResourceRequirement:
388 |           tmpdirMin: |
389 |             ${
390 |               if(inputs.dir_size === null) {
391 |                 return null;
392 |               } else {
393 |                 return inputs.dir_size;
394 |               }
395 |             }
396 |           outdirMin: |
397 |             ${
398 |               return 1000;
399 |             }
400 |           coresMin: |
401 |             ${
402 |               if(inputs.n_processes === null) {
403 |                 return null;
404 |               } else {
405 |                 return inputs.n_processes;
406 |               }
407 |             }
408 |           ramMin: |
409 |             ${
410 |               if(inputs.dir_size === null){
411 |                 return null;
412 |               } else {
413 |                 if(inputs.decoding_blob === null){
414 |                   return parseInt((inputs.dir_size/inputs.fov_count) * 4);
415 |                 } else if(inputs.decoding_blob.min_intensity !== null) {
416 |                   return parseInt((inputs.dir_size/inputs.fov_count) * 10);
417 |                 } else if(inputs.decoding_blob.mode !== null) {
418 |                   return parseInt((inputs.dir_size/inputs.fov_count) * 10);
419 |                 } else {
420 |                   return parseInt((inputs.dir_size/inputs.fov_count) * 10);
421 |                 }
422 |               }
423 |             }
424 | 
425 |       inputs:
426 |         dir_size:
427 |           type: long?
428 | 
429 |         tmp_prefix:
430 |           type: string
431 |           inputBinding:
432 |             prefix: --tmp-prefix
433 | 
434 |         exp_files:
435 |           type: File[]
436 |           doc: Formatted input from fileDivider step.
437 | 
438 |         exp_loc:
439 |           type: string
440 |           inputBinding:
441 |             prefix: --exp-loc
442 | 
443 |         selected_fovs:
444 |           type:
445 |             type: array
446 |             items: int
447 |           inputBinding:
448 |             prefix: --selected-fovs
449 |           doc: If provided, processing will only be run on FOVs with these indices.
450 | 
451 |         fov_count:
452 |           type: int
453 | 
454 |         use_ref_img:
455 |           type: boolean?
456 |           inputBinding:
457 |             prefix: --use-ref-img
458 | 
459 |         anchor_view:
460 |           type: string?
461 |           inputBinding:
462 |             prefix: --anchor-view
463 | 
464 |         is_volume:
465 |           type: boolean?
466 |           inputBinding:
467 |             prefix: --is-volume
468 | 
469 |         rescale:
470 |           type: boolean?
471 |           inputBinding:
472 |             prefix: --rescale
473 | 
474 |         level_method:
475 |           type: string?
476 |           inputBinding:
477 |             prefix: --level-method
478 | 
479 |         not_filtered_results:
480 |           type: boolean?
481 |           inputBinding:
482 |             prefix: --not-filtered-results
483 | 
484 |         n_processes:
485 |           type: int?
486 |           inputBinding:
487 |             prefix: --n-processes
488 | 
489 |         decoding_blob:
490 |           - 'null'
491 |           - type: record
492 |             name: blob
493 |             fields:
494 |               min_sigma:
495 |                 type: float[]?
496 |                 inputBinding:
497 |                   prefix: --min-sigma
498 |               max_sigma:
499 |                 type: float[]?
500 |                 inputBinding:
501 |                   prefix: --max-sigma
502 |               num_sigma:
503 |                 type: int?
504 |                 inputBinding:
505 |                   prefix: --num-sigma
506 |               threshold:
507 |                 type: float?
508 |                 inputBinding:
509 |                   prefix: --threshold
510 |               overlap:
511 |                 type: float?
512 |                 inputBinding:
513 |                   prefix: --overlap
514 |               detector_method:
515 |                 type: string?
516 |                 inputBinding:
517 |                   prefix: --detector-method
518 |               composite_decode:
519 |                 type: boolean?
520 |                 inputBinding:
521 |                   prefix: --composite-decode
522 |               composite_pmin:
523 |                 type: float?
524 |                 inputBinding:
525 |                   prefix: --composite-pmin
526 |               composite_pmax:
527 |                 type: float?
528 |                 inputBinding:
529 |                   prefix: --composite-pmax
530 |               decode_method:
531 |                 type: string
532 |                 inputBinding:
533 |                   prefix: --decode-spots-method
534 |               decoder:
535 |                 type:
536 |                   - type: record
537 |                     name: metric_distance
538 |                     fields:
539 |                       trace_building_strategy:
540 |                         type: string
541 |                         inputBinding:
542 |                           prefix: --trace-building-strategy
543 |                       max_distance:
544 |                         type: float
545 |                         inputBinding:
546 |                           prefix: --max-distance
547 |                       min_intensity:
548 |                         type: float
549 |                         inputBinding:
550 |                           prefix: --min-intensity
551 |                       pnorm:
552 |                         type: int?
553 |                         inputBinding:
554 |                           prefix: --pnorm  # same flag name as the pnorm field of decoding_pixel
555 |                       norm_order:
556 |                         type: int?
557 |                         inputBinding:
558 |                           prefix: --norm-order
559 |                       anchor_round:
560 |                         type: int?
561 |                         inputBinding:
562 |                           prefix: --anchor-round
563 |                       search_radius:
564 |                         type: float?
565 |                         inputBinding:
566 |                           prefix: --search-radius
567 |                       return_original_intensities:
568 |                         type: boolean?
569 |                         inputBinding:
570 |                           prefix: --return-original-intensities
571 |                   - type: record
572 |                     name: per_round_max
573 |                     fields:
574 |                       trace_building_strategy:
575 |                         type: string
576 |                         inputBinding:
577 |                           prefix: --trace-building-strategy
578 |                       anchor_round:
579 |                         type: int?
580 |                         inputBinding:
581 |                           prefix: --anchor-round
582 |                       search_radius:
583 |                         type: float?
584 |                         inputBinding:
585 |                           prefix: --search-radius
586 |                   - type: record
587 |                     name: check_all
588 |                     fields:
589 |                       search_radius:
590 |                         type: float?
591 |                         inputBinding:
592 |                           prefix: --search-radius
593 |                       error_rounds:
594 |                         type: int?
595 |                         inputBinding:
596 |                           prefix: --error-rounds
597 |                       mode:
598 |                         type: string?
599 |                         inputBinding:
600 |                           prefix: --mode
601 |                       physical_coords:
602 |                         type: boolean?
603 |                         inputBinding:
604 |                           prefix: --physical-coords
605 | 
606 |         decoding_pixel:
607 |            - 'null'
608 |            - type: record
609 |              name: pixel
610 |              fields:
611 |                pnorm:
612 |                  type: int?
613 |                  inputBinding:
614 |                    prefix: --pnorm
615 |                distance_threshold:
616 |                  type: float
617 |                  inputBinding:
618 |                    prefix: --distance-threshold
619 |                magnitude_threshold:
620 |                  type: float
621 |                  inputBinding:
622 |                    prefix: --magnitude-threshold
623 |                min_area:
624 |                  type: int?
625 |                  inputBinding:
626 |                    prefix: --min-area
627 |                max_area:
628 |                  type: int?
629 |                  inputBinding:
630 |                    prefix: --max-area
631 |                norm_order:
632 |                  type: int?
633 |                  inputBinding:
634 |                    prefix: --norm-order
635 | 
636 |       outputs:
637 |         decoded:
638 |           type: Directory
639 |           outputBinding:
640 |             glob: $("tmp/" + inputs.tmp_prefix + "/4_Decoded_" + inputs.tmp_prefix + "/")
641 | 
642 |     in:
643 |       tmp_prefix: tmpname/tmp
644 |       dir_size: dir_size
645 |       exp_files: fileDivider/out
646 |       exp_loc:
647 |         valueFrom: $("input_dir_" + inputs.tmp_prefix)
648 |       selected_fovs: scatter_generator/scatter_out
649 |       fov_count:
650 |         source: [stage_runner/fov_count, fov_count]
651 |         valueFrom: |
652 |           ${
653 |             if(self[0]){
654 |               return self[0];
655 |             } else if(self[1]) {
656 |               return self[1];
657 |             } else {
658 |               return null;
659 |             }
660 |           }
661 |       use_ref_img:
662 |         source: [stage_runner/use_ref_img, use_ref_img]
663 |         pickValue: first_non_null
664 |       anchor_view:
665 |         source: [stage_runner/anchor_view, anchor_view]
666 |         valueFrom: |
667 |           ${
668 |             if(self[0]){
669 |               return self[0];
670 |             } else if(self[1]) {
671 |               return self[1];
672 |             } else {
673 |               return null;
674 |             }
675 |           }
676 |       is_volume:
677 |         source: [stage_runner/is_volume, is_volume]
678 |         pickValue: first_non_null
679 |       rescale:
680 |         source: [stage_runner/rescale, rescale]
681 |         valueFrom: |
682 |           ${
683 |             if(self[0]){
684 |               return self[0];
685 |             } else if(self[1]) {
686 |               return self[1];
687 |             } else {
688 |               return null;
689 |             }
690 |           }
691 |       level_method:
692 |         source: [stage_runner/level_method, level_method]
693 |         valueFrom: |
694 |           ${
695 |             if(self[0]){
696 |               return self[0];
697 |             } else if(self[1]) {
698 |               return self[1];
699 |             } else {
700 |               return null;
701 |             }
702 |           }
703 |       not_filtered_results:
704 |         source: [stage_runner/not_filtered_results, not_filtered_results]
705 |         valueFrom: |
706 |           ${
707 |             if(self[0]){
708 |               return self[0];
709 |             } else if(self[1]) {
710 |               return self[1];
711 |             } else {
712 |               return null;
713 |             }
714 |           }
715 |       n_processes:
716 |         source: [stage_runner/n_processes, n_processes]
717 |         valueFrom: |
718 |           ${
719 |             if(self[0]){
720 |               return self[0];
721 |             } else if(self[1]) {
722 |               return self[1];
723 |             } else {
724 |               return null;
725 |             }
726 |           }
727 |       decoding_blob:
728 |         source: [decoding_blob, stage_runner/decoding_min_sigma, stage_runner/decoding_max_sigma, stage_runner/decoding_num_sigma, stage_runner/decoding_threshold, stage_runner/decoding_overlap, stage_runner/decoding_decode_method, stage_runner/decoding_decoder_trace_building_strategy, stage_runner/decoding_decoder_max_distance, stage_runner/decoding_decoder_min_intensity, stage_runner/decoding_decoder_pnorm, stage_runner/decoding_decoder_norm_order, stage_runner/decoding_decoder_anchor_round, stage_runner/decoding_decoder_search_radius, stage_runner/decoding_decoder_return_original_intensities, stage_runner/decoding_decoder_error_rounds, stage_runner/decoding_decoder_mode, stage_runner/decoding_decoder_physical_coords, stage_runner/decoding_composite_decode, stage_runner/decoding_composite_pmin, stage_runner/decoding_composite_pmax]
729 |         valueFrom: |
730 |           ${
731 |             if(!self[6]){ /* no staged decode_method: pass the workflow-level record through */
732 |               return self[0];
733 |             } else {
734 |               var decode = { /* fields shared by every blob decoder variant */
735 |                 min_sigma: self[1],
736 |                 max_sigma: self[2],
737 |                 num_sigma: self[3],
738 |                 threshold: self[4],
739 |                 overlap: self[5],
740 |                 decode_method: self[6],
741 |                 composite_decode: self[18],
742 |                 composite_pmin: self[19],
743 |                 composite_pmax: self[20]
744 |               };
745 |               if(self[9] != null){
746 |                 /* metric distance decoder: chosen whenever min_intensity is set, including 0 */
747 |                 decode["decoder"] = {
748 |                   trace_building_strategy: self[7],
749 |                   max_distance: self[8],
750 |                   min_intensity: self[9],
751 |                   pnorm: self[10],
752 |                   norm_order: self[11],
753 |                   anchor_round: self[12],
754 |                   search_radius: self[13],
755 |                   return_original_intensities: self[14]
756 |                 };
757 |               } else if(self[16]){
758 |                 /* check all decoder: chosen when a non-empty mode is set */
759 |                 decode["decoder"] = {
760 |                   search_radius: self[13],
761 |                   error_rounds: self[15],
762 |                   mode: self[16],
763 |                   physical_coords: self[17]
764 |                 };
765 |               } else {
766 |                 /* per round max decoder: fallback when neither of the above applies */
767 |                 decode["decoder"] = {
768 |                   trace_building_strategy: self[7],
769 |                   anchor_round: self[12],
770 |                   search_radius: self[13]
771 |                 };
772 |               }
773 |               return decode;
774 |             }
775 |           }
776 |       decoding_pixel:
777 |         source: [decoding_pixel, stage_runner/decoding_pnorm, stage_runner/decoding_distance_threshold, stage_runner/decoding_magnitude_threshold, stage_runner/decoding_min_area, stage_runner/decoding_max_area, stage_runner/decoding_norm_order]
778 |         valueFrom: |
779 |           ${
780 |             if(self[2] == null){ /* no staged distance_threshold: pass the workflow-level record through */
781 |               return self[0];
782 |             } else {
783 |               return { /* staged pixel decoding parameters, in source list order */
784 |                 pnorm: self[1],
785 |                 distance_threshold: self[2],
786 |                 magnitude_threshold: self[3],
787 |                 min_area: self[4],
788 |                 max_area: self[5],
789 |                 norm_order: self[6]
790 |               };
791 |             }
792 |           }
793 |     out: [decoded]
794 |   restage:
795 |     run:
796 |       class: ExpressionTool
797 |       requirements:
798 |         InlineJavascriptRequirement: {}
799 |         LoadListingRequirement:
800 |           loadListing: deep_listing
801 |       expression: |
802 |         ${
803 |           /* Merge the listings of every scattered output directory into a single */
804 |           /* "4_Decoded" directory: entries of "csv" and "cdf" sub-directories keep */
805 |           /* their folder, entries of any other sub-directory are pooled under */
806 |           /* "spots", and loose top-level entries are carried over unchanged. */
807 |           var merged = {"csv": [], "cdf": [], "spots": []};
808 |           var pooled = [];
809 |           inputs.file_array.forEach(function(dir){
810 |             dir.listing.forEach(function(entry){
811 |               if(entry.class != "Directory"){
812 |                 pooled.push(entry);
813 |                 return;
814 |               }
815 |               var named = entry.basename === "csv" || entry.basename === "cdf";
816 |               var bucket = named ? merged[entry.basename] : merged.spots;
817 |               entry.listing.forEach(function(child){
818 |                 bucket.push(child);
819 |               });
820 |             });
821 |           });
822 |           /* "csv" and "cdf" are always emitted, even when empty. */
823 |           ["csv", "cdf"].forEach(function(name){
824 |             pooled.push({"class": "Directory", "basename": name, "listing": merged[name]});
825 |           });
826 |           /* "spots" is only emitted when at least one entry was collected. */
827 |           if(merged.spots.length > 0){
828 |             pooled.push({
829 |               "class": "Directory",
830 |               "basename": "spots",
831 |               "listing": merged.spots
832 |             });
833 |           }
834 |           return {"pool_dir": {
835 |             "class": "Directory",
836 |             "basename": "4_Decoded",
837 |             "listing": pooled
838 |           }};
839 |         }
840 |       inputs:
841 |         dir_size:  # declared, but not read by the expression
842 |           type: long
843 | 
844 |         file_array:
845 |           type:
846 |             type: array
847 |             items: Directory
848 | 
849 |       outputs:
850 |         pool_dir:
851 |           type: Directory
852 | 
853 |     in:
854 |       file_array: execute_runner/decoded
855 |       dir_size: dir_size
856 |     out: [pool_dir]
857 | 


--------------------------------------------------------------------------------
/steps/tmpdir.cwl:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env cwl-runner
 2 | class: ExpressionTool
 3 | cwlVersion: v1.2
 4 | 
 5 | requirements:
 6 |   InlineJavascriptRequirement: {}
 7 |   ResourceRequirement:
 8 |     ramMin: 1000
 9 |     tmpdirMin: 1000
10 |     outdirMin: 1000
11 | 
12 | expression: |
13 |   ${
14 |       /* Build a random 10-character alphanumeric tag and return it as "tmp". */
15 |       /* Only var is used: CWL specifies ECMAScript 5.1, which predates const and let. */
16 |       var characters = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789';
17 |       var charactersLength = characters.length;
18 |       var result = "";
19 |       for (var counter = 0; counter < 10; counter += 1) {
20 |         result += characters.charAt(Math.floor(Math.random() * charactersLength));
21 |       }
22 |       return {"tmp": result};
23 |   }
24 | inputs: []
25 | outputs:
26 |   tmp: string
27 | 


--------------------------------------------------------------------------------
/test.sh:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env bash
 2 | set -o errexit
 3 | set -o pipefail
 4 | 
 5 | start() { echo travis_fold':'start:"$1"; echo "$1"; }  # open a Travis log fold named $1
 6 | end() { set +v; echo travis_fold':'end:"$1"; echo; echo; }  # close the fold named $1
 7 | die() { set +v; echo "$*" 1>&2 ; exit 1; }  # print the message to stderr and exit 1
 8 | 
 9 | start black
10 | black --check .
11 | end black
12 | 
13 | start isort
14 | isort --check-only .
15 | end isort
16 | 


--------------------------------------------------------------------------------