Build branch main with version main (795abd6)

Build pipeline: viash-hub.demultiplex.main-4xxbp Source commit: 795abd6868 Source message: Run Falco in parallel for each well (#33)
2025-03-04 06:00:00 +00:00
parent eb8d600efc
commit e16f7d7290
35 changed files with 988 additions and 2491 deletions
--- a/target/nextflow/dataflow/combine_samples/.config.vsh.yaml
+++ b/target/nextflow/dataflow/combine_samples/.config.vsh.yaml
@@ -30,6 +30,15 @@ argument_groups:
    direction: "input"
    multiple: true
    multiple_sep: ";"
+  - type: "file"
+    name: "--falco_dir"
+    info: null
+    must_exist: true
+    create_parent: true
+    required: true
+    direction: "input"
+    multiple: false
+    multiple_sep: ";"
 - name: "Output arguments"
  arguments:
  - type: "file"
@@ -50,6 +59,15 @@ argument_groups:
    direction: "output"
    multiple: true
    multiple_sep: ";"
+  - type: "file"
+    name: "--output_falco"
+    info: null
+    must_exist: true
+    create_parent: true
+    required: true
+    direction: "output"
+    multiple: true
+    multiple_sep: ";"
 resources:
 - type: "nextflow_script"
  path: "main.nf"
@@ -62,9 +80,6 @@ description: "Combine fastq files from across samples into one event with a list
  \ fastq files per orientation."
 info: null
 status: "enabled"
-scope:
-  image: "public"
-  target: "public"
 requirements:
  commands:
  - "ps"
@@ -146,10 +161,10 @@ build_info:
  engine: "native|native"
  output: "target/nextflow/dataflow/combine_samples"
  executable: "target/nextflow/dataflow/combine_samples/main.nf"
-  viash_version: "0.9.1"
-  git_commit: "dd1f93487f4e908999504e1fcdf97f6c59f743d9"
-  git_remote: "https://x-access-token:ghs_NbivUxJIyO1sd735kE5b6eTS6tHmjH0IsDUF@github.com/viash-hub/demultiplex"
-  git_tag: "v0.1.1-16-gdd1f934"
+  viash_version: "0.9.0"
+  git_commit: "795abd68688f4f31b0587bc8e4a7de49b6c00825"
+  git_remote: "https://github.com/viash-hub/demultiplex"
+  git_tag: "v0.1.1-18-g795abd6"
 package_config:
  name: "demultiplex"
  version: "main"
@@ -158,7 +173,7 @@ package_config:
    test_resources:
    - path: "gs://viash-hub-test-data/demultiplex/v2/"
      dest: "testData"
-  viash_version: "0.9.1"
+  viash_version: "0.9.0"
  source: "src"
  target: "target"
  config_mods:
--- a/target/nextflow/dataflow/combine_samples/main.nf
+++ b/target/nextflow/dataflow/combine_samples/main.nf
@@ -1,6 +1,6 @@
 // combine_samples main
 // 
-// This wrapper script is auto-generated by viash 0.9.1 and is thus a derivative
+// This wrapper script is auto-generated by viash 0.9.0 and is thus a derivative
 // work thereof. This software comes with ABSOLUTELY NO WARRANTY from Data
 // Intuitive.
 // 
@@ -173,7 +173,7 @@ def _checkArgumentType(String stage, Map par, Object value, String errorIdentifi
 Map _processInputValues(Map inputs, Map config, String id, String key) {
  if (!workflow.stubRun) {
    config.allArguments.each { arg ->
-      if (arg.required && arg.direction == "input") {
+      if (arg.required) {
        assert inputs.containsKey(arg.plainName) && inputs.get(arg.plainName) != null : 
          "Error in module '${key}' id '${id}': required input argument '${arg.plainName}' is missing"
      }
@@ -192,8 +192,15 @@ Map _processInputValues(Map inputs, Map config, String id, String key) {
 }

 // helper file: 'src/main/resources/io/viash/runners/nextflow/arguments/_processOutputValues.nf'
-Map _checkValidOutputArgument(Map outputs, Map config, String id, String key) {
+Map _processOutputValues(Map outputs, Map config, String id, String key) {
  if (!workflow.stubRun) {
+    config.allArguments.each { arg ->
+      if (arg.direction == "output" && arg.required) {
+        assert outputs.containsKey(arg.plainName) && outputs.get(arg.plainName) != null : 
+          "Error in module '${key}' id '${id}': required output argument '${arg.plainName}' is missing"
+      }
+    }
+
    outputs = outputs.collectEntries { name, value ->
      def par = config.allArguments.find { it.plainName == name && it.direction == "output" }
      assert par != null : "Error in module '${key}' id '${id}': '${name}' is not a valid output argument"
@@ -206,16 +213,6 @@ Map _checkValidOutputArgument(Map outputs, Map config, String id, String key) {
  return outputs
 }

-void _checkAllRequiredOuputsPresent(Map outputs, Map config, String id, String key) {
-  if (!workflow.stubRun) {
-    config.allArguments.each { arg ->
-      if (arg.direction == "output" && arg.required) {
-        assert outputs.containsKey(arg.plainName) && outputs.get(arg.plainName) != null : 
-          "Error in module '${key}' id '${id}': required output argument '${arg.plainName}' is missing"
-      }
-    }
-  }
-}
 // helper file: 'src/main/resources/io/viash/runners/nextflow/channel/IDChecker.nf'
 class IDChecker {
  final def items = [] as Set
@@ -1669,162 +1666,6 @@ def joinStates(Closure apply_) {
  }
  return joinStatesWf
 }
-// helper file: 'src/main/resources/io/viash/runners/nextflow/states/publishFiles.nf'
-def publishFiles(Map args) {
-  def key_ = args.get("key")
-
-  assert key_ != null : "publishFiles: key must be specified"
-  
-  workflow publishFilesWf {
-    take: input_ch
-    main:
-      input_ch
-        | map { tup ->
-          def id_ = tup[0]
-          def state_ = tup[1]
-
-          // the input files and the target output filenames
-          def inputoutputFilenames_ = collectInputOutputPaths(state_, id_ + "." + key_).transpose()
-          def inputFiles_ = inputoutputFilenames_[0]
-          def outputFilenames_ = inputoutputFilenames_[1]
-
-          [id_, inputFiles_, outputFilenames_]
-        }
-        | publishFilesProc
-    emit: input_ch
-  }
-  return publishFilesWf
-}
-
-process publishFilesProc {
-  // todo: check publishpath?
-  publishDir path: "${getPublishDir()}/", mode: "copy"
-  tag "$id"
-  input:
-    tuple val(id), path(inputFiles, stageAs: "_inputfile?/*"), val(outputFiles)
-  output:
-    tuple val(id), path{outputFiles}
-  script:
-  def copyCommands = [
-    inputFiles instanceof List ? inputFiles : [inputFiles],
-    outputFiles instanceof List ? outputFiles : [outputFiles]
-  ]
-    .transpose()
-    .collectMany{infile, outfile ->
-      if (infile.toString() != outfile.toString()) {
-        [
-          "[ -d \"\$(dirname '${outfile.toString()}')\" ] || mkdir -p \"\$(dirname '${outfile.toString()}')\"",
-          "cp -r '${infile.toString()}' '${outfile.toString()}'"
-        ]
-      } else {
-        // no need to copy if infile is the same as outfile
-        []
-      }
-    }
-  """
-  echo "Copying output files to destination folder"
-  ${copyCommands.join("\n  ")}
-  """
-}
-
-
-// this assumes that the state contains no other values other than those specified in the config
-def publishFilesByConfig(Map args) {
-  def config = args.get("config")
-  assert config != null : "publishFilesByConfig: config must be specified"
-
-  def key_ = args.get("key", config.name)
-  assert key_ != null : "publishFilesByConfig: key must be specified"
-  
-  workflow publishFilesSimpleWf {
-    take: input_ch
-    main:
-      input_ch
-        | map { tup ->
-          def id_ = tup[0]
-          def state_ = tup[1] // e.g. [output: new File("myoutput.h5ad"), k: 10]
-          def origState_ = tup[2] // e.g. [output: '$id.$key.foo.h5ad']
-
-
-          // the processed state is a list of [key, value, inputPath, outputFilename] tuples, where
-          //   - key is a String
-          //   - value is any object that can be serialized to a Yaml (so a String/Integer/Long/Double/Boolean, a List, a Map, or a Path)
-          //   - inputPath is a List[Path]
-          //   - outputFilename is a List[String]
-          //   - (inputPath, outputFilename) are the files that will be copied from src to dest (relative to the state.yaml)
-          def processedState =
-            config.allArguments
-              .findAll { it.direction == "output" }
-              .collectMany { par ->
-                def plainName_ = par.plainName
-                // if the state does not contain the key, it's an
-                // optional argument for which the component did 
-                // not generate any output OR multiple channels were emitted
-                // and the output was just not added to using the channel
-                // that is now being parsed
-                if (!state_.containsKey(plainName_)) {
-                  return []
-                }
-                def value = state_[plainName_]
-                // if the parameter is not a file, it should be stored
-                // in the state as-is, but is not something that needs 
-                // to be copied from the source path to the dest path
-                if (par.type != "file") {
-                  return [[inputPath: [], outputFilename: []]]
-                }
-                // if the orig state does not contain this filename,
-                // it's an optional argument for which the user specified
-                // that it should not be returned as a state
-                if (!origState_.containsKey(plainName_)) {
-                  return []
-                }
-                def filenameTemplate = origState_[plainName_]
-                // if the pararameter is multiple: true, fetch the template
-                if (par.multiple && filenameTemplate instanceof List) {
-                  filenameTemplate = filenameTemplate[0]
-                }
-                // instantiate the template
-                def filename = filenameTemplate
-                  .replaceAll('\\$id', id_)
-                  .replaceAll('\\$\\{id\\}', id_)
-                  .replaceAll('\\$key', key_)
-                  .replaceAll('\\$\\{key\\}', key_)
-                if (par.multiple) {
-                  // if the parameter is multiple: true, the filename
-                  // should contain a wildcard '*' that is replaced with
-                  // the index of the file
-                  assert filename.contains("*") : "Module '${key_}' id '${id_}': Multiple output files specified, but no wildcard '*' in the filename: ${filename}"
-                  def outputPerFile = value.withIndex().collect{ val, ix ->
-                    def filename_ix = filename.replace("*", ix.toString())
-                    def inputPath = val instanceof File ? val.toPath() : val
-                    [inputPath: inputPath, outputFilename: filename_ix]
-                  }
-                  def transposedOutputs = ["inputPath", "outputFilename"].collectEntries{ key -> 
-                    [key, outputPerFile.collect{dic -> dic[key]}]
-                  }
-                  return [[key: plainName_] + transposedOutputs]
-                } else {
-                  def value_ = java.nio.file.Paths.get(filename)
-                  def inputPath = value instanceof File ? value.toPath() : value
-                  return [[inputPath: [inputPath], outputFilename: [filename]]]
-                }
-              }
-          
-          def inputPaths = processedState.collectMany{it.inputPath}
-          def outputFilenames = processedState.collectMany{it.outputFilename}
-          
-
-          [id_, inputPaths, outputFilenames]
-        }
-        | publishFilesProc
-    emit: input_ch
-  }
-  return publishFilesSimpleWf
-}
-
-
-
-
 // helper file: 'src/main/resources/io/viash/runners/nextflow/states/publishStates.nf'
 def collectFiles(obj) {
  if (obj instanceof java.io.File || obj instanceof Path)  {
@@ -1882,6 +1723,8 @@ def publishStates(Map args) {

          // the input files and the target output filenames
          def inputoutputFilenames_ = collectInputOutputPaths(state_, id_ + "." + key_).transpose()
+          def inputFiles_ = inputoutputFilenames_[0]
+          def outputFilenames_ = inputoutputFilenames_[1]

          def yamlFilename = yamlTemplate_
            .replaceAll('\\$id', id_)
@@ -1894,7 +1737,7 @@ def publishStates(Map args) {
          // convert state to yaml blob
          def yamlBlob_ = toRelativeTaggedYamlBlob([id: id_] + state_, java.nio.file.Paths.get(yamlFilename))

-          [id_, yamlBlob_, yamlFilename]
+          [id_, yamlBlob_, yamlFilename, inputFiles_, outputFilenames_]
        }
        | publishStatesProc
    emit: input_ch
@@ -1906,17 +1749,33 @@ process publishStatesProc {
  publishDir path: "${getPublishDir()}/", mode: "copy"
  tag "$id"
  input:
-    tuple val(id), val(yamlBlob), val(yamlFile)
+    tuple val(id), val(yamlBlob), val(yamlFile), path(inputFiles, stageAs: "_inputfile?/*"), val(outputFiles)
  output:
-    tuple val(id), path{[yamlFile]}
+    tuple val(id), path{[yamlFile] + outputFiles}
  script:
+  def copyCommands = [
+    inputFiles instanceof List ? inputFiles : [inputFiles],
+    outputFiles instanceof List ? outputFiles : [outputFiles]
+  ]
+    .transpose()
+    .collectMany{infile, outfile ->
+      if (infile.toString() != outfile.toString()) {
+        [
+          "[ -d \"\$(dirname '${outfile.toString()}')\" ] || mkdir -p \"\$(dirname '${outfile.toString()}')\"",
+          "cp -r '${infile.toString()}' '${outfile.toString()}'"
+        ]
+      } else {
+        // no need to copy if infile is the same as outfile
+        []
+      }
+    }
  """
-  mkdir -p "\$(dirname '${yamlFile}')"
-  echo "Storing state as yaml"
-  cat > '${yamlFile}' << HERE
-${yamlBlob}
-HERE
-  """
+mkdir -p "\$(dirname '${yamlFile}')"
+echo "Storing state as yaml"
+echo '${yamlBlob}' > '${yamlFile}'
+echo "Copying output files to destination folder"
+${copyCommands.join("\n  ")}
+"""
 }


@@ -1947,10 +1806,13 @@ def publishStatesByConfig(Map args) {
            .replaceAll('\\$\\{key\\}', key_)
          def yamlDir = java.nio.file.Paths.get(yamlFilename).getParent()

-          // the processed state is a list of [key, value] tuples, where
+          // the processed state is a list of [key, value, inputPath, outputFilename] tuples, where
          //   - key is a String
          //   - value is any object that can be serialized to a Yaml (so a String/Integer/Long/Double/Boolean, a List, a Map, or a Path)
+          //   - inputPath is a List[Path]
+          //   - outputFilename is a List[String]
          //   - (key, value) are the tuples that will be saved to the state.yaml file
+          //   - (inputPath, outputFilename) are the files that will be copied from src to dest (relative to the state.yaml)
          def processedState =
            config.allArguments
              .findAll { it.direction == "output" }
@@ -1967,7 +1829,7 @@ def publishStatesByConfig(Map args) {
                // in the state as-is, but is not something that needs 
                // to be copied from the source path to the dest path
                if (par.type != "file") {
-                  return [[key: plainName_, value: value]]
+                  return [[key: plainName_, value: value, inputPath: [], outputFilename: []]]
                }
                // if the orig state does not contain this filename,
                // it's an optional argument for which the user specified
@@ -1998,9 +1860,13 @@ def publishStatesByConfig(Map args) {
                    if (yamlDir != null) {
                      value_ = yamlDir.relativize(value_)
                    }
-                    return value_
+                    def inputPath = val instanceof File ? val.toPath() : val
+                    [value: value_, inputPath: inputPath, outputFilename: filename_ix]
                  }
-                  return [["key": plainName_, "value": outputPerFile]]
+                  def transposedOutputs = ["value", "inputPath", "outputFilename"].collectEntries{ key -> 
+                    [key, outputPerFile.collect{dic -> dic[key]}]
+                  }
+                  return [[key: plainName_] + transposedOutputs]
                } else {
                  def value_ = java.nio.file.Paths.get(filename)
                  // if id contains a slash
@@ -2008,17 +1874,18 @@ def publishStatesByConfig(Map args) {
                    value_ = yamlDir.relativize(value_)
                  }
                  def inputPath = value instanceof File ? value.toPath() : value
-                  return [["key": plainName_, value: value_]]
+                  return [[key: plainName_, value: value_, inputPath: [inputPath], outputFilename: [filename]]]
                }
              }
-              
          
          def updatedState_ = processedState.collectEntries{[it.key, it.value]}
+          def inputPaths = processedState.collectMany{it.inputPath}
+          def outputFilenames = processedState.collectMany{it.outputFilename}
          
          // convert state to yaml blob
          def yamlBlob_ = toTaggedYamlBlob([id: id_] + updatedState_)

-          [id_, yamlBlob_, yamlFilename]
+          [id_, yamlBlob_, yamlFilename, inputPaths, outputFilenames]
        }
        | publishStatesProc
    emit: input_ch
@@ -2692,8 +2559,7 @@ def _debug(workflowArgs, debugKey) {
 def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
  def workflowArgs = processWorkflowArgs(args, defaultWfArgs, meta)
  def key_ = workflowArgs["key"]
-  def multipleArgs = meta.config.allArguments.findAll{ it.multiple }.collect{it.plainName}
-
+  
  workflow workflowInstance {
    take: input_

@@ -2850,36 +2716,12 @@ def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
      }

    // TODO: move some of the _meta.join_id wrangling to the safeJoin() function.
-    def chInitialOutputMulti = chArgsWithDefaults
+    def chInitialOutput = chArgsWithDefaults
      | _debug(workflowArgs, "processed")
      // run workflow
      | innerWorkflowFactory(workflowArgs)
-    def chInitialOutputList = chInitialOutputMulti instanceof List ? chInitialOutputMulti : [chInitialOutputMulti]
-    assert chInitialOutputList.size() > 0: "should have emitted at least one output channel"
-    // Add a channel ID to the events, which designates the channel the event was emitted from as a running number
-    // This number is used to sort the events later when the events are gathered from across the channels.
-    def chInitialOutputListWithIndexedEvents = chInitialOutputList.withIndex().collect{channel, channelIndex ->
-      def newChannel = channel
-        | map {tuple ->
-          assert tuple instanceof List : 
-          "Error in module '${key_}': element in output channel should be a tuple [id, data, ...otherargs...]\n" +
-          "  Example: [\"id\", [input: file('foo.txt'), arg: 10]].\n" +
-          "  Expected class: List. Found: tuple.getClass() is ${tuple.getClass()}"
-        
-          def newEvent = [channelIndex] + tuple
-          return newEvent
-        }
-      return newChannel
-    }
-    // Put the events into 1 channel, cover case where there is only one channel is emitted
-    def chInitialOutput = chInitialOutputList.size() > 1 ? \
-      chInitialOutputListWithIndexedEvents[0].mix(*chInitialOutputListWithIndexedEvents.tail()) : \
-      chInitialOutputListWithIndexedEvents[0]
-    def chInitialOutputProcessed = chInitialOutput
-      | map { tuple  ->
-        def channelId = tuple[0]
-        def id_ = tuple[1]
-        def output_ = tuple[2]
+      // check output tuple
+      | map { id_, output_ ->

        // see if output map contains metadata
        def meta_ =
@@ -2892,95 +2734,19 @@ def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
        output_ = output_.findAll{k, v -> k != "_meta"}

        // check value types
-        output_ = _checkValidOutputArgument(output_, meta.config, id_, key_)
+        output_ = _processOutputValues(output_, meta.config, id_, key_)

-        [join_id, channelId, id_, output_]
+        // simplify output if need be
+        if (workflowArgs.auto.simplifyOutput && output_.size() == 1) {
+          output_ = output_.values()[0]
+        }
+
+        [join_id, id_, output_]
      }
      // | view{"chInitialOutput: ${it.take(3)}"}

-    // join the output [prev_id, channel_id, new_id, output] with the previous state [prev_id, state, ...]
-    def chPublishWithPreviousState = safeJoin(chInitialOutputProcessed, chRunFiltered, key_)
-      // input tuple format: [join_id, channel_id, id, output, prev_state, ...]
-      // output tuple format: [join_id, channel_id, id, new_state, ...]
-      | map{ tup ->
-        def new_state = workflowArgs.toState(tup.drop(2).take(3))
-        tup.take(3) + [new_state] + tup.drop(5)
-      }
-    if (workflowArgs.auto.publish == "state") {
-      def chPublishFiles = chPublishWithPreviousState
-        // input tuple format: [join_id, channel_id, id, new_state, ...]
-        // output tuple format: [join_id, channel_id, id, new_state]
-        | map{ tup ->
-          tup.take(4)
-        }
-
-      safeJoin(chPublishFiles, chArgsWithDefaults, key_)
-        // input tuple format: [join_id, channel_id, id, new_state, orig_state, ...]
-        // output tuple format: [id, new_state, orig_state]
-        | map { tup ->
-          tup.drop(2).take(3)
-        }
-        | publishFilesByConfig(key: key_, config: meta.config)
-    }
-    // Join the state from the events that were emitted from different channels
-    def chJoined = chInitialOutputProcessed
-      | map {tuple ->
-        def join_id = tuple[0]
-        def channel_id = tuple[1]
-        def id = tuple[2]
-        def other = tuple.drop(3)
-        // Below, groupTuple is used to join the events. To make sure resuming a workflow
-        // keeps working, the output state must be deterministic. This means the state needs to be
-        // sorted with groupTuple's has a 'sort' argument. This argument can be set to 'hash',
-        // but hashing the state when it is large can be problematic in terms of performance.
-        // Therefore, a custom comparator function is provided. We add the channel ID to the 
-        // states so that we can use the channel ID to sort the items. 
-        def stateWithChannelID = [[channel_id] * other.size(), other].transpose()
-        // A comparator that is provided to groupTuple's 'sort' argument is applied
-        // to all elements of the event tuple (that is not the 'id'). The comparator
-        // closure that is used below expects the input to be List. So the join_id and
-        // channel_id must also be wrapped in a list. 
-        [[join_id], [channel_id], id] + stateWithChannelID
-      }
-      | groupTuple(by: 2, sort: {a, b -> a[0] <=> b[0]}, size: chInitialOutputList.size(), remainder: true)
-      | map {join_ids, _, id, statesWithChannelID ->
-        // Remove the channel IDs from the states
-        def states = statesWithChannelID.collect{it[1]}
-        def newJoinId = join_ids.flatten().unique{a, b -> a <=> b}
-        assert newJoinId.size() == 1: "Multiple events were emitted for '$id'."
-        def newJoinIdUnique = newJoinId[0]
-        def newState = states.inject([:]){ old_state, state_to_add ->
-          def stateToAddNoMultiple = state_to_add.findAll{k, v -> !multipleArgs.contains(k)}
-          // First add non multiple arguments
-
-          def overlap = old_state.keySet().intersect(stateToAddNoMultiple.keySet())
-          assert overlap.isEmpty() : "ID $id: multiple entries for " + 
-            " argument(s) $overlap were emitted."
-          def return_state = old_state + stateToAddNoMultiple
-
-          // Add `multiple: true` arguments
-          def stateToAddMultiple = state_to_add.findAll{k, v -> multipleArgs.contains(k)}
-          stateToAddMultiple.each {k, v ->
-            def currentKey = return_state.getOrDefault(k, [])
-            def currentKeyList = currentKey instanceof List ? currentKey : [currentKey]
-            currentKeyList.add(v)
-            return_state[k] = currentKeyList
-          }
-          return return_state
-        }
-
-        _checkAllRequiredOuputsPresent(newState, meta.config, id, key_)
-
-        // simplify output if need be
-        if (workflowArgs.auto.simplifyOutput && newState.size() == 1) {
-          newState = newState.values()[0]
-        }
-
-        return [newJoinIdUnique, id, newState]
-      }
-    
    // join the output [prev_id, new_id, output] with the previous state [prev_id, state, ...]
-    def chNewState = safeJoin(chJoined, chRunFiltered, key_)
+    def chNewState = safeJoin(chInitialOutput, chRunFiltered, key_)
      // input tuple format: [join_id, id, output, prev_state, ...]
      // output tuple format: [join_id, id, new_state, ...]
      | map{ tup ->
@@ -2989,21 +2755,23 @@ def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
      }

    if (workflowArgs.auto.publish == "state") {
-      def chPublishStates = chNewState
+      def chPublish = chNewState
        // input tuple format: [join_id, id, new_state, ...]
        // output tuple format: [join_id, id, new_state]
        | map{ tup ->
          tup.take(3)
        }

-      safeJoin(chPublishStates, chArgsWithDefaults, key_)
+      safeJoin(chPublish, chArgsWithDefaults, key_)
        // input tuple format: [join_id, id, new_state, orig_state, ...]
        // output tuple format: [id, new_state, orig_state]
        | map { tup ->
          tup.drop(1).take(3)
-        }
+      }
        | publishStatesByConfig(key: key_, config: meta.config)
    }
+
+    // remove join_id and meta
    chReturn = chNewState
      | map { tup ->
        // input tuple format: [join_id, id, new_state, ...]
@@ -3071,6 +2839,16 @@ meta = [
          "direction" : "input",
          "multiple" : true,
          "multiple_sep" : ";"
+        },
+        {
+          "type" : "file",
+          "name" : "--falco_dir",
+          "must_exist" : true,
+          "create_parent" : true,
+          "required" : true,
+          "direction" : "input",
+          "multiple" : false,
+          "multiple_sep" : ";"
        }
      ]
    },
@@ -3096,6 +2874,16 @@ meta = [
          "direction" : "output",
          "multiple" : true,
          "multiple_sep" : ";"
+        },
+        {
+          "type" : "file",
+          "name" : "--output_falco",
+          "must_exist" : true,
+          "create_parent" : true,
+          "required" : true,
+          "direction" : "output",
+          "multiple" : true,
+          "multiple_sep" : ";"
        }
      ]
    }
@@ -3115,10 +2903,6 @@ meta = [
  ],
  "description" : "Combine fastq files from across samples into one event with a list of fastq files per orientation.",
  "status" : "enabled",
-  "scope" : {
-    "image" : "public",
-    "target" : "public"
-  },
  "requirements" : {
    "commands" : [
      "ps"
@@ -3215,10 +2999,10 @@ meta = [
    "runner" : "nextflow",
    "engine" : "native|native",
    "output" : "target/nextflow/dataflow/combine_samples",
-    "viash_version" : "0.9.1",
-    "git_commit" : "dd1f93487f4e908999504e1fcdf97f6c59f743d9",
-    "git_remote" : "https://x-access-token:ghs_NbivUxJIyO1sd735kE5b6eTS6tHmjH0IsDUF@github.com/viash-hub/demultiplex",
-    "git_tag" : "v0.1.1-16-gdd1f934"
+    "viash_version" : "0.9.0",
+    "git_commit" : "795abd68688f4f31b0587bc8e4a7de49b6c00825",
+    "git_remote" : "https://github.com/viash-hub/demultiplex",
+    "git_tag" : "v0.1.1-18-g795abd6"
  },
  "package_config" : {
    "name" : "demultiplex",
@@ -3232,7 +3016,7 @@ meta = [
        }
      ]
    },
-    "viash_version" : "0.9.1",
+    "viash_version" : "0.9.0",
    "source" : "src",
    "target" : "target",
    "config_mods" : [
@@ -3277,10 +3061,12 @@ workflow run_wf {
        // Gather the following state for all samples
        def forward_fastqs = states.collect{it.forward_input}.flatten()
        def reverse_fastqs = states.collect{it.reverse_input}.findAll{it != null}.flatten()
+        def falco_dirs = states.collect{it.falco_dir}
        
        def resultState = [
          "output_forward": forward_fastqs,
          "output_reverse": reverse_fastqs,
+          "output_falco": falco_dirs,
          // The join ID is the same across all samples from the same run
          "_meta": ["join_id": states[0]._meta.join_id]
        ]
--- a/target/nextflow/dataflow/combine_samples/nextflow_schema.json
+++ b/target/nextflow/dataflow/combine_samples/nextflow_schema.json
@@ -43,6 +43,16 @@
            }
    

+        ,
+                "falco_dir": {
+                "type":
+                "string",
+                "description": "Type: `file`, required. ",
+                "help_text": "Type: `file`, required. "
+            
+            }
+    
+
 }
 },
    
@@ -75,6 +85,17 @@
            }
    

+        ,
+                "output_falco": {
+                "type":
+                "string",
+                "description": "Type: List of `file`, required, default: `$id.$key.output_falco_*.output_falco_*`, multiple_sep: `\";\"`. ",
+                "help_text": "Type: List of `file`, required, default: `$id.$key.output_falco_*.output_falco_*`, multiple_sep: `\";\"`. "
+            ,
+                "default":"$id.$key.output_falco_*.output_falco_*"
+            }
+    
+
 }
 },
    
--- a/target/nextflow/dataflow/gather_fastqs_and_validate/.config.vsh.yaml
+++ b/target/nextflow/dataflow/gather_fastqs_and_validate/.config.vsh.yaml
@@ -56,9 +56,6 @@ description: "From a directory containing fastq files, gather the files per samp
  \ \nand validate according to the contents of the sample sheet.\n"
 info: null
 status: "enabled"
-scope:
-  image: "public"
-  target: "public"
 requirements:
  commands:
  - "ps"
@@ -140,10 +137,10 @@ build_info:
  engine: "native|native"
  output: "target/nextflow/dataflow/gather_fastqs_and_validate"
  executable: "target/nextflow/dataflow/gather_fastqs_and_validate/main.nf"
-  viash_version: "0.9.1"
-  git_commit: "dd1f93487f4e908999504e1fcdf97f6c59f743d9"
-  git_remote: "https://x-access-token:ghs_NbivUxJIyO1sd735kE5b6eTS6tHmjH0IsDUF@github.com/viash-hub/demultiplex"
-  git_tag: "v0.1.1-16-gdd1f934"
+  viash_version: "0.9.0"
+  git_commit: "795abd68688f4f31b0587bc8e4a7de49b6c00825"
+  git_remote: "https://github.com/viash-hub/demultiplex"
+  git_tag: "v0.1.1-18-g795abd6"
 package_config:
  name: "demultiplex"
  version: "main"
@@ -152,7 +149,7 @@ package_config:
    test_resources:
    - path: "gs://viash-hub-test-data/demultiplex/v2/"
      dest: "testData"
-  viash_version: "0.9.1"
+  viash_version: "0.9.0"
  source: "src"
  target: "target"
  config_mods:
--- a/target/nextflow/dataflow/gather_fastqs_and_validate/main.nf
+++ b/target/nextflow/dataflow/gather_fastqs_and_validate/main.nf
@@ -1,6 +1,6 @@
 // gather_fastqs_and_validate main
 // 
-// This wrapper script is auto-generated by viash 0.9.1 and is thus a derivative
+// This wrapper script is auto-generated by viash 0.9.0 and is thus a derivative
 // work thereof. This software comes with ABSOLUTELY NO WARRANTY from Data
 // Intuitive.
 // 
@@ -173,7 +173,7 @@ def _checkArgumentType(String stage, Map par, Object value, String errorIdentifi
 Map _processInputValues(Map inputs, Map config, String id, String key) {
  if (!workflow.stubRun) {
    config.allArguments.each { arg ->
-      if (arg.required && arg.direction == "input") {
+      if (arg.required) {
        assert inputs.containsKey(arg.plainName) && inputs.get(arg.plainName) != null : 
          "Error in module '${key}' id '${id}': required input argument '${arg.plainName}' is missing"
      }
@@ -192,8 +192,15 @@ Map _processInputValues(Map inputs, Map config, String id, String key) {
 }

 // helper file: 'src/main/resources/io/viash/runners/nextflow/arguments/_processOutputValues.nf'
-Map _checkValidOutputArgument(Map outputs, Map config, String id, String key) {
+Map _processOutputValues(Map outputs, Map config, String id, String key) {
  if (!workflow.stubRun) {
+    config.allArguments.each { arg ->
+      if (arg.direction == "output" && arg.required) {
+        assert outputs.containsKey(arg.plainName) && outputs.get(arg.plainName) != null : 
+          "Error in module '${key}' id '${id}': required output argument '${arg.plainName}' is missing"
+      }
+    }
+
    outputs = outputs.collectEntries { name, value ->
      def par = config.allArguments.find { it.plainName == name && it.direction == "output" }
      assert par != null : "Error in module '${key}' id '${id}': '${name}' is not a valid output argument"
@@ -206,16 +213,6 @@ Map _checkValidOutputArgument(Map outputs, Map config, String id, String key) {
  return outputs
 }

-void _checkAllRequiredOuputsPresent(Map outputs, Map config, String id, String key) {
-  if (!workflow.stubRun) {
-    config.allArguments.each { arg ->
-      if (arg.direction == "output" && arg.required) {
-        assert outputs.containsKey(arg.plainName) && outputs.get(arg.plainName) != null : 
-          "Error in module '${key}' id '${id}': required output argument '${arg.plainName}' is missing"
-      }
-    }
-  }
-}
 // helper file: 'src/main/resources/io/viash/runners/nextflow/channel/IDChecker.nf'
 class IDChecker {
  final def items = [] as Set
@@ -1669,162 +1666,6 @@ def joinStates(Closure apply_) {
  }
  return joinStatesWf
 }
-// helper file: 'src/main/resources/io/viash/runners/nextflow/states/publishFiles.nf'
-def publishFiles(Map args) {
-  def key_ = args.get("key")
-
-  assert key_ != null : "publishFiles: key must be specified"
-  
-  workflow publishFilesWf {
-    take: input_ch
-    main:
-      input_ch
-        | map { tup ->
-          def id_ = tup[0]
-          def state_ = tup[1]
-
-          // the input files and the target output filenames
-          def inputoutputFilenames_ = collectInputOutputPaths(state_, id_ + "." + key_).transpose()
-          def inputFiles_ = inputoutputFilenames_[0]
-          def outputFilenames_ = inputoutputFilenames_[1]
-
-          [id_, inputFiles_, outputFilenames_]
-        }
-        | publishFilesProc
-    emit: input_ch
-  }
-  return publishFilesWf
-}
-
-process publishFilesProc {
-  // todo: check publishpath?
-  publishDir path: "${getPublishDir()}/", mode: "copy"
-  tag "$id"
-  input:
-    tuple val(id), path(inputFiles, stageAs: "_inputfile?/*"), val(outputFiles)
-  output:
-    tuple val(id), path{outputFiles}
-  script:
-  def copyCommands = [
-    inputFiles instanceof List ? inputFiles : [inputFiles],
-    outputFiles instanceof List ? outputFiles : [outputFiles]
-  ]
-    .transpose()
-    .collectMany{infile, outfile ->
-      if (infile.toString() != outfile.toString()) {
-        [
-          "[ -d \"\$(dirname '${outfile.toString()}')\" ] || mkdir -p \"\$(dirname '${outfile.toString()}')\"",
-          "cp -r '${infile.toString()}' '${outfile.toString()}'"
-        ]
-      } else {
-        // no need to copy if infile is the same as outfile
-        []
-      }
-    }
-  """
-  echo "Copying output files to destination folder"
-  ${copyCommands.join("\n  ")}
-  """
-}
-
-
-// this assumes that the state contains no other values other than those specified in the config
-def publishFilesByConfig(Map args) {
-  def config = args.get("config")
-  assert config != null : "publishFilesByConfig: config must be specified"
-
-  def key_ = args.get("key", config.name)
-  assert key_ != null : "publishFilesByConfig: key must be specified"
-  
-  workflow publishFilesSimpleWf {
-    take: input_ch
-    main:
-      input_ch
-        | map { tup ->
-          def id_ = tup[0]
-          def state_ = tup[1] // e.g. [output: new File("myoutput.h5ad"), k: 10]
-          def origState_ = tup[2] // e.g. [output: '$id.$key.foo.h5ad']
-
-
-          // the processed state is a list of [key, value, inputPath, outputFilename] tuples, where
-          //   - key is a String
-          //   - value is any object that can be serialized to a Yaml (so a String/Integer/Long/Double/Boolean, a List, a Map, or a Path)
-          //   - inputPath is a List[Path]
-          //   - outputFilename is a List[String]
-          //   - (inputPath, outputFilename) are the files that will be copied from src to dest (relative to the state.yaml)
-          def processedState =
-            config.allArguments
-              .findAll { it.direction == "output" }
-              .collectMany { par ->
-                def plainName_ = par.plainName
-                // if the state does not contain the key, it's an
-                // optional argument for which the component did 
-                // not generate any output OR multiple channels were emitted
-                // and the output was just not added to using the channel
-                // that is now being parsed
-                if (!state_.containsKey(plainName_)) {
-                  return []
-                }
-                def value = state_[plainName_]
-                // if the parameter is not a file, it should be stored
-                // in the state as-is, but is not something that needs 
-                // to be copied from the source path to the dest path
-                if (par.type != "file") {
-                  return [[inputPath: [], outputFilename: []]]
-                }
-                // if the orig state does not contain this filename,
-                // it's an optional argument for which the user specified
-                // that it should not be returned as a state
-                if (!origState_.containsKey(plainName_)) {
-                  return []
-                }
-                def filenameTemplate = origState_[plainName_]
-                // if the pararameter is multiple: true, fetch the template
-                if (par.multiple && filenameTemplate instanceof List) {
-                  filenameTemplate = filenameTemplate[0]
-                }
-                // instantiate the template
-                def filename = filenameTemplate
-                  .replaceAll('\\$id', id_)
-                  .replaceAll('\\$\\{id\\}', id_)
-                  .replaceAll('\\$key', key_)
-                  .replaceAll('\\$\\{key\\}', key_)
-                if (par.multiple) {
-                  // if the parameter is multiple: true, the filename
-                  // should contain a wildcard '*' that is replaced with
-                  // the index of the file
-                  assert filename.contains("*") : "Module '${key_}' id '${id_}': Multiple output files specified, but no wildcard '*' in the filename: ${filename}"
-                  def outputPerFile = value.withIndex().collect{ val, ix ->
-                    def filename_ix = filename.replace("*", ix.toString())
-                    def inputPath = val instanceof File ? val.toPath() : val
-                    [inputPath: inputPath, outputFilename: filename_ix]
-                  }
-                  def transposedOutputs = ["inputPath", "outputFilename"].collectEntries{ key -> 
-                    [key, outputPerFile.collect{dic -> dic[key]}]
-                  }
-                  return [[key: plainName_] + transposedOutputs]
-                } else {
-                  def value_ = java.nio.file.Paths.get(filename)
-                  def inputPath = value instanceof File ? value.toPath() : value
-                  return [[inputPath: [inputPath], outputFilename: [filename]]]
-                }
-              }
-          
-          def inputPaths = processedState.collectMany{it.inputPath}
-          def outputFilenames = processedState.collectMany{it.outputFilename}
-          
-
-          [id_, inputPaths, outputFilenames]
-        }
-        | publishFilesProc
-    emit: input_ch
-  }
-  return publishFilesSimpleWf
-}
-
-
-
-
 // helper file: 'src/main/resources/io/viash/runners/nextflow/states/publishStates.nf'
 def collectFiles(obj) {
  if (obj instanceof java.io.File || obj instanceof Path)  {
@@ -1882,6 +1723,8 @@ def publishStates(Map args) {

          // the input files and the target output filenames
          def inputoutputFilenames_ = collectInputOutputPaths(state_, id_ + "." + key_).transpose()
+          def inputFiles_ = inputoutputFilenames_[0]
+          def outputFilenames_ = inputoutputFilenames_[1]

          def yamlFilename = yamlTemplate_
            .replaceAll('\\$id', id_)
@@ -1894,7 +1737,7 @@ def publishStates(Map args) {
          // convert state to yaml blob
          def yamlBlob_ = toRelativeTaggedYamlBlob([id: id_] + state_, java.nio.file.Paths.get(yamlFilename))

-          [id_, yamlBlob_, yamlFilename]
+          [id_, yamlBlob_, yamlFilename, inputFiles_, outputFilenames_]
        }
        | publishStatesProc
    emit: input_ch
@@ -1906,17 +1749,33 @@ process publishStatesProc {
  publishDir path: "${getPublishDir()}/", mode: "copy"
  tag "$id"
  input:
-    tuple val(id), val(yamlBlob), val(yamlFile)
+    tuple val(id), val(yamlBlob), val(yamlFile), path(inputFiles, stageAs: "_inputfile?/*"), val(outputFiles)
  output:
-    tuple val(id), path{[yamlFile]}
+    tuple val(id), path{[yamlFile] + outputFiles}
  script:
+  def copyCommands = [
+    inputFiles instanceof List ? inputFiles : [inputFiles],
+    outputFiles instanceof List ? outputFiles : [outputFiles]
+  ]
+    .transpose()
+    .collectMany{infile, outfile ->
+      if (infile.toString() != outfile.toString()) {
+        [
+          "[ -d \"\$(dirname '${outfile.toString()}')\" ] || mkdir -p \"\$(dirname '${outfile.toString()}')\"",
+          "cp -r '${infile.toString()}' '${outfile.toString()}'"
+        ]
+      } else {
+        // no need to copy if infile is the same as outfile
+        []
+      }
+    }
  """
-  mkdir -p "\$(dirname '${yamlFile}')"
-  echo "Storing state as yaml"
-  cat > '${yamlFile}' << HERE
-${yamlBlob}
-HERE
-  """
+mkdir -p "\$(dirname '${yamlFile}')"
+echo "Storing state as yaml"
+echo '${yamlBlob}' > '${yamlFile}'
+echo "Copying output files to destination folder"
+${copyCommands.join("\n  ")}
+"""
 }


@@ -1947,10 +1806,13 @@ def publishStatesByConfig(Map args) {
            .replaceAll('\\$\\{key\\}', key_)
          def yamlDir = java.nio.file.Paths.get(yamlFilename).getParent()

-          // the processed state is a list of [key, value] tuples, where
+          // the processed state is a list of [key, value, inputPath, outputFilename] tuples, where
          //   - key is a String
          //   - value is any object that can be serialized to a Yaml (so a String/Integer/Long/Double/Boolean, a List, a Map, or a Path)
+          //   - inputPath is a List[Path]
+          //   - outputFilename is a List[String]
          //   - (key, value) are the tuples that will be saved to the state.yaml file
+          //   - (inputPath, outputFilename) are the files that will be copied from src to dest (relative to the state.yaml)
          def processedState =
            config.allArguments
              .findAll { it.direction == "output" }
@@ -1967,7 +1829,7 @@ def publishStatesByConfig(Map args) {
                // in the state as-is, but is not something that needs 
                // to be copied from the source path to the dest path
                if (par.type != "file") {
-                  return [[key: plainName_, value: value]]
+                  return [[key: plainName_, value: value, inputPath: [], outputFilename: []]]
                }
                // if the orig state does not contain this filename,
                // it's an optional argument for which the user specified
@@ -1998,9 +1860,13 @@ def publishStatesByConfig(Map args) {
                    if (yamlDir != null) {
                      value_ = yamlDir.relativize(value_)
                    }
-                    return value_
+                    def inputPath = val instanceof File ? val.toPath() : val
+                    [value: value_, inputPath: inputPath, outputFilename: filename_ix]
                  }
-                  return [["key": plainName_, "value": outputPerFile]]
+                  def transposedOutputs = ["value", "inputPath", "outputFilename"].collectEntries{ key -> 
+                    [key, outputPerFile.collect{dic -> dic[key]}]
+                  }
+                  return [[key: plainName_] + transposedOutputs]
                } else {
                  def value_ = java.nio.file.Paths.get(filename)
                  // if id contains a slash
@@ -2008,17 +1874,18 @@ def publishStatesByConfig(Map args) {
                    value_ = yamlDir.relativize(value_)
                  }
                  def inputPath = value instanceof File ? value.toPath() : value
-                  return [["key": plainName_, value: value_]]
+                  return [[key: plainName_, value: value_, inputPath: [inputPath], outputFilename: [filename]]]
                }
              }
-              
          
          def updatedState_ = processedState.collectEntries{[it.key, it.value]}
+          def inputPaths = processedState.collectMany{it.inputPath}
+          def outputFilenames = processedState.collectMany{it.outputFilename}
          
          // convert state to yaml blob
          def yamlBlob_ = toTaggedYamlBlob([id: id_] + updatedState_)

-          [id_, yamlBlob_, yamlFilename]
+          [id_, yamlBlob_, yamlFilename, inputPaths, outputFilenames]
        }
        | publishStatesProc
    emit: input_ch
@@ -2692,8 +2559,7 @@ def _debug(workflowArgs, debugKey) {
 def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
  def workflowArgs = processWorkflowArgs(args, defaultWfArgs, meta)
  def key_ = workflowArgs["key"]
-  def multipleArgs = meta.config.allArguments.findAll{ it.multiple }.collect{it.plainName}
-
+  
  workflow workflowInstance {
    take: input_

@@ -2850,36 +2716,12 @@ def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
      }

    // TODO: move some of the _meta.join_id wrangling to the safeJoin() function.
-    def chInitialOutputMulti = chArgsWithDefaults
+    def chInitialOutput = chArgsWithDefaults
      | _debug(workflowArgs, "processed")
      // run workflow
      | innerWorkflowFactory(workflowArgs)
-    def chInitialOutputList = chInitialOutputMulti instanceof List ? chInitialOutputMulti : [chInitialOutputMulti]
-    assert chInitialOutputList.size() > 0: "should have emitted at least one output channel"
-    // Add a channel ID to the events, which designates the channel the event was emitted from as a running number
-    // This number is used to sort the events later when the events are gathered from across the channels.
-    def chInitialOutputListWithIndexedEvents = chInitialOutputList.withIndex().collect{channel, channelIndex ->
-      def newChannel = channel
-        | map {tuple ->
-          assert tuple instanceof List : 
-          "Error in module '${key_}': element in output channel should be a tuple [id, data, ...otherargs...]\n" +
-          "  Example: [\"id\", [input: file('foo.txt'), arg: 10]].\n" +
-          "  Expected class: List. Found: tuple.getClass() is ${tuple.getClass()}"
-        
-          def newEvent = [channelIndex] + tuple
-          return newEvent
-        }
-      return newChannel
-    }
-    // Put the events into 1 channel, cover case where there is only one channel is emitted
-    def chInitialOutput = chInitialOutputList.size() > 1 ? \
-      chInitialOutputListWithIndexedEvents[0].mix(*chInitialOutputListWithIndexedEvents.tail()) : \
-      chInitialOutputListWithIndexedEvents[0]
-    def chInitialOutputProcessed = chInitialOutput
-      | map { tuple  ->
-        def channelId = tuple[0]
-        def id_ = tuple[1]
-        def output_ = tuple[2]
+      // check output tuple
+      | map { id_, output_ ->

        // see if output map contains metadata
        def meta_ =
@@ -2892,95 +2734,19 @@ def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
        output_ = output_.findAll{k, v -> k != "_meta"}

        // check value types
-        output_ = _checkValidOutputArgument(output_, meta.config, id_, key_)
+        output_ = _processOutputValues(output_, meta.config, id_, key_)

-        [join_id, channelId, id_, output_]
+        // simplify output if need be
+        if (workflowArgs.auto.simplifyOutput && output_.size() == 1) {
+          output_ = output_.values()[0]
+        }
+
+        [join_id, id_, output_]
      }
      // | view{"chInitialOutput: ${it.take(3)}"}

-    // join the output [prev_id, channel_id, new_id, output] with the previous state [prev_id, state, ...]
-    def chPublishWithPreviousState = safeJoin(chInitialOutputProcessed, chRunFiltered, key_)
-      // input tuple format: [join_id, channel_id, id, output, prev_state, ...]
-      // output tuple format: [join_id, channel_id, id, new_state, ...]
-      | map{ tup ->
-        def new_state = workflowArgs.toState(tup.drop(2).take(3))
-        tup.take(3) + [new_state] + tup.drop(5)
-      }
-    if (workflowArgs.auto.publish == "state") {
-      def chPublishFiles = chPublishWithPreviousState
-        // input tuple format: [join_id, channel_id, id, new_state, ...]
-        // output tuple format: [join_id, channel_id, id, new_state]
-        | map{ tup ->
-          tup.take(4)
-        }
-
-      safeJoin(chPublishFiles, chArgsWithDefaults, key_)
-        // input tuple format: [join_id, channel_id, id, new_state, orig_state, ...]
-        // output tuple format: [id, new_state, orig_state]
-        | map { tup ->
-          tup.drop(2).take(3)
-        }
-        | publishFilesByConfig(key: key_, config: meta.config)
-    }
-    // Join the state from the events that were emitted from different channels
-    def chJoined = chInitialOutputProcessed
-      | map {tuple ->
-        def join_id = tuple[0]
-        def channel_id = tuple[1]
-        def id = tuple[2]
-        def other = tuple.drop(3)
-        // Below, groupTuple is used to join the events. To make sure resuming a workflow
-        // keeps working, the output state must be deterministic. This means the state needs to be
-        // sorted with groupTuple's has a 'sort' argument. This argument can be set to 'hash',
-        // but hashing the state when it is large can be problematic in terms of performance.
-        // Therefore, a custom comparator function is provided. We add the channel ID to the 
-        // states so that we can use the channel ID to sort the items. 
-        def stateWithChannelID = [[channel_id] * other.size(), other].transpose()
-        // A comparator that is provided to groupTuple's 'sort' argument is applied
-        // to all elements of the event tuple (that is not the 'id'). The comparator
-        // closure that is used below expects the input to be List. So the join_id and
-        // channel_id must also be wrapped in a list. 
-        [[join_id], [channel_id], id] + stateWithChannelID
-      }
-      | groupTuple(by: 2, sort: {a, b -> a[0] <=> b[0]}, size: chInitialOutputList.size(), remainder: true)
-      | map {join_ids, _, id, statesWithChannelID ->
-        // Remove the channel IDs from the states
-        def states = statesWithChannelID.collect{it[1]}
-        def newJoinId = join_ids.flatten().unique{a, b -> a <=> b}
-        assert newJoinId.size() == 1: "Multiple events were emitted for '$id'."
-        def newJoinIdUnique = newJoinId[0]
-        def newState = states.inject([:]){ old_state, state_to_add ->
-          def stateToAddNoMultiple = state_to_add.findAll{k, v -> !multipleArgs.contains(k)}
-          // First add non multiple arguments
-
-          def overlap = old_state.keySet().intersect(stateToAddNoMultiple.keySet())
-          assert overlap.isEmpty() : "ID $id: multiple entries for " + 
-            " argument(s) $overlap were emitted."
-          def return_state = old_state + stateToAddNoMultiple
-
-          // Add `multiple: true` arguments
-          def stateToAddMultiple = state_to_add.findAll{k, v -> multipleArgs.contains(k)}
-          stateToAddMultiple.each {k, v ->
-            def currentKey = return_state.getOrDefault(k, [])
-            def currentKeyList = currentKey instanceof List ? currentKey : [currentKey]
-            currentKeyList.add(v)
-            return_state[k] = currentKeyList
-          }
-          return return_state
-        }
-
-        _checkAllRequiredOuputsPresent(newState, meta.config, id, key_)
-
-        // simplify output if need be
-        if (workflowArgs.auto.simplifyOutput && newState.size() == 1) {
-          newState = newState.values()[0]
-        }
-
-        return [newJoinIdUnique, id, newState]
-      }
-    
    // join the output [prev_id, new_id, output] with the previous state [prev_id, state, ...]
-    def chNewState = safeJoin(chJoined, chRunFiltered, key_)
+    def chNewState = safeJoin(chInitialOutput, chRunFiltered, key_)
      // input tuple format: [join_id, id, output, prev_state, ...]
      // output tuple format: [join_id, id, new_state, ...]
      | map{ tup ->
@@ -2989,21 +2755,23 @@ def workflowFactory(Map args, Map defaultWfArgs, Map meta) {
      }

    if (workflowArgs.auto.publish == "state") {
-      def chPublishStates = chNewState
+      def chPublish = chNewState
        // input tuple format: [join_id, id, new_state, ...]
        // output tuple format: [join_id, id, new_state]
        | map{ tup ->
          tup.take(3)
        }

-      safeJoin(chPublishStates, chArgsWithDefaults, key_)
+      safeJoin(chPublish, chArgsWithDefaults, key_)
        // input tuple format: [join_id, id, new_state, orig_state, ...]
        // output tuple format: [id, new_state, orig_state]
        | map { tup ->
          tup.drop(1).take(3)
-        }
+      }
        | publishStatesByConfig(key: key_, config: meta.config)
    }
+
+    // remove join_id and meta
    chReturn = chNewState
      | map { tup ->
        // input tuple format: [join_id, id, new_state, ...]
@@ -3108,10 +2876,6 @@ meta = [
  ],
  "description" : "From a directory containing fastq files, gather the files per sample \nand validate according to the contents of the sample sheet.\n",
  "status" : "enabled",
-  "scope" : {
-    "image" : "public",
-    "target" : "public"
-  },
  "requirements" : {
    "commands" : [
      "ps"
@@ -3208,10 +2972,10 @@ meta = [
    "runner" : "nextflow",
    "engine" : "native|native",
    "output" : "target/nextflow/dataflow/gather_fastqs_and_validate",
-    "viash_version" : "0.9.1",
-    "git_commit" : "dd1f93487f4e908999504e1fcdf97f6c59f743d9",
-    "git_remote" : "https://x-access-token:ghs_NbivUxJIyO1sd735kE5b6eTS6tHmjH0IsDUF@github.com/viash-hub/demultiplex",
-    "git_tag" : "v0.1.1-16-gdd1f934"
+    "viash_version" : "0.9.0",
+    "git_commit" : "795abd68688f4f31b0587bc8e4a7de49b6c00825",
+    "git_remote" : "https://github.com/viash-hub/demultiplex",
+    "git_tag" : "v0.1.1-18-g795abd6"
  },
  "package_config" : {
    "name" : "demultiplex",
@@ -3225,7 +2989,7 @@ meta = [
        }
      ]
    },
-    "viash_version" : "0.9.1",
+    "viash_version" : "0.9.0",
    "source" : "src",
    "target" : "target",
    "config_mods" : [