From 562d4935d7c95d52136c63abea7accc7cc400dc9 Mon Sep 17 00:00:00 2001
From: Dave Bunten <dave.bunten@cuanschutz.edu>
Date: Fri, 19 Jan 2024 15:46:25 -0700
Subject: [PATCH] Add IN Carta preset and related compatibility changes +
 testing (#145)

* add initial in-carta preset

* add test dir fixture for in carta

* add in carta test

* modify source path processing for no targets

* raise errors for special no target sources case

* update pre-commit versions

* set explicit order for column metadata extraction

* further test revision

* add comment about uncertain version

* add casting for mypy

* add docs for in carta usage

* add in-carta version specification

* distinct dest dir for test

* move to errno reference for dir not empty

* Update docs/source/overview.md

Co-authored-by: Gregory Way <gregory.way@gmail.com>

* add in-carta as data source in main readme

* add logging, comments for no target circumstances

* linting

---------

Co-authored-by: Gregory Way <gregory.way@gmail.com>
---
 .pre-commit-config.yaml          |  4 +-
 cytotable/convert.py             | 22 +++++++++--
 cytotable/presets.py             | 28 ++++++++++++++
 cytotable/sources.py             | 65 +++++++++++++++++++++++---------
 cytotable/utils.py               |  9 ++++-
 docs/source/_static/dataflow.mmd |  9 ++++-
 docs/source/_static/dataflow.svg |  2 +-
 docs/source/overview.md          |  9 +++++
 readme.md                        |  2 +-
 tests/conftest.py                |  9 +++++
 tests/test_convert.py            | 40 ++++++++++++++++++++
 11 files changed, 171 insertions(+), 28 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index c25e6787..48c64bae 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -33,7 +33,7 @@ repos:
     hooks:
       - id: yamllint
   - repo: https://github.com/psf/black
-    rev: 23.12.0
+    rev: 23.12.1
     hooks:
       - id: black
   - repo: https://github.com/asottile/blacken-docs
@@ -55,7 +55,7 @@ repos:
     hooks:
       - id: vulture
   - repo: https://github.com/pre-commit/mirrors-mypy
-    rev: v1.7.1
+    rev: v1.8.0
     hooks:
       - id: mypy
   - repo: https://github.com/PyCQA/pylint
diff --git a/cytotable/convert.py b/cytotable/convert.py
index ad083b80..098f040a 100644
--- a/cytotable/convert.py
+++ b/cytotable/convert.py
@@ -75,7 +75,9 @@ def _get_table_columns_and_types(source: Dict[str, Any]) -> List[Dict[str, str]]
             segment_type as column_dtype
         FROM pragma_storage_info('column_details')
         /* avoid duplicate entries in the form of VALIDITY segment_types */
-        WHERE segment_type != 'VALIDITY';
+        WHERE segment_type != 'VALIDITY'
+        /* explicitly order the columns by their id to avoid inconsistent results */
+        ORDER BY column_id ASC;
         """
 
     # attempt to read the data to parquet from duckdb
@@ -319,7 +321,7 @@ def _source_chunk_to_parquet(
     select_columns = ",".join(
         [
             # here we cast the column to the specified type ensure the colname remains the same
-            f"CAST({column['column_name']} AS {column['column_dtype']}) AS {column['column_name']}"
+            f"CAST(\"{column['column_name']}\" AS {column['column_dtype']}) AS \"{column['column_name']}\""
             for column in source["columns"]
         ]
     )
@@ -414,6 +416,7 @@ def _prepend_column_name(
             Path to the modified file.
     """
 
+    import logging
     import pathlib
 
     import pyarrow.parquet as parquet
@@ -421,8 +424,20 @@ def _prepend_column_name(
     from cytotable.constants import CYTOTABLE_ARROW_USE_MEMORY_MAPPING
     from cytotable.utils import _write_parquet_table_with_metadata
 
+    logger = logging.getLogger(__name__)
+
     targets = tuple(metadata) + tuple(compartments)
 
+    # if we have no targets or metadata to work from, return the table unchanged
+    if len(targets) == 0:
+        logger.warning(
+            msg=(
+                "Skipping column name prepend operations"
+                "because no compartments or metadata were provided."
+            )
+        )
+        return table_path
+
     table = parquet.read_table(
         source=table_path, memory_map=CYTOTABLE_ARROW_USE_MEMORY_MAPPING
     )
@@ -569,6 +584,7 @@ def _concat_source_group(
             Updated dictionary containing concatenated sources.
     """
 
+    import errno
     import pathlib
 
     import pyarrow as pa
@@ -649,7 +665,7 @@ def _concat_source_group(
                 pathlib.Path(pathlib.Path(source["table"][0]).parent).rmdir()
             except OSError as os_err:
                 # raise only if we don't have a dir not empty errno
-                if os_err.errno != 66:
+                if os_err.errno != errno.ENOTEMPTY:
                     raise
 
     # return the concatted parquet filename
diff --git a/cytotable/presets.py b/cytotable/presets.py
index 488fe6b1..4d8c7095 100644
--- a/cytotable/presets.py
+++ b/cytotable/presets.py
@@ -204,6 +204,34 @@
                 AND nuclei.Nuclei_ObjectNumber = cytoplasm.Metadata_Cytoplasm_Parent_Nuclei
         """,
     },
+    "in-carta": {
+        # version specifications using related references
+        "CONFIG_SOURCE_VERSION": {
+            "in-carta": "v1.17.0412545",
+        },
+        # names of source table compartments (for ex. cells.csv, etc.)
+        "CONFIG_NAMES_COMPARTMENTS": tuple(),
+        # names of source table metadata (for ex. image.csv, etc.)
+        "CONFIG_NAMES_METADATA": tuple(),
+        # column names in any compartment or metadata tables which contain
+        # unique names to avoid renaming
+        "CONFIG_IDENTIFYING_COLUMNS": (
+            "OBJECT ID",
+            "Row",
+            "Column",
+            "FOV",
+            "WELL LABEL",
+            "Z",
+            "T",
+        ),
+        # chunk size to use for join operations to help with possible performance issues
+        # note: this number is an estimate and may need changes contingent on data
+        # and system used by this library.
+        "CONFIG_CHUNK_SIZE": 1000,
+        # compartment and metadata joins performed using DuckDB SQL
+        # and modified at runtime as needed
+        "CONFIG_JOINS": "",
+    },
 }
 """
 Configuration presets for CytoTable
diff --git a/cytotable/sources.py b/cytotable/sources.py
index 2e81955e..87ec9578 100644
--- a/cytotable/sources.py
+++ b/cytotable/sources.py
@@ -47,6 +47,7 @@ def _build_path(
 def _get_source_filepaths(
     path: Union[pathlib.Path, AnyPath],
     targets: List[str],
+    source_datatype: Optional[str] = None,
 ) -> Dict[str, List[Dict[str, Any]]]:
     """
     Gather dataset of filepaths from a provided directory path.
@@ -56,19 +57,27 @@ def _get_source_filepaths(
             Either a directory path to seek filepaths within or a path directly to a file.
         targets: List[str]:
             Compartment and metadata names to seek within the provided path.
+        source_datatype: Optional[str]:  (Default value = None)
+            The source datatype (extension) to use for reading the tables.
 
     Returns:
         Dict[str, List[Dict[str, Any]]]
             Data structure which groups related files based on the compartments.
     """
 
+    import os
     import pathlib
 
     from cloudpathlib import AnyPath
 
-    from cytotable.exceptions import NoInputDataException
+    from cytotable.exceptions import DatatypeException, NoInputDataException
     from cytotable.utils import _cache_cloudpath_to_local, _duckdb_reader
 
+    if (targets is None or targets == []) and source_datatype is None:
+        raise DatatypeException(
+            f"A source_datatype must be specified when using undefined compartments and metadata names."
+        )
+
     # gathers files from provided path using compartments + metadata as a filter
     sources = [
         # build source_paths for all files
@@ -85,6 +94,7 @@ def _get_source_filepaths(
         # ensure the subpaths meet certain specifications
         if (
             targets is None
+            or targets == []
             # checks for name of the file from targets (compartment + metadata names)
             or str(subpath.stem).lower() in [target.lower() for target in targets]
             # checks for sqlite extension (which may include compartment + metadata names)
@@ -134,21 +144,38 @@ def _get_source_filepaths(
 
     # group files together by similar filename for later data operations
     grouped_sources = {}
-    for unique_source in set(source["source_path"].name for source in sources):
-        grouped_sources[unique_source.capitalize()] = [
-            # case for files besides sqlite
-            source if source["source_path"].suffix.lower() != ".sqlite"
-            # if we have sqlite entries, update the source_path to the parent
-            # (the parent table database file) as grouped key name will now
-            # encapsulate the table name details.
-            else {
-                "source_path": source["source_path"].parent,
-                "table_name": source["table_name"],
-            }
-            for source in sources
-            # focus only on entries which include the unique_source name
-            if source["source_path"].name == unique_source
-        ]
+
+    # if we have no targets, create a single group inferred from a common prefix and suffix
+    # note: this may apply for scenarios where no compartments or metadata are
+    # provided as input to CytoTable operations.
+    if targets is None or targets == []:
+        # gather a common prefix to use for the group
+        common_prefix = os.path.commonprefix(
+            [
+                source["source_path"].stem
+                for source in sources
+                if source["source_path"].suffix == f".{source_datatype}"
+            ]
+        )
+        grouped_sources[f"{common_prefix}.{source_datatype}"] = sources
+
+    # otherwise, use the unique names in the paths to determine source grouping
+    else:
+        for unique_source in set(source["source_path"].name for source in sources):
+            grouped_sources[unique_source.capitalize()] = [
+                # case for files besides sqlite
+                source if source["source_path"].suffix.lower() != ".sqlite"
+                # if we have sqlite entries, update the source_path to the parent
+                # (the parent table database file) as grouped key name will now
+                # encapsulate the table name details.
+                else {
+                    "source_path": source["source_path"].parent,
+                    "table_name": source["table_name"],
+                }
+                for source in sources
+                # focus only on entries which include the unique_source name
+                if source["source_path"].name == unique_source
+            ]
 
     return grouped_sources
 
@@ -190,7 +217,7 @@ def _infer_source_datatype(
         raise DatatypeException(
             (
                 f"Unable to find source datatype {source_datatype} "
-                "within files. Detected datatypes: {suffixes}"
+                f"within files. Detected datatypes: {suffixes}"
             )
         )
 
@@ -270,7 +297,9 @@ def _gather_sources(
     source_path = _build_path(path=source_path, **kwargs)
 
     # gather filepaths which will be used as the basis for this work
-    sources = _get_source_filepaths(path=source_path, targets=targets)
+    sources = _get_source_filepaths(
+        path=source_path, targets=targets, source_datatype=source_datatype
+    )
 
     # infer or validate the source datatype based on source filepaths
     source_datatype = _infer_source_datatype(
diff --git a/cytotable/utils.py b/cytotable/utils.py
index 8f317b0c..9789f42e 100644
--- a/cytotable/utils.py
+++ b/cytotable/utils.py
@@ -202,13 +202,18 @@ def _sqlite_mixed_type_query_to_parquet(
     with sqlite3.connect(source_path) as conn:
         cursor = conn.cursor()
 
-        # gather table column details including datatype
+        # Gather table column details including datatype.
+        # Note: uses SQLite pragma for table information.
+        # See the following for more information:
+        # https://sqlite.org/pragma.html#pragma_table_info
         cursor.execute(
             f"""
             SELECT :table_name as table_name,
                     name as column_name,
                     type as column_type
-            FROM pragma_table_info(:table_name);
+            FROM pragma_table_info(:table_name)
+            /* explicit column ordering by 'cid' */
+            ORDER BY cid ASC;
             """,
             {"table_name": table_name},
         )
diff --git a/docs/source/_static/dataflow.mmd b/docs/source/_static/dataflow.mmd
index bdd06f58..eb0159e9 100644
--- a/docs/source/_static/dataflow.mmd
+++ b/docs/source/_static/dataflow.mmd
@@ -6,20 +6,27 @@ flowchart LR
     DeepProfiler
     npz[(NPZ Files)]
     cytominer-database
-    sqlite[(SQLite File)]
+    sqlite[(SQLite Files)]
     cp_sqlite[(SQLite File)]
+    in_carta[IN Carta]
+    ic_csv[(CSV files)]
     pycytominer
     CytoTable
 
     images --> CellProfiler
     images --> DeepProfiler
+     images --> in_carta
     CellProfiler --> csv
     CellProfiler --> cp_sqlite
     DeepProfiler --> npz
     csv --> cytominer-database
     cytominer-database --> sqlite
+    in_carta --> ic_csv
     csv --> CytoTable
     npz --> CytoTable
     sqlite --> CytoTable
     cp_sqlite --> CytoTable
+    ic_csv --> CytoTable
     CytoTable --> pycytominer
+
+    style CytoTable fill:#FDCA88,stroke:#D96026;
diff --git a/docs/source/_static/dataflow.svg b/docs/source/_static/dataflow.svg
index 387b37ac..ac86ca67 100644
--- a/docs/source/_static/dataflow.svg
+++ b/docs/source/_static/dataflow.svg
@@ -1 +1 @@
-<svg id="mermaid-1665603401412" width="100%" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" height="306.4931640625" style="max-width: 1143.15625px;" viewBox="0 0 1143.15625 306.4931640625"><style>#mermaid-1665603401412{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;fill:#333;}#mermaid-1665603401412 .error-icon{fill:#552222;}#mermaid-1665603401412 .error-text{fill:#552222;stroke:#552222;}#mermaid-1665603401412 .edge-thickness-normal{stroke-width:2px;}#mermaid-1665603401412 .edge-thickness-thick{stroke-width:3.5px;}#mermaid-1665603401412 .edge-pattern-solid{stroke-dasharray:0;}#mermaid-1665603401412 .edge-pattern-dashed{stroke-dasharray:3;}#mermaid-1665603401412 .edge-pattern-dotted{stroke-dasharray:2;}#mermaid-1665603401412 .marker{fill:#333333;stroke:#333333;}#mermaid-1665603401412 .marker.cross{stroke:#333333;}#mermaid-1665603401412 svg{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;}#mermaid-1665603401412 .label{font-family:"trebuchet ms",verdana,arial,sans-serif;color:#333;}#mermaid-1665603401412 .cluster-label text{fill:#333;}#mermaid-1665603401412 .cluster-label span{color:#333;}#mermaid-1665603401412 .label text,#mermaid-1665603401412 span{fill:#333;color:#333;}#mermaid-1665603401412 .node rect,#mermaid-1665603401412 .node circle,#mermaid-1665603401412 .node ellipse,#mermaid-1665603401412 .node polygon,#mermaid-1665603401412 .node path{fill:#ECECFF;stroke:#9370DB;stroke-width:1px;}#mermaid-1665603401412 .node .label{text-align:center;}#mermaid-1665603401412 .node.clickable{cursor:pointer;}#mermaid-1665603401412 .arrowheadPath{fill:#333333;}#mermaid-1665603401412 .edgePath .path{stroke:#333333;stroke-width:1.5px;}#mermaid-1665603401412 .flowchart-link{stroke:#333333;fill:none;}#mermaid-1665603401412 .edgeLabel{background-color:#e8e8e8;text-align:center;}#mermaid-1665603401412 .edgeLabel rect{opacity:0.5;background-color:#e8e8e8;fill:#e8e8e8;}#mermaid-1665603401412 .cluster 
rect{fill:#ffffde;stroke:#aaaa33;stroke-width:1px;}#mermaid-1665603401412 .cluster text{fill:#333;}#mermaid-1665603401412 .cluster span{color:#333;}#mermaid-1665603401412 div.mermaidTooltip{position:absolute;text-align:center;max-width:200px;padding:2px;font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:12px;background:hsl(80,100%,96.2745098039%);border:1px solid #aaaa33;border-radius:2px;pointer-events:none;z-index:100;}#mermaid-1665603401412:root{--mermaid-font-family:"trebuchet ms",verdana,arial,sans-serif;}</style><g transform="translate(0, 0)"><marker id="flowchart-pointEnd" class="marker flowchart" viewBox="0 0 10 10" refX="9" refY="5" markerUnits="userSpaceOnUse" markerWidth="12" markerHeight="12" orient="auto"><path d="M 0 0 L 10 5 L 0 10 z" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></path></marker><marker id="flowchart-pointStart" class="marker flowchart" viewBox="0 0 10 10" refX="0" refY="5" markerUnits="userSpaceOnUse" markerWidth="12" markerHeight="12" orient="auto"><path d="M 0 5 L 10 10 L 10 0 z" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></path></marker><marker id="flowchart-circleEnd" class="marker flowchart" viewBox="0 0 10 10" refX="11" refY="5" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></circle></marker><marker id="flowchart-circleStart" class="marker flowchart" viewBox="0 0 10 10" refX="-1" refY="5" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></circle></marker><marker id="flowchart-crossEnd" class="marker cross flowchart" viewBox="0 0 11 11" refX="12" refY="5.2" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><path d="M 1,1 l 9,9 M 10,1 l -9,9" class="arrowMarkerPath" 
style="stroke-width: 2; stroke-dasharray: 1, 0;"></path></marker><marker id="flowchart-crossStart" class="marker cross flowchart" viewBox="0 0 11 11" refX="-1" refY="5.2" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><path d="M 1,1 l 9,9 M 10,1 l -9,9" class="arrowMarkerPath" style="stroke-width: 2; stroke-dasharray: 1, 0;"></path></marker><g class="root"><g class="clusters"></g><g class="edgePaths"><path d="M72.31044602569085,132.8302299653795L76.48787168807571,127.63498434716682C80.66529735046056,122.43973872895417,89.02014867523029,112.04924749252883,97.36424100428182,106.85400187431617C105.70833333333333,101.65875625610352,114.04166666666667,101.65875625610352,118.20833333333333,101.65875625610352L122.375,101.65875625610352" id="L-images-CellProfiler-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-images LE-CellProfiler" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M54.69185396825468,183.4531432376946L61.80571164021223,198.19517701753685C68.91956931216978,212.93721079737907,83.14728465608489,242.42127835706356,102.47859024470911,257.1633121369058C121.80989583333333,271.90534591674805,146.24479166666666,271.90534591674805,170.6796875,271.90534591674805C195.11458333333334,271.90534591674805,219.54947916666666,271.90534591674805,239.40625,271.90534591674805C259.2630208333333,271.90534591674805,274.5416666666667,271.90534591674805,289.8203125,271.90534591674805C305.0989583333333,271.90534591674805,320.3776041666667,271.90534591674805,336.5755208333333,271.90534591674805C352.7734375,271.90534591674805,369.890625,271.90534591674805,378.44921875,271.90534591674805L387.0078125,271.90534591674805" id="L-images-DeepProfiler-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-images LE-DeepProfiler" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path 
d="M209.42340689425248,84.65875625610352L215.18356824521038,82.13130807876587C220.9437295961683,79.60385990142822,232.46405229808417,74.54896354675293,242.39088031570873,72.02151536941528C252.31770833333334,69.49406719207764,260.6510416666667,69.49406719207764,264.8177083333333,69.49406719207764L268.984375,69.49406719207764" id="L-CellProfiler-csv-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-CellProfiler LE-csv" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M190.05154719712624,118.65875625610352L199.04035183093853,126.54698594411214C208.02915646475083,134.43521563212076,226.00676573237538,150.21167500813803,242.63489328285436,158.09990469614664C259.2630208333333,165.98813438415527,274.5416666666667,165.98813438415527,289.8203125,165.98813438415527C305.0989583333333,165.98813438415527,320.3776041666667,165.98813438415527,345.3294270833333,165.98813438415527C370.28125,165.98813438415527,404.90625,165.98813438415527,439.53125,165.98813438415527C474.15625,165.98813438415527,508.78125,165.98813438415527,530.2604166666666,165.98813438415527C551.7395833333334,165.98813438415527,560.0729166666666,165.98813438415527,564.2395833333334,165.98813438415527L568.40625,165.98813438415527" id="L-CellProfiler-cp_sqlite-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-CellProfiler LE-cp_sqlite" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M492.0546875,271.90534591674805L500.61328125,271.90534591674805C509.171875,271.90534591674805,526.2890625,271.90534591674805,540.5403645833334,271.90534591674805C554.7916666666666,271.90534591674805,566.1770833333334,271.90534591674805,571.8697916666666,271.90534591674805L577.5625,271.90534591674805" id="L-DeepProfiler-npz-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-DeepProfiler LE-npz" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path 
d="M310.65625,54.872757198255066L314.8229166666667,51.94886068655452C318.9895833333333,49.02496417485397,327.3229166666667,43.17717115145286,335.65625,40.25327463975231C343.9895833333333,37.32937812805176,352.3229166666667,37.32937812805176,356.4895833333333,37.32937812805176L360.65625,37.32937812805176" id="L-csv-cytominer-database-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-csv LE-cytominer-database" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M518.40625,37.32937812805176L522.5729166666666,37.32937812805176C526.7395833333334,37.32937812805176,535.0729166666666,37.32937812805176,543.40625,37.32937812805176C551.7395833333334,37.32937812805176,560.0729166666666,37.32937812805176,564.2395833333334,37.32937812805176L568.40625,37.32937812805176" id="L-cytominer-database-sqlite-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-cytominer-database LE-sqlite" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M310.65625,84.1153771859002L314.8229166666667,87.03927369760076C318.9895833333333,89.96317020930131,327.3229166666667,95.81096323270242,348.8020833333333,98.73485974440297C370.28125,101.65875625610352,404.90625,101.65875625610352,439.53125,101.65875625610352C474.15625,101.65875625610352,508.78125,101.65875625610352,535.3645833333334,101.65875625610352C561.9479166666666,101.65875625610352,580.4895833333334,101.65875625610352,599.03125,101.65875625610352C617.5729166666666,101.65875625610352,636.1145833333334,101.65875625610352,654.4274518940202,104.18620443344116C672.7403204547073,106.71365261077881,690.8243909094145,111.7685489654541,699.8664261367682,114.29599714279175L708.9084613641219,116.8234453201294" id="L-csv-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-csv LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path 
d="M620.5,271.90534591674805L626.1927083333334,271.90534591674805C631.8854166666666,271.90534591674805,643.2708333333334,271.90534591674805,665.7807736615263,251.72502915064493C688.2907139897192,231.54471238454184,721.9251779794382,191.1840788523356,738.7424099742979,171.0037620862325L755.5596419691574,150.8234453201294" id="L-npz-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-npz LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M629.65625,37.32937812805176L633.8229166666666,37.32937812805176C637.9895833333334,37.32937812805176,646.3229166666666,37.32937812805176,666.2891853535624,50.57838932673136C686.2554540404581,63.82740052541097,717.854658080916,90.32542292277019,733.654260101145,103.57443412144978L749.453862121374,116.8234453201294" id="L-sqlite-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-sqlite LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M629.65625,165.98813438415527L633.8229166666666,165.98813438415527C637.9895833333334,165.98813438415527,646.3229166666666,165.98813438415527,659.531618560687,163.46068620681763C672.7403204547073,160.93323802947998,690.8243909094145,155.8783416748047,699.8664261367682,153.35089349746704L708.9084613641219,150.8234453201294" id="L-cp_sqlite-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-cp_sqlite LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M859.796875,133.8234453201294L863.9635416666666,133.8234453201294C868.1302083333334,133.8234453201294,876.4635416666666,133.8234453201294,884.796875,133.8234453201294C893.1302083333334,133.8234453201294,901.4635416666666,133.8234453201294,905.6302083333334,133.8234453201294L909.796875,133.8234453201294" id="L-CytoTable-parquet-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-CytoTable LE-parquet" style="fill:none;" 
marker-end="url(#flowchart-pointEnd)"></path><path d="M981.078125,133.8234453201294L985.2447916666666,133.8234453201294C989.4114583333334,133.8234453201294,997.7447916666666,133.8234453201294,1006.078125,133.8234453201294C1014.4114583333334,133.8234453201294,1022.7447916666666,133.8234453201294,1026.9114583333333,133.8234453201294L1031.078125,133.8234453201294" id="L-parquet-pycytominer-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-parquet LE-pycytominer" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path></g><g class="edgeLabels"><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div 
xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g></g><g class="nodes"><g class="node default 
default" id="flowchart-images-37" label-offset-y="8.498349834983498" transform="translate(40.1875, 154.6173620223999)"><path style="" d="M 0,8.498349834983498 a 32.1875,8.498349834983498 0,0,0 64.375 0 a 32.1875,8.498349834983498 0,0,0 -64.375 0 l 0,42.4983498349835 a 32.1875,8.498349834983498 0,0,0 64.375 0 l 0,-42.4983498349835" transform="translate(-32.1875,-29.74752475247525)"></path><g class="label" style="" transform="translate(-24.6875, -9.5)"><foreignObject width="49.375" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">Images</span></div></foreignObject></g></g><g class="node default default" id="flowchart-CellProfiler-38" transform="translate(170.6796875, 101.65875625610352)"><rect class="basic label-container" style="" rx="0" ry="0" x="-48.3046875" y="-17" width="96.609375" height="34"></rect><g class="label" style="" transform="translate(-40.8046875, -9.5)"><foreignObject width="81.609375" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">CellProfiler</span></div></foreignObject></g></g><g class="node default default" id="flowchart-csv-39" label-offset-y="6.2505859191900255" transform="translate(289.8203125, 69.49406719207764)"><path style="" d="M 0,6.2505859191900255 a 20.8359375,6.2505859191900255 0,0,0 41.671875 0 a 20.8359375,6.2505859191900255 0,0,0 -41.671875 0 l 0,40.25058591919003 a 20.8359375,6.2505859191900255 0,0,0 41.671875 0 l 0,-40.25058591919003" transform="translate(-20.8359375,-26.37587887878504)"></path><g class="label" style="" transform="translate(-13.3359375, -9.5)"><foreignObject width="26.671875" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">CSV</span></div></foreignObject></g></g><g class="node default default" id="flowchart-DeepProfiler-40" transform="translate(439.53125, 
271.90534591674805)"><rect class="basic label-container" style="" rx="0" ry="0" x="-52.5234375" y="-17" width="105.046875" height="34"></rect><g class="label" style="" transform="translate(-45.0234375, -9.5)"><foreignObject width="90.046875" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">DeepProfiler</span></div></foreignObject></g></g><g class="node default default" id="flowchart-npz-41" label-offset-y="6.391886862672125" transform="translate(599.03125, 271.90534591674805)"><path style="" d="M 0,6.391886862672125 a 21.46875,6.391886862672125 0,0,0 42.9375 0 a 21.46875,6.391886862672125 0,0,0 -42.9375 0 l 0,40.39188686267212 a 21.46875,6.391886862672125 0,0,0 42.9375 0 l 0,-40.39188686267212" transform="translate(-21.46875,-26.587830294008185)"></path><g class="label" style="" transform="translate(-13.96875, -9.5)"><foreignObject width="27.9375" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">NPZ</span></div></foreignObject></g></g><g class="node default default" id="flowchart-cytominer-database-42" transform="translate(439.53125, 37.32937812805176)"><rect class="basic label-container" style="" rx="0" ry="0" x="-78.875" y="-17" width="157.75" height="34"></rect><g class="label" style="" transform="translate(-71.375, -9.5)"><foreignObject width="142.75" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">cytominer-database</span></div></foreignObject></g></g><g class="node default default" id="flowchart-sqlite-43" label-offset-y="8.221476510067115" transform="translate(599.03125, 37.32937812805176)"><path style="" d="M 0,8.221476510067115 a 30.625,8.221476510067115 0,0,0 61.25 0 a 30.625,8.221476510067115 0,0,0 -61.25 0 l 0,42.22147651006711 a 30.625,8.221476510067115 0,0,0 61.25 0 l 0,-42.22147651006711" 
transform="translate(-30.625,-29.332214765100673)"></path><g class="label" style="" transform="translate(-23.125, -9.5)"><foreignObject width="46.25" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">SQLite</span></div></foreignObject></g></g><g class="node default default" id="flowchart-cp_sqlite-44" label-offset-y="8.221476510067115" transform="translate(599.03125, 165.98813438415527)"><path style="" d="M 0,8.221476510067115 a 30.625,8.221476510067115 0,0,0 61.25 0 a 30.625,8.221476510067115 0,0,0 -61.25 0 l 0,42.22147651006711 a 30.625,8.221476510067115 0,0,0 61.25 0 l 0,-42.22147651006711" transform="translate(-30.625,-29.332214765100673)"></path><g class="label" style="" transform="translate(-23.125, -9.5)"><foreignObject width="46.25" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">SQLite</span></div></foreignObject></g></g><g class="node default default" id="flowchart-pycytominer-45" transform="translate(1083.1171875, 133.8234453201294)"><rect class="basic label-container" style="" rx="0" ry="0" x="-52.0390625" y="-17" width="104.078125" height="34"></rect><g class="label" style="" transform="translate(-44.5390625, -9.5)"><foreignObject width="89.078125" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">pycytominer</span></div></foreignObject></g></g><g class="node default default" id="flowchart-CytoTable-46" transform="translate(769.7265625, 133.8234453201294)"><rect class="basic label-container" style="" rx="0" ry="0" x="-90.0703125" y="-17" width="180.140625" height="34"></rect><g class="label" style="" transform="translate(-82.5703125, -9.5)"><foreignObject width="165.140625" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span 
class="nodeLabel">CytoTable</span></div></foreignObject></g></g><g class="node default default" id="flowchart-parquet-47" label-offset-y="9.07896831714695" transform="translate(945.4375, 133.8234453201294)"><path style="" d="M 0,9.07896831714695 a 35.640625,9.07896831714695 0,0,0 71.28125 0 a 35.640625,9.07896831714695 0,0,0 -71.28125 0 l 0,43.07896831714695 a 35.640625,9.07896831714695 0,0,0 71.28125 0 l 0,-43.07896831714695" transform="translate(-35.640625,-30.618452475720424)"></path><g class="label" style="" transform="translate(-28.140625, -9.5)"><foreignObject width="56.28125" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">Parquet</span></div></foreignObject></g></g></g></g></g></svg>
+<svg id="mermaid-1705600010865" width="100%" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" height="445.0036315917969" style="max-width: 1037.15625px;" viewBox="0 0 1037.15625 445.0036315917969"><style>#mermaid-1705600010865{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;fill:#333;}#mermaid-1705600010865 .error-icon{fill:#552222;}#mermaid-1705600010865 .error-text{fill:#552222;stroke:#552222;}#mermaid-1705600010865 .edge-thickness-normal{stroke-width:2px;}#mermaid-1705600010865 .edge-thickness-thick{stroke-width:3.5px;}#mermaid-1705600010865 .edge-pattern-solid{stroke-dasharray:0;}#mermaid-1705600010865 .edge-pattern-dashed{stroke-dasharray:3;}#mermaid-1705600010865 .edge-pattern-dotted{stroke-dasharray:2;}#mermaid-1705600010865 .marker{fill:#333333;stroke:#333333;}#mermaid-1705600010865 .marker.cross{stroke:#333333;}#mermaid-1705600010865 svg{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;}#mermaid-1705600010865 .label{font-family:"trebuchet ms",verdana,arial,sans-serif;color:#333;}#mermaid-1705600010865 .cluster-label text{fill:#333;}#mermaid-1705600010865 .cluster-label span{color:#333;}#mermaid-1705600010865 .label text,#mermaid-1705600010865 span{fill:#333;color:#333;}#mermaid-1705600010865 .node rect,#mermaid-1705600010865 .node circle,#mermaid-1705600010865 .node ellipse,#mermaid-1705600010865 .node polygon,#mermaid-1705600010865 .node path{fill:#ECECFF;stroke:#9370DB;stroke-width:1px;}#mermaid-1705600010865 .node .label{text-align:center;}#mermaid-1705600010865 .node.clickable{cursor:pointer;}#mermaid-1705600010865 .arrowheadPath{fill:#333333;}#mermaid-1705600010865 .edgePath .path{stroke:#333333;stroke-width:1.5px;}#mermaid-1705600010865 .flowchart-link{stroke:#333333;fill:none;}#mermaid-1705600010865 .edgeLabel{background-color:#e8e8e8;text-align:center;}#mermaid-1705600010865 .edgeLabel rect{opacity:0.5;background-color:#e8e8e8;fill:#e8e8e8;}#mermaid-1705600010865 .cluster 
rect{fill:#ffffde;stroke:#aaaa33;stroke-width:1px;}#mermaid-1705600010865 .cluster text{fill:#333;}#mermaid-1705600010865 .cluster span{color:#333;}#mermaid-1705600010865 div.mermaidTooltip{position:absolute;text-align:center;max-width:200px;padding:2px;font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:12px;background:hsl(80,100%,96.2745098039%);border:1px solid #aaaa33;border-radius:2px;pointer-events:none;z-index:100;}#mermaid-1705600010865:root{--mermaid-font-family:"trebuchet ms",verdana,arial,sans-serif;}</style><g transform="translate(0, 0)"><marker id="flowchart-pointEnd" class="marker flowchart" viewBox="0 0 10 10" refX="9" refY="5" markerUnits="userSpaceOnUse" markerWidth="12" markerHeight="12" orient="auto"><path d="M 0 0 L 10 5 L 0 10 z" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></path></marker><marker id="flowchart-pointStart" class="marker flowchart" viewBox="0 0 10 10" refX="0" refY="5" markerUnits="userSpaceOnUse" markerWidth="12" markerHeight="12" orient="auto"><path d="M 0 5 L 10 10 L 10 0 z" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></path></marker><marker id="flowchart-circleEnd" class="marker flowchart" viewBox="0 0 10 10" refX="11" refY="5" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></circle></marker><marker id="flowchart-circleStart" class="marker flowchart" viewBox="0 0 10 10" refX="-1" refY="5" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><circle cx="5" cy="5" r="5" class="arrowMarkerPath" style="stroke-width: 1; stroke-dasharray: 1, 0;"></circle></marker><marker id="flowchart-crossEnd" class="marker cross flowchart" viewBox="0 0 11 11" refX="12" refY="5.2" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><path d="M 1,1 l 9,9 M 10,1 l -9,9" class="arrowMarkerPath" 
style="stroke-width: 2; stroke-dasharray: 1, 0;"></path></marker><marker id="flowchart-crossStart" class="marker cross flowchart" viewBox="0 0 11 11" refX="-1" refY="5.2" markerUnits="userSpaceOnUse" markerWidth="11" markerHeight="11" orient="auto"><path d="M 1,1 l 9,9 M 10,1 l -9,9" class="arrowMarkerPath" style="stroke-width: 2; stroke-dasharray: 1, 0;"></path></marker><g class="root"><g class="clusters"></g><g class="edgePaths"><path d="M69.87468733204199,259.784870427828L79.88515611003498,234.79181090492423C89.895624888028,209.79875138202044,109.91656244401399,159.81263233621286,124.09369788867366,134.81957281330907C138.27083333333334,109.82651329040527,146.60416666666666,109.82651329040527,150.77083333333334,109.82651329040527L154.9375,109.82651329040527" id="L-images-CellProfiler-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-images LE-CellProfiler" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M104.9375,292.73430252075195L109.10416666666667,292.73430252075195C113.27083333333333,292.73430252075195,121.60416666666667,292.73430252075195,137.98828125,292.73430252075195C154.37239583333334,292.73430252075195,178.80729166666666,292.73430252075195,203.2421875,292.73430252075195C227.67708333333334,292.73430252075195,252.11197916666666,292.73430252075195,275.1106770833333,292.73430252075195C298.109375,292.73430252075195,319.671875,292.73430252075195,341.234375,292.73430252075195C362.796875,292.73430252075195,384.359375,292.73430252075195,403.69921875,292.73430252075195C423.0390625,292.73430252075195,440.15625,292.73430252075195,448.71484375,292.73430252075195L457.2734375,292.73430252075195" id="L-images-DeepProfiler-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-images LE-DeepProfiler" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path 
d="M78.17073789101602,324.95398147168413L86.79853157584667,338.4152619645219C95.42632526067734,351.8765424573597,112.68191263033867,378.79910344303534,133.527154231836,392.2603839358731C154.37239583333334,405.72166442871094,178.80729166666666,405.72166442871094,203.2421875,405.72166442871094C227.67708333333334,405.72166442871094,252.11197916666666,405.72166442871094,275.1106770833333,405.72166442871094C298.109375,405.72166442871094,319.671875,405.72166442871094,341.234375,405.72166442871094C362.796875,405.72166442871094,384.359375,405.72166442871094,406.3333333333333,405.72166442871094C428.3072916666667,405.72166442871094,450.6927083333333,405.72166442871094,461.8854166666667,405.72166442871094L473.078125,405.72166442871094" id="L-images-in_carta-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-images LE-in_carta" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M239.92410389510403,92.82651329040527L246.02789907925333,89.99774837493896C252.1316942634027,87.16898345947266,264.33928463170133,81.51145362854004,274.6097464825173,78.68268871307373C284.8802083333333,75.85392379760742,293.2135416666667,75.85392379760742,297.3802083333333,75.85392379760742L301.546875,75.85392379760742" id="L-CellProfiler-csv-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-CellProfiler LE-csv" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path 
d="M221.49929628758096,126.82651329040527L230.6738927396508,135.36938508351645C239.84848919172063,143.9122568766276,258.19768209586033,160.99800046284994,278.1535285479302,169.5408722559611C298.109375,178.08374404907227,319.671875,178.08374404907227,341.234375,178.08374404907227C362.796875,178.08374404907227,384.359375,178.08374404907227,412.453125,178.08374404907227C440.546875,178.08374404907227,475.171875,178.08374404907227,509.796875,178.08374404907227C544.421875,178.08374404907227,579.046875,178.08374404907227,601.06640625,178.08374404907227C623.0859375,178.08374404907227,632.5,178.08374404907227,637.20703125,178.08374404907227L641.9140625,178.08374404907227" id="L-CellProfiler-cp_sqlite-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-CellProfiler LE-cp_sqlite" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M562.3203125,292.73430252075195L570.87890625,292.73430252075195C579.4375,292.73430252075195,596.5546875,292.73430252075195,610.8059895833334,292.73430252075195C625.0572916666666,292.73430252075195,636.4427083333334,292.73430252075195,642.1354166666666,292.73430252075195L647.828125,292.73430252075195" id="L-DeepProfiler-npz-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-DeepProfiler LE-npz" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M380.921875,54.81938543642201L385.0885416666667,52.61103495230805C389.2552083333333,50.4026844681941,397.5885416666667,45.98598349996619,405.921875,43.77763301585224C414.2552083333333,41.56928253173828,422.5885416666667,41.56928253173828,426.7552083333333,41.56928253173828L430.921875,41.56928253173828" id="L-csv-cytominer-database-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-csv LE-cytominer-database" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path 
d="M588.671875,41.56928253173828L592.8385416666666,41.56928253173828C597.0052083333334,41.56928253173828,605.3385416666666,41.56928253173828,613.671875,41.56928253173828C622.0052083333334,41.56928253173828,630.3385416666666,41.56928253173828,634.5052083333334,41.56928253173828L638.671875,41.56928253173828" id="L-cytominer-database-sqlite-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-cytominer-database LE-sqlite" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M546.515625,405.72166442871094L557.7083333333334,405.72166442871094C568.9010416666666,405.72166442871094,591.2864583333334,405.72166442871094,608.484375,405.72166442871094C625.6822916666666,405.72166442871094,637.6927083333334,405.72166442871094,643.6979166666666,405.72166442871094L649.703125,405.72166442871094" id="L-in_carta-ic_csv-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-in_carta LE-ic_csv" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M380.921875,96.88846215879283L385.0885416666667,99.0968126429068C389.2552083333333,101.30516312702075,397.5885416666667,105.72186409524865,419.0677083333333,107.93021457936261C440.546875,110.13856506347656,475.171875,110.13856506347656,509.796875,110.13856506347656C544.421875,110.13856506347656,579.046875,110.13856506347656,608.7721354166666,110.13856506347656C638.4973958333334,110.13856506347656,663.3229166666666,110.13856506347656,688.1484375,110.13856506347656C712.9739583333334,110.13856506347656,737.7994791666666,110.13856506347656,758.8007494180279,118.62942822774251C779.8020196693891,127.12029139200847,796.9790393387783,144.10201772054037,805.5675491734728,152.5928808848063L814.1560590081674,161.08374404907227" id="L-csv-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-csv LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path 
d="M728.46875,292.73430252075195L734.1614583333334,292.73430252075195C739.8541666666666,292.73430252075195,751.2395833333334,292.73430252075195,766.6882947474273,276.4592094421387C782.1370061615213,260.1841163635254,801.6490123230425,227.63393020629883,811.4050154038032,211.35883712768555L821.1610184845638,195.08374404907227" id="L-npz-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-npz LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M737.625,41.56928253173828L741.7916666666666,41.56928253173828C745.9583333333334,41.56928253173828,754.2916666666666,41.56928253173828,768.4863528533043,61.488359451293945C782.6810390399419,81.40743637084961,802.7370780798838,121.24559020996094,812.7650975998548,141.1646671295166L822.7931171198258,161.08374404907227" id="L-sqlite-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-sqlite LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M734.3828125,178.08374404907227L739.08984375,178.08374404907227C743.796875,178.08374404907227,753.2109375,178.08374404907227,762.0846354166666,178.08374404907227C770.9583333333334,178.08374404907227,779.2916666666666,178.08374404907227,783.4583333333334,178.08374404907227L787.625,178.08374404907227" id="L-cp_sqlite-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-cp_sqlite LE-CytoTable" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path><path d="M726.59375,405.72166442871094L732.5989583333334,405.72166442871094C738.6041666666666,405.72166442871094,750.6145833333334,405.72166442871094,767.2188021300805,370.6153443654378C783.8230209268276,335.50902430216473,805.021041853655,265.29638417561847,815.6200523170688,230.19006411234537L826.2190627804827,195.08374404907227" id="L-ic_csv-CytoTable-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-ic_csv LE-CytoTable" style="fill:none;" 
marker-end="url(#flowchart-pointEnd)"></path><path d="M875.078125,178.08374404907227L879.2447916666666,178.08374404907227C883.4114583333334,178.08374404907227,891.7447916666666,178.08374404907227,900.078125,178.08374404907227C908.4114583333334,178.08374404907227,916.7447916666666,178.08374404907227,920.9114583333334,178.08374404907227L925.078125,178.08374404907227" id="L-CytoTable-pycytominer-0" class=" edge-thickness-normal edge-pattern-solid flowchart-link LS-CytoTable LE-pycytominer" style="fill:none;" marker-end="url(#flowchart-pointEnd)"></path></g><g class="edgeLabels"><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div 
xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" 
transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="edgeLabel"></span></div></foreignObject></g></g></g><g class="nodes"><g class="node default default" id="flowchart-images-43" label-offset-y="10.919459307237398" transform="translate(56.46875, 292.73430252075195)"><path style="" d="M 0,10.919459307237398 a 48.46875,10.919459307237398 0,0,0 96.9375 0 a 48.46875,10.919459307237398 0,0,0 -96.9375 0 l 0,44.919459307237396 a 48.46875,10.919459307237398 0,0,0 96.9375 0 l 0,-44.919459307237396" transform="translate(-48.46875,-33.3791889608561)"></path><g class="label" style="" transform="translate(-40.96875, -9.5)"><foreignObject width="81.9375" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">Cell Images</span></div></foreignObject></g></g><g class="node default default" id="flowchart-CellProfiler-44" transform="translate(203.2421875, 109.82651329040527)"><rect class="basic label-container" style="" rx="0" ry="0" x="-48.3046875" y="-17" width="96.609375" height="34"></rect><g class="label" style="" transform="translate(-40.8046875, -9.5)"><foreignObject width="81.609375" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">CellProfiler</span></div></foreignObject></g></g><g class="node default default" id="flowchart-csv-45" label-offset-y="9.709480122324159" transform="translate(341.234375, 75.85392379760742)"><path style="" d="M 0,9.709480122324159 a 39.6875,9.709480122324159 0,0,0 79.375 0 a 39.6875,9.709480122324159 0,0,0 -79.375 0 l 
0,43.70948012232416 a 39.6875,9.709480122324159 0,0,0 79.375 0 l 0,-43.70948012232416" transform="translate(-39.6875,-31.56422018348624)"></path><g class="label" style="" transform="translate(-32.1875, -9.5)"><foreignObject width="64.375" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">CSV Files</span></div></foreignObject></g></g><g class="node default default" id="flowchart-DeepProfiler-46" transform="translate(509.796875, 292.73430252075195)"><rect class="basic label-container" style="" rx="0" ry="0" x="-52.5234375" y="-17" width="105.046875" height="34"></rect><g class="label" style="" transform="translate(-45.0234375, -9.5)"><foreignObject width="90.046875" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">DeepProfiler</span></div></foreignObject></g></g><g class="node default default" id="flowchart-npz-47" label-offset-y="9.803586353620544" transform="translate(688.1484375, 292.73430252075195)"><path style="" d="M 0,9.803586353620544 a 40.3203125,9.803586353620544 0,0,0 80.640625 0 a 40.3203125,9.803586353620544 0,0,0 -80.640625 0 l 0,43.803586353620545 a 40.3203125,9.803586353620544 0,0,0 80.640625 0 l 0,-43.803586353620545" transform="translate(-40.3203125,-31.705379530430818)"></path><g class="label" style="" transform="translate(-32.8203125, -9.5)"><foreignObject width="65.640625" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">NPZ Files</span></div></foreignObject></g></g><g class="node default default" id="flowchart-cytominer-database-48" transform="translate(509.796875, 41.56928253173828)"><rect class="basic label-container" style="" rx="0" ry="0" x="-78.875" y="-17" width="157.75" height="34"></rect><g class="label" style="" transform="translate(-71.375, -9.5)"><foreignObject width="142.75" height="19"><div 
xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">cytominer-database</span></div></foreignObject></g></g><g class="node default default" id="flowchart-sqlite-49" label-offset-y="11.046187120630714" transform="translate(688.1484375, 41.56928253173828)"><path style="" d="M 0,11.046187120630714 a 49.4765625,11.046187120630714 0,0,0 98.953125 0 a 49.4765625,11.046187120630714 0,0,0 -98.953125 0 l 0,45.04618712063071 a 49.4765625,11.046187120630714 0,0,0 98.953125 0 l 0,-45.04618712063071" transform="translate(-49.4765625,-33.56928068094607)"></path><g class="label" style="" transform="translate(-41.9765625, -9.5)"><foreignObject width="83.953125" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">SQLite Files</span></div></foreignObject></g></g><g class="node default default" id="flowchart-cp_sqlite-50" label-offset-y="10.630119270010058" transform="translate(688.1484375, 178.08374404907227)"><path style="" d="M 0,10.630119270010058 a 46.234375,10.630119270010058 0,0,0 92.46875 0 a 46.234375,10.630119270010058 0,0,0 -92.46875 0 l 0,44.630119270010056 a 46.234375,10.630119270010058 0,0,0 92.46875 0 l 0,-44.630119270010056" transform="translate(-46.234375,-32.945178905015084)"></path><g class="label" style="" transform="translate(-38.734375, -9.5)"><foreignObject width="77.46875" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">SQLite File</span></div></foreignObject></g></g><g class="node default default" id="flowchart-in_carta-51" transform="translate(509.796875, 405.72166442871094)"><rect class="basic label-container" style="" rx="0" ry="0" x="-36.71875" y="-17" width="73.4375" height="34"></rect><g class="label" style="" transform="translate(-29.21875, -9.5)"><foreignObject width="58.4375" height="19"><div xmlns="http://www.w3.org/1999/xhtml" 
style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">IN Carta</span></div></foreignObject></g></g><g class="node default default" id="flowchart-ic_csv-52" label-offset-y="9.521321879111524" transform="translate(688.1484375, 405.72166442871094)"><path style="" d="M 0,9.521321879111524 a 38.4453125,9.521321879111524 0,0,0 76.890625 0 a 38.4453125,9.521321879111524 0,0,0 -76.890625 0 l 0,43.521321879111525 a 38.4453125,9.521321879111524 0,0,0 76.890625 0 l 0,-43.521321879111525" transform="translate(-38.4453125,-31.281982818667288)"></path><g class="label" style="" transform="translate(-30.9453125, -9.5)"><foreignObject width="61.890625" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">CSV files</span></div></foreignObject></g></g><g class="node default default" id="flowchart-pycytominer-53" transform="translate(977.1171875, 178.08374404907227)"><rect class="basic label-container" style="" rx="0" ry="0" x="-52.0390625" y="-17" width="104.078125" height="34"></rect><g class="label" style="" transform="translate(-44.5390625, -9.5)"><foreignObject width="89.078125" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">pycytominer</span></div></foreignObject></g></g><g class="node default default" id="flowchart-CytoTable-54" transform="translate(831.3515625, 178.08374404907227)"><rect class="basic label-container" style="fill:#FDCA88;stroke:#D96026;" rx="0" ry="0" x="-43.7265625" y="-17" width="87.453125" height="34"></rect><g class="label" style="" transform="translate(-36.2265625, -9.5)"><foreignObject width="72.453125" height="19"><div xmlns="http://www.w3.org/1999/xhtml" style="display: inline-block; white-space: nowrap;"><span class="nodeLabel">CytoTable</span></div></foreignObject></g></g></g></g></g></svg>
diff --git a/docs/source/overview.md b/docs/source/overview.md
index f7ca3862..5aacc2e5 100644
--- a/docs/source/overview.md
+++ b/docs/source/overview.md
@@ -100,6 +100,15 @@ Data source compatibility for CytoTable is focused (but not explicitly limited t
   * **Preset specification:** SQLite data sources from CellProfiler may use the configuration preset :code:`convert(..., preset="cellprofiler_sqlite", ...)` (:mod:`convert() <cytotable.convert.convert>`).
 ```
 
+#### IN Carta Data Sources
+
+- __Comma-separated values (.csv)__: [Molecular Devices IN Carta](https://www.moleculardevices.com/products/cellular-imaging-systems/high-content-analysis/in-carta-image-analysis-software) software provides output data in CSV format.
+
+```{eval-rst}
+  * **Manual specification:** CSV data source types may be manually specified by using :code:`convert(..., source_datatype="csv", ...)` (:mod:`convert() <cytotable.convert.convert>`).
+  * **Preset specification:** CSV data sources from IN Carta Image Analysis Software may use the configuration preset :code:`convert(..., preset="in-carta", ...)` (:mod:`convert() <cytotable.convert.convert>`).
+```
+
 ## Data Destinations
 
 ### Data Destination Locations
diff --git a/readme.md b/readme.md
index dff87fa2..4cb161c9 100644
--- a/readme.md
+++ b/readme.md
@@ -7,7 +7,7 @@ _Diagram showing data flow relative to this project._
 
 ## Summary
 
-CytoTable enables single-cell morphology data analysis by cleaning and transforming CellProfiler (`.csv` or `.sqlite`), cytominer-database (`.sqlite`), and DeepProfiler (`.npz`) output data at scale.
+CytoTable enables single-cell morphology data analysis by cleaning and transforming output data at scale from CellProfiler (`.csv` or `.sqlite`), cytominer-database (`.sqlite`), DeepProfiler (`.npz`), and other sources such as IN Carta.
 CytoTable creates parquet files for both independent analysis and for input into [Pycytominer](https://github.com/cytomining/pycytominer).
 The Parquet files will have a unified and documented data model, including referenceable schema where appropriate (for validation within Pycytominer or other projects).
 
diff --git a/tests/conftest.py b/tests/conftest.py
index b71290a8..0350ff99 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -134,6 +134,15 @@ def fixture_data_dirs_cytominerdatabase(data_dir_cytominerdatabase: str) -> List
     ]
 
 
+@pytest.fixture(name="data_dirs_in_carta")
+def fixture_data_dir_in_carta() -> List[str]:
+    """
+    Provide data directories for IN Carta test data
+    """
+
+    return [f"{pathlib.Path(__file__).parent}/data/in-carta/colas-lab"]
+
+
 @pytest.fixture(name="cytominerdatabase_sqlite")
 def fixture_cytominerdatabase_sqlite(
     fx_tempdir: str,
diff --git a/tests/test_convert.py b/tests/test_convert.py
index 8572fd29..8b877dfc 100644
--- a/tests/test_convert.py
+++ b/tests/test_convert.py
@@ -1071,3 +1071,43 @@ def test_cell_health_cellprofiler_to_cytominer_database_legacy(
             ]
         )
     )
+
+
+def test_in_carta_to_parquet(
+    load_parsl_default: None, fx_tempdir: str, data_dirs_in_carta: List[str]
+):
+    """
+    Testing IN Carta preset with CytoTable convert to parquet output.
+    """
+
+    for data_dir in data_dirs_in_carta:
+        # read the directory of data with wildcard
+        with duckdb.connect() as ddb:
+            ddb_result = ddb.execute(
+                f"""
+                SELECT *
+                FROM read_csv_auto('{data_dir}/*.csv')
+                """
+            ).arrow()
+
+        # process the data with cytotable using in-carta preset
+        cytotable_result = convert(
+            source_path=data_dir,
+            dest_path=f"{fx_tempdir}/{pathlib.Path(data_dir).name}",
+            dest_datatype="parquet",
+            source_datatype="csv",
+            preset="in-carta",
+            join=False,
+        )
+
+        # read the result from CytoTable as a table
+        cytotable_result_table = parquet.read_table(
+            # note: we use cast here to explicitly tell mypy about the types involved
+            cast(list, cytotable_result[list(cast(dict, cytotable_result).keys())[0]])[
+                0
+            ]["table"][0]
+        )
+
+        # check the data against one another
+        assert cytotable_result_table.schema.equals(ddb_result.schema)
+        assert cytotable_result_table.shape == ddb_result.shape