diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml
new file mode 100644
index 0000000000..33237d4424
--- /dev/null
+++ b/.github/workflows/ci.yaml
@@ -0,0 +1,44 @@
+name: ci
+
+on:
+  pull_request_review:
+    types: [submitted]
+
+jobs:
+  approved:
+    if: github.event.review.state == 'approved'  # run only for approving reviews
+    runs-on: ubuntu-latest
+    strategy:
+      fail-fast: false  # let the remaining matrix combinations finish if one fails
+      matrix:
+        py-version:  # quoted so versions stay strings (an unquoted 3.10 would become 3.1)
+          - '3.7'
+          - '3.8'
+        mpi: ['openmpi']
+        install-options: ['.', '.[hdf5,netcdf]']
+        pytorch-version:
+          - 'torch==1.7.1+cpu torchvision==0.8.2+cpu torchaudio==0.7.2'
+          - 'torch==1.8.1+cpu torchvision==0.9.1+cpu torchaudio==0.8.1'
+          - 'torch==1.9.0+cpu torchvision==0.10.0+cpu torchaudio==0.9.0'
+
+    # Job title rendered once per matrix combination.
+    name: Python ${{ matrix.py-version }} with ${{ matrix.pytorch-version }}; options ${{ matrix.install-options }}
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v2
+      - name: Setup MPI
+        uses: mpi4py/setup-mpi@v1
+        with:
+          mpi: ${{ matrix.mpi }}
+      - name: Use Python ${{ matrix.py-version }}
+        uses: actions/setup-python@v2
+        with:
+          python-version: ${{ matrix.py-version }}
+          architecture: x64
+      - name: Test
+        run: |
+          pip install pytest
+          pip install ${{ matrix.pytorch-version }} -f https://download.pytorch.org/whl/torch_stable.html
+          pip install "${{ matrix.install-options }}"
+          mpirun -n 3 pytest heat/
+          mpirun -n 4 pytest heat/
diff --git a/.github/workflows/pre-commit.yml b/.github/workflows/pre-commit.yml
deleted file mode 100644
index b52d4afe5c..0000000000
--- a/.github/workflows/pre-commit.yml
+++ /dev/null
@@ -1,14 +0,0 @@
-name: pre-commit
-
-on:
-  pull_request:
-  push:
-    branches: [main]
-
-jobs:
-  pre-commit:
-    runs-on: ubuntu-latest
-    steps:
-    - uses: actions/checkout@v2
-    - uses: actions/setup-python@v2
-    - uses: pre-commit/action@v2.0.0
diff --git a/CHANGELOG.md b/CHANGELOG.md
index ddb06676e4..3dca59403b 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -4,6 +4,7 @@
 - [#876](https://github.com/helmholtz-analytics/heat/pull/876) Make examples work (Lasso and kNN)
 - [#894](https://github.com/helmholtz-analytics/heat/pull/894) Change inclusion of license file
 - [#884](https://github.com/helmholtz-analytics/heat/pull/884) Added capabilities for PyTorch 1.10.0, this is now the recommended version to use.
+- [#937](https://github.com/helmholtz-analytics/heat/pull/937) Modified `ht.nonzero()` to return a tuple of 1-D arrays containing the non-zero indices in each dimension.
 
 ## Bug Fixes
 - [#826](https://github.com/helmholtz-analytics/heat/pull/826) Fixed `__setitem__` handling of distributed `DNDarray` values which have a different shape in the split dimension
diff --git a/CITATION.cff b/CITATION.cff
new file mode 100644
index 0000000000..b655ef2fcc
--- /dev/null
+++ b/CITATION.cff
@@ -0,0 +1,68 @@
+cff-version: 1.2.0
+message: "If you use this software, please cite it as below."
+authors:
+- family-names: "Götz"
+  given-names: "Markus"
+- family-names: "Debus"
+  given-names: "Charlotte"
+- family-names: "Coquelin"
+  given-names: "Daniel"
+- family-names: "Krajsek"
+  given-names: "Kai"
+- family-names: "Comito"
+  given-names: "Claudia"
+- family-names: "Knechtges"
+  given-names: "Philipp"
+- family-names: "Hagemeier"
+  given-names: "Björn"
+- family-names: "Tarnawa"
+  given-names: "Michael"
+- family-names: "Hanselmann"
+  given-names: "Simon"
+- family-names: "Siggel"
+  given-names: "Martin"
+- family-names: "Basermann"
+  given-names: "Achim"
+- family-names: "Streit"
+  given-names: "Achim"
+title: "Heat - Helmholtz Analytics Toolkit"
+version: "1.1.0"
+date-released: 2021-09-21
+url: "https://github.com/helmholtz-analytics/heat"
+preferred-citation:  # the conference paper to cite instead of the software record
+  type: conference-paper
+  authors:
+  - family-names: "Götz"
+    given-names: "Markus"
+  - family-names: "Debus"
+    given-names: "Charlotte"
+  - family-names: "Coquelin"
+    given-names: "Daniel"
+  - family-names: "Krajsek"
+    given-names: "Kai"
+  - family-names: "Comito"
+    given-names: "Claudia"
+  - family-names: "Knechtges"
+    given-names: "Philipp"
+  - family-names: "Hagemeier"
+    given-names: "Björn"
+  - family-names: "Tarnawa"
+    given-names: "Michael"
+  - family-names: "Hanselmann"
+    given-names: "Simon"
+  - family-names: "Siggel"
+    given-names: "Martin"
+  - family-names: "Basermann"
+    given-names: "Achim"
+  - family-names: "Streit"
+    given-names: "Achim"
+  title: "HeAT -- a Distributed and GPU-accelerated Tensor Framework for Data Analytics"
+  year: 2020
+  collection-title: "2020 IEEE International Conference on Big Data (IEEE Big Data 2020)"
+  doi: "10.1109/BigData50022.2020.9378050"  # DOI of the paper itself, not of the proceedings
+  conference:
+    name: "2020 IEEE International Conference on Big Data (IEEE Big Data 2020)"
+    date-start: 2020-12-10
+    date-end: 2020-12-13
+  start: 276
+  end: 287
diff --git a/doc/images/logo_heAT.pdf b/doc/images/logo_heAT.pdf
deleted file mode 100644
index d839eade2b..0000000000
Binary files a/doc/images/logo_heAT.pdf and /dev/null differ
diff --git a/heat/core/dndarray.py b/heat/core/dndarray.py
index 5ffce7a777..6034d446a7 100644
--- a/heat/core/dndarray.py
+++ b/heat/core/dndarray.py
@@ -872,7 +872,7 @@ def __getitem__(self, key: Union[int, Tuple[int, ...], List[int, ...]]) -> DNDar
             output_split = None
 
         # data are not distributed or split dimension is not affected by indexing
-        if not self.is_distributed or key[self.split] == slice(None):
+        if not self.is_distributed() or key[self.split] == slice(None):
             return DNDarray(
                 self.larray[key],
                 gshape=output_shape,
@@ -1654,7 +1654,7 @@ def __set(arr: DNDarray, value: DNDarray):
             raise Exception("Advanced indexing is not supported yet")
 
         split = self.split
-        if not self.is_distributed or key[split] == slice(None):
+        if not self.is_distributed() or key[split] == slice(None):
             return __set(self[key], value)
 
         if isinstance(key[split], slice):
diff --git a/heat/core/indexing.py b/heat/core/indexing.py
index 6261a072c6..0452000c2f 100644
--- a/heat/core/indexing.py
+++ b/heat/core/indexing.py
@@ -13,12 +13,12 @@
 __all__ = ["nonzero", "where"]
 
 
-def nonzero(x: DNDarray) -> DNDarray:
+def nonzero(x: DNDarray) -> Tuple[DNDarray, ...]:
     """
-    Return a :class:`~heat.core.dndarray.DNDarray` containing the indices of the elements that are non-zero.. (using ``torch.nonzero``)
-    If ``x`` is split then the result is split in the 0th dimension. However, this :class:`~heat.core.dndarray.DNDarray`
+    Return a tuple of :class:`~heat.core.dndarray.DNDarray` objects, one for each dimension of ``x``,
+    containing the indices of the non-zero elements in that dimension. If ``x`` is split then
+    each returned array is split in the 0th dimension. However, each :class:`~heat.core.dndarray.DNDarray`
     can be UNBALANCED as it contains the indices of the non-zero elements on each node.
-    Returns an array with one entry for each dimension of ``x``, containing the indices of the non-zero elements in that dimension.
     The values in ``x`` are always tested and returned in row-major, C-style order.
     The corresponding non-zero values can be obtained with: ``x[nonzero(x)]``.
 
@@ -32,10 +32,8 @@ def nonzero(x: DNDarray) -> DNDarray:
     >>> import heat as ht
     >>> x = ht.array([[3, 0, 0], [0, 4, 1], [0, 6, 0]], split=0)
     >>> ht.nonzero(x)
-    DNDarray([[0, 0],
-              [1, 1],
-              [1, 2],
-              [2, 1]], dtype=ht.int64, device=cpu:0, split=0)
+    (DNDarray([0, 1, 1, 2], dtype=ht.int64, device=cpu:0, split=0),
+        DNDarray([0, 1, 2, 1], dtype=ht.int64, device=cpu:0, split=0))
     >>> y = ht.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]], split=0)
     >>> y > 3
     DNDarray([[False, False, False],
@@ -48,6 +46,8 @@ def nonzero(x: DNDarray) -> DNDarray:
               [2, 0],
               [2, 1],
               [2, 2]], dtype=ht.int64, device=cpu:0, split=0)
+    (DNDarray([1, 1, 1, 2, 2, 2], dtype=ht.int64, device=cpu:0, split=0),
+        DNDarray([0, 1, 2, 0, 1, 2], dtype=ht.int64, device=cpu:0, split=0))
     >>> y[ht.nonzero(y > 3)]
     DNDarray([4, 5, 6, 7, 8, 9], dtype=ht.int64, device=cpu:0, split=0)
     """
@@ -56,39 +56,42 @@ def nonzero(x: DNDarray) -> DNDarray:
     except AttributeError:
         raise TypeError("Input must be a DNDarray, is {}".format(type(x)))
 
+    lcl_nonzero = torch.nonzero(input=local_x, as_tuple=False).transpose(0, 1)
+
     if x.split is None:
-        # if there is no split then just return the values from torch
-        lcl_nonzero = torch.nonzero(input=local_x, as_tuple=False)
+        # if there is no split then just return the transpose of values from torch
+
         gout = list(lcl_nonzero.size())
         is_split = None
     else:
         # a is split
-        lcl_nonzero = torch.nonzero(input=local_x, as_tuple=False)
         # adjust local indices along split dimension
         _, displs = x.counts_displs()
-        lcl_nonzero[..., x.split] += displs[x.comm.rank]
+        lcl_nonzero[x.split] += displs[x.comm.rank]
         del displs
+
         # get global size of split dimension
         gout = list(lcl_nonzero.size())
-        gout[0] = x.comm.allreduce(gout[0], MPI.SUM)
+        gout[1] = x.comm.allreduce(gout[1], MPI.SUM)
         is_split = 0
 
-    if x.ndim == 1:
-        lcl_nonzero = lcl_nonzero.squeeze(dim=1)
-    for g in range(len(gout) - 1, -1, -1):
-        if gout[g] == 1:
-            del gout[g]
-
-    return DNDarray(
-        lcl_nonzero,
-        gshape=tuple(gout),
-        dtype=types.canonical_heat_type(lcl_nonzero.dtype),
-        split=is_split,
-        device=x.device,
-        comm=x.comm,
-        balanced=False,
+    non_zero_indices = list(
+        [
+            DNDarray(
+                dim_indices,
+                gshape=tuple(gout),
+                dtype=types.canonical_heat_type(lcl_nonzero.dtype),
+                split=is_split,
+                device=x.device,
+                comm=x.comm,
+                balanced=False,
+            )
+            for dim_indices in lcl_nonzero
+        ]
     )
 
+    return tuple(non_zero_indices)
+
 
 DNDarray.nonzero = lambda self: nonzero(self)
 DNDarray.nonzero.__doc__ = nonzero.__doc__
diff --git a/heat/core/tests/test_indexing.py b/heat/core/tests/test_indexing.py
index 4707aa28ab..58c7410456 100644
--- a/heat/core/tests/test_indexing.py
+++ b/heat/core/tests/test_indexing.py
@@ -9,18 +9,18 @@ def test_nonzero(self):
         a = ht.array([[1, 2, 3], [4, 5, 2], [7, 8, 9]], split=None)
         cond = a > 3
         nz = ht.nonzero(cond)
-        self.assertEqual(nz.gshape, (5, 2))
-        self.assertEqual(nz.dtype, ht.int64)
-        self.assertEqual(nz.split, None)
+        self.assertEqual(len(nz), 2)
+        self.assertEqual(len(nz[0]), 5)
+        self.assertEqual(nz[0].dtype, ht.int64)
 
         # split
         a = ht.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]], split=1)
         cond = a > 3
         nz = cond.nonzero()
-        self.assertEqual(nz.gshape, (6, 2))
-        self.assertEqual(nz.dtype, ht.int64)
-        self.assertEqual(nz.split, 0)
-        a[nz] = 10.0
+        self.assertEqual(len(nz), 2)
+        self.assertEqual(len(nz[0]), 6)
+        self.assertEqual(nz[0].dtype, ht.int64)
+        a[nz] = 10
         self.assertEqual(ht.all(a[nz] == 10), 1)
 
     def test_where(self):
diff --git a/scripts/tutorial.ipynb b/scripts/tutorial.ipynb
index f2ce191bd2..95cc6e3465 100644
--- a/scripts/tutorial.ipynb
+++ b/scripts/tutorial.ipynb
@@ -1044,38 +1044,6 @@
     "a + b"
    ]
   },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The example below will show that it is also possible to use operations on tensors with different split and the proper result calculated. However, this should be used seldomly and with small data amounts only, as it entails sending large amounts of data over the network."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 34,
-   "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "(0/2) tensor([[9., 9., 9., 9., 9., 9.],\n",
-       "(0/2)         [9., 9., 9., 9., 9., 9.]])\n",
-       "(1/2) tensor([[9., 9., 9., 9., 9., 9.],\n",
-       "(1/2)         [9., 9., 9., 9., 9., 9.]])"
-      ]
-     },
-     "execution_count": 34,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "a = ht.full((4, 6,), 8, split=0)\n",
-    "b = ht.ones((4, 6,), split=1)\n",
-    "a + b"
-   ]
-  },
   {
    "cell_type": "markdown",
    "metadata": {},