diff --git a/CHANGELOG.rst b/CHANGELOG.rst index f53dc0b4..99c8470b 100644 --- a/CHANGELOG.rst +++ b/CHANGELOG.rst @@ -1,7 +1,7 @@ Changelog ========= -Version v1.1.0 +Version v2.0.0 -------------- New Features @@ -21,8 +21,16 @@ Improvements - Added kwarg: ``raise_missing_property`` to ``NodePopulation.get`` - Undeprecated calling ``Edges.get`` and ``EdgePopulation.get`` with ``properties=None`` +Bug Fixes +~~~~~~~~~ +- Fixed the ``Same property with different dtype`` issue with ``nodes.get``, ``edges.get`` + Breaking Changes ~~~~~~~~~~~~~~~~ +- ``nodes.get`` and ``edges.get`` (and ``network.get``) no longer return a dataframe + - returns a generator yielding tuples of ``(<population_name>, <dataframe>)`` instead + - to get the previous behavior (all in one dataframe): ``pd.concat(df for _, df in circuit.nodes.get(*args, **kwargs))`` +- Removed ``Network.property_dtypes``, ``CircuitIds.index_schema`` - ``Circuit.node_sets``, ``Simulation.node_sets`` returns ``NodeSets`` object initialized with empty dict when node sets file is not present - ``NodeSet.resolved`` is no longer available - ``FrameReport.node_set`` returns node_set name instead of resolved node set query diff --git a/bluepysnap/circuit_ids.py b/bluepysnap/circuit_ids.py index f015dc4d..26cb0490 100644 --- a/bluepysnap/circuit_ids.py +++ b/bluepysnap/circuit_ids.py @@ -55,14 +55,6 @@ def __init__(self, index, sort_index=True): index = index.sortlevel()[0] self.index = index - @property - def index_schema(self): - """Return an empty index with the same names and dtypes of the wrapped index.""" - # NOTE: Since pandas 2.1.0, the index needs to contain the explicit dtypes.
In pd.concat, - # the dtypes of multi-index are coerced to 'object' if any dataframe has indices with - # dtype='object' - return self.index[:0] - @classmethod def _instance(cls, index, sort_index=True): """The instance returned by the functions.""" diff --git a/bluepysnap/network.py b/bluepysnap/network.py index b0cc61de..6820c241 100644 --- a/bluepysnap/network.py +++ b/bluepysnap/network.py @@ -48,22 +48,6 @@ def _populations(self): def population_names(self): """Should define all sorted NetworkObjects population names from the Circuit.""" - @cached_property - def property_dtypes(self): - """Returns all the NetworkObjects property dtypes for the Circuit.""" - - def _update(d, index, value): - if d.setdefault(index, value) != value: - raise BluepySnapError( - f"Same property with different dtype. {index}: {value}!= {d[index]}" - ) - - res = {} - for pop in self.values(): - for varname, dtype in pop.property_dtypes.items(): - _update(res, varname, dtype) - return pd.Series(res) - def keys(self): """Returns iterator on the NetworkObjectPopulation names. @@ -149,7 +133,7 @@ def ids(self, group=None, sample=None, limit=None): @abc.abstractmethod def get(self, group=None, properties=None): - """Returns the properties of the NetworkObject.""" + """Yields the properties of the NetworkObject.""" ids = self.ids(group) properties = utils.ensure_list(properties) # We don t convert to set properties itself to keep the column order. @@ -159,14 +143,6 @@ def get(self, group=None, properties=None): if unknown_props: raise BluepySnapError(f"Unknown properties required: {unknown_props}") - # Retrieve the dtypes of the selected properties. - # However, the int dtype may not be preserved if some values are NaN. 
- dtypes = { - column: dtype - for column, dtype in self.property_dtypes.items() - if column in properties_set - } - dataframes = [pd.DataFrame(columns=properties, index=ids.index_schema).astype(dtypes)] for name, pop in sorted(self.items()): # since ids is sorted, global_pop_ids should be sorted as well global_pop_ids = ids.filter_population(name) @@ -177,10 +153,9 @@ def get(self, group=None, properties=None): # However, it's a bit more performant than converting the Series to numpy arrays. pop_df = pd.DataFrame({prop: pop.get(pop_ids, prop) for prop in pop_properties}) pop_df.index = global_pop_ids.index - dataframes.append(pop_df) - res = pd.concat(dataframes) - assert res.index.is_monotonic_increasing, "The index should be already sorted" - return res + + # Sort the columns in the given order + yield name, pop_df[[p for p in properties if p in pop_properties]] @abc.abstractmethod def __getstate__(self): diff --git a/doc/source/notebooks/03_node_properties.ipynb b/doc/source/notebooks/03_node_properties.ipynb index 12e6f08f..259a14a4 100644 --- a/doc/source/notebooks/03_node_properties.ipynb +++ b/doc/source/notebooks/03_node_properties.ipynb @@ -14,13 +14,407 @@ "metadata": {}, "source": [ "## Preamble\n", - "The code in this section is identical to the code in the sections from \"Preamble\" to \"Properties and methods\" from the previous tutorial. It assumumes that you have already downloaded the circuit. If not, take a look to the notebook **01_circuits** (Downloading a circuit)." + "The code in this section is identical to the code in the sections from \"Preamble\" to \"Properties and methods\" from the previous tutorial. It assumes that you have already downloaded the circuit. If not, take a look to the notebook **01_circuits** (Downloading a circuit)." 
] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "import matplotlib.cm as cm\n", + "%matplotlib inline\n", + "\n", + "import bluepysnap\n", + "\n", + "POINT_SIZE = 1\n", + "SAMPLE_SIZE = 30000\n", + "\n", + "# To keep the plots constant\n", + "np.random.seed(0)\n", + "\n", + "# load the circuit and store the node population\n", + "circuit_path = \"sonata/circuit_sonata.json\"\n", + "circuit = bluepysnap.Circuit(circuit_path)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Node properties and methods\n", + "Node populations provide information about the collection of nodes, and what information is available for each of the nodes themselves.\n", + "\n", + "### Acquiring data from all populations\n", + "\n", + "To gather data from all populations `circuit.nodes.get` can be used. \n", + "\n", + "It returns a generator object of tuples of `(<population_name>, <dataframe>)`:" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "generator_all_nodes = circuit.nodes.get(properties=['layer', 'synapse_class'])\n", + "generator_all_nodes" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can easily convert this to a dictionary with the population names acting as keys. Let's try that and print out the dataframes by population:" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "---CorticoThalamic_projections---\n", + "\n", + "\n", + "---MedialLemniscus_projections---\n", + "\n", + "\n", + "---thalamus_neurons---\n" + ] + }, + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
layersynapse_class
populationnode_ids
thalamus_neurons0RtINH
1RtINH
2RtINH
3RtINH
4RtINH
.........
100760VPLINH
100761VPLINH
100762VPLINH
100763VPLINH
100764VPLINH
\n", + "

100765 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " layer synapse_class\n", + "population node_ids \n", + "thalamus_neurons 0 Rt INH\n", + " 1 Rt INH\n", + " 2 Rt INH\n", + " 3 Rt INH\n", + " 4 Rt INH\n", + "... ... ...\n", + " 100760 VPL INH\n", + " 100761 VPL INH\n", + " 100762 VPL INH\n", + " 100763 VPL INH\n", + " 100764 VPL INH\n", + "\n", + "[100765 rows x 2 columns]" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "dict_all_nodes = dict(generator_all_nodes)\n", + "\n", + "for population, df in dict_all_nodes.items():\n", + " print(f\"---{population}---\")\n", + " if df.empty:\n", + " print('\\n')\n", + " else:\n", + " display(df)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Please note, as with generators in python in general, once the items of the generator are exhausted, it will no longer return anything:" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[]" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "[*generator_all_nodes]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Combining output of `circuit.nodes.get`\n", + "To combine the dataframes from all populations, we can use `pandas.concat`. We can combine the dictionary values by \n", + "```python\n", + "pd.concat(dict_all_nodes.values())\n", + "```\n", + "or we can skip the dictionary creation part by just concatenating the dataframes from the generator:" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
layersynapse_class
populationnode_ids
CorticoThalamic_projections0NaNNaN
1NaNNaN
2NaNNaN
3NaNNaN
4NaNNaN
............
thalamus_neurons100760VPLINH
100761VPLINH
100762VPLINH
100763VPLINH
100764VPLINH
\n", + "

189208 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " layer synapse_class\n", + "population node_ids \n", + "CorticoThalamic_projections 0 NaN NaN\n", + " 1 NaN NaN\n", + " 2 NaN NaN\n", + " 3 NaN NaN\n", + " 4 NaN NaN\n", + "... ... ...\n", + "thalamus_neurons 100760 VPL INH\n", + " 100761 VPL INH\n", + " 100762 VPL INH\n", + " 100763 VPL INH\n", + " 100764 VPL INH\n", + "\n", + "[189208 rows x 2 columns]" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "generator_nodes_all = circuit.nodes.get(properties=['layer', 'synapse_class'])\n", + "df_all_nodes = pd.concat(df for _, df in generator_nodes_all) # \"_, df\": ignore the population names of the tuples\n", + "df_all_nodes" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "However, as can be seen from the output above, combining the dataframes oftentimes results in there being a whole lot of `NaN` values in the dataframe, due to the properties missing from the other population.\n", + "\n", + "Therefore, if you know you're only working with one population, it is strongly recommended to use the node population object.\n", + "\n", + "### Working with node population objects\n", + "\n", + "Accessing a node population is as easy as accessing a dictionary. Just use the same `dict` syntax with the `circuit.nodes` object. 
Let's try that and print all the available properties for a population:" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, "outputs": [ { "data": { @@ -48,28 +442,12 @@ " 'z'}" ] }, - "execution_count": 1, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "import numpy as np\n", - "import matplotlib.pyplot as plt\n", - "import matplotlib.cm as cm\n", - "%matplotlib inline\n", - "\n", - "import bluepysnap\n", - "\n", - "POINT_SIZE = 1\n", - "SAMPLE_SIZE = 30000\n", - "\n", - "# To keep the plots constant\n", - "np.random.seed(0)\n", - "\n", - "# load the circuit and store the node population\n", - "circuit_path = \"sonata/circuit_sonata.json\"\n", - "circuit = bluepysnap.Circuit(circuit_path)\n", "node_population = circuit.nodes[\"thalamus_neurons\"]\n", "node_population.property_names" ] @@ -78,20 +456,12 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Node properties and methods\n", - "Node populations provide information about the collection of nodes, and what information is available for each of the nodes themselves." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Let's begin by retrieving all nodes with their associated layer, synapse type, and position in 3D space. We can then use this to understand how the synapse types are distributed between layers." + "Let's now retrieve all nodes with their associated layer, synapse type, and position in 3D space. We can then use this to understand how the synapse types are distributed between layers." 
] }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 7, "metadata": {}, "outputs": [ { @@ -168,7 +538,7 @@ " VPL 342 342 342" ] }, - "execution_count": 2, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -187,7 +557,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 8, "metadata": {}, "outputs": [ { @@ -215,7 +585,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 9, "metadata": {}, "outputs": [ { @@ -309,7 +679,7 @@ "4 Rt INH 156.274872 572.608337 235.786240" ] }, - "execution_count": 4, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } @@ -320,7 +690,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 10, "metadata": {}, "outputs": [ { @@ -356,7 +726,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 11, "metadata": {}, "outputs": [ { @@ -394,16 +764,16 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 12, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "" + "" ] }, - "execution_count": 7, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -421,7 +791,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 13, "metadata": {}, "outputs": [ { @@ -469,7 +839,7 @@ " 'CT_afferents': {'population': 'CorticoThalamic_projections'}}" ] }, - "execution_count": 8, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } @@ -487,7 +857,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 14, "metadata": {}, "outputs": [], "source": [ @@ -503,7 +873,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 15, "metadata": {}, "outputs": [], "source": [ @@ -519,7 +889,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 16, "metadata": {}, "outputs": [ { @@ -566,7 +936,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 
17, "metadata": {}, "outputs": [ { @@ -601,7 +971,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 18, "metadata": {}, "outputs": [ { @@ -610,7 +980,7 @@ "{'Rt_RC', 'VPL_IN', 'VPL_TC'}" ] }, - "execution_count": 13, + "execution_count": 18, "metadata": {}, "output_type": "execute_result" } @@ -628,7 +998,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 19, "metadata": {}, "outputs": [ { @@ -641,7 +1011,7 @@ " ['VPL_IN', 'bAC_IN']], dtype=object)" ] }, - "execution_count": 14, + "execution_count": 19, "metadata": {}, "output_type": "execute_result" } @@ -660,7 +1030,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 20, "metadata": {}, "outputs": [ { @@ -754,7 +1124,7 @@ "28607 mc2;Rt INH 173.007538 552.684753 837.944153" ] }, - "execution_count": 15, + "execution_count": 20, "metadata": {}, "output_type": "execute_result" } diff --git a/doc/source/notebooks/04_edge_properties.ipynb b/doc/source/notebooks/04_edge_properties.ipynb index 64139c01..824d57fb 100644 --- a/doc/source/notebooks/04_edge_properties.ipynb +++ b/doc/source/notebooks/04_edge_properties.ipynb @@ -14,13 +14,45 @@ "metadata": {}, "source": [ "## Preamble\n", - "The code in this section is similar to the code in sections \"Introduction\" and \"Loading\" from the previous tutorial, but applied to edges. It assumumes that you have already downloaded the circuit. If not, take a look to the notebook **01_circuits** (Downloading a circuit)." + "The code in this section is similar to the code in sections \"Introduction\" and \"Loading\" from the previous tutorial, but applied to edges. It assumes that you have already downloaded the circuit. If not, take a look to the notebook **01_circuits** (Downloading a circuit)." 
] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, + "outputs": [], + "source": [ + "import bluepysnap\n", + "import matplotlib.pyplot as plt\n", + "%matplotlib inline\n", + "\n", + "# load the circuit and store the node population\n", + "circuit_path = \"sonata/circuit_sonata.json\"\n", + "circuit = bluepysnap.Circuit(circuit_path)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Properties and methods\n", + "\n", + "### Getting properties from all populations\n", + "Working with the output of `circuit.edges.get` follows the principles of that of `circuit.nodes.get` and won't be covered here. Please have a look at the previous notebook `03_node_properties.ipynb`.\n", + "\n", + "### Working with edge population objects\n", + "\n", + "\n", + "Edge populations provide information about the collection of edges, and what information is available for each of the edges themselves.\n", + "\n", + "Let's start by grabbing a population and printing out its available properties:" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "data": { @@ -61,20 +93,12 @@ " 'u_syn'}" ] }, - "execution_count": 1, + "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "import bluepysnap\n", - "import matplotlib.pyplot as plt\n", - "%matplotlib inline\n", - "\n", - "# load the circuit and store the node population\n", - "circuit_path = \"sonata/circuit_sonata.json\"\n", - "circuit = bluepysnap.Circuit(circuit_path)\n", - "\n", "# we can also find other edge names with \"circuit.edges.population_names\"\n", "edge_population = circuit.edges[\"thalamus_neurons__thalamus_neurons__chemical\"]\n", "edge_population.property_names" @@ -84,15 +108,12 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Properties and methods\n", - "Edge populations provide information about the collection of edges, and what information is available for each of the edges themselves.\n", -
"\n", - "For example, the edge population `name` and `size` (that is, the number of nodes it contains) can be retrieved:" + "Also, there are additional object-level properties. For example, the edge population `name` and `size` (that is, the number of edges it contains) can be retrieved with:" ] }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 3, "metadata": {}, "outputs": [ { @@ -118,7 +139,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "metadata": { "scrolled": true }, @@ -140,19 +161,17 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 5, "metadata": {}, "outputs": [ { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ - "
" + "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], @@ -172,19 +191,17 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 6, "metadata": {}, "outputs": [ { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ - "
" + "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], diff --git a/tests/test_circuit.py b/tests/test_circuit.py index 5b990017..b7aa77d9 100644 --- a/tests/test_circuit.py +++ b/tests/test_circuit.py @@ -1,6 +1,7 @@ import json import pickle +import pandas as pd import pytest from libsonata import SonataError @@ -78,6 +79,7 @@ def test_integration(): edge_ids = circuit.edges.afferent_edges(node_ids) edge_props = circuit.edges.get(edge_ids, properties=["syn_weight", "delay"]) edge_reduced = edge_ids.limit(2) + edge_props = pd.concat(df for _, df in edge_props) edge_props_reduced = edge_props.loc[edge_reduced] assert edge_props_reduced["syn_weight"].tolist() == [1, 1] diff --git a/tests/test_circuit_ids.py b/tests/test_circuit_ids.py index 09c874da..87dac57b 100644 --- a/tests/test_circuit_ids.py +++ b/tests/test_circuit_ids.py @@ -81,12 +81,6 @@ def test_init(self): assert isinstance(self.test_obj_sorted, self.ids_cls) - def test_index_schema(self): - schema = self.test_obj_unsorted.index_schema - index = self.test_obj_unsorted.index - npt.assert_array_equal(schema.dtypes, index.dtypes) - npt.assert_array_equal(schema.names, index.names) - def test_from_arrays(self): tested = self.ids_cls.from_arrays(["a", "b"], [0, 1]) pdt.assert_index_equal(tested.index, self._circuit_ids(["a", "b"], [0, 1])) diff --git a/tests/test_edges.py b/tests/test_edges.py index df21c9d8..b940aaae 100644 --- a/tests/test_edges.py +++ b/tests/test_edges.py @@ -85,80 +85,6 @@ def test_property_names(self): "syn_weight", } - def test_property_dtypes(self): - expected = pd.Series( - data=[ - dtype("float32"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float32"), - dtype("float64"), - dtype("float32"), - dtype("float64"), - dtype("int64"), - dtype("int64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float32"), - 
dtype("float32"), - dtype("float64"), - dtype("float64"), - IDS_DTYPE, - IDS_DTYPE, - dtype("O"), - dtype("int32"), - ], - index=[ - "syn_weight", - "@dynamics:param1", - "afferent_surface_y", - "afferent_surface_z", - "conductance", - "efferent_center_x", - "delay", - "afferent_center_z", - "efferent_section_id", - "afferent_section_id", - "efferent_center_y", - "afferent_center_x", - "efferent_surface_z", - "afferent_center_y", - "afferent_surface_x", - "efferent_surface_x", - "afferent_section_pos", - "efferent_section_pos", - "efferent_surface_y", - "efferent_center_z", - "@source_node", - "@target_node", - "other1", - "other2", - ], - ).sort_index() - pdt.assert_series_equal(self.test_obj.property_dtypes.sort_index(), expected) - - def test_property_dtypes_fail(self): - a = pd.Series( - data=[dtype("int64"), dtype("float64")], index=["syn_weight", "efferent_surface_z"] - ).sort_index() - b = pd.Series( - data=[dtype("int32"), dtype("float64")], index=["syn_weight", "efferent_surface_z"] - ).sort_index() - - with patch( - "bluepysnap.edges.EdgePopulation.property_dtypes", new_callable=PropertyMock - ) as mock: - mock.side_effect = [a, b] - circuit = Circuit(str(TEST_DATA_DIR / "circuit_config.json")) - test_obj = test_module.Edges(circuit) - with pytest.raises(BluepySnapError): - test_obj.property_dtypes.sort_index() - def test_ids(self): np.random.seed(0) # single edge ID --> CircuitEdgeIds return populations with the 0 id @@ -266,6 +192,8 @@ def test_get(self): assert tested == ids tested = self.test_obj.get(ids, properties=self.test_obj.property_names) + tested = pd.concat(df for _, df in tested) + assert len(tested) == 8 assert len(list(tested)) == 24 @@ -274,9 +202,9 @@ def test_get(self): # the index of the dataframe is indentical to the CircuitEdgeIds index pdt.assert_index_equal(tested.index, ids.index) - pdt.assert_frame_equal( - self.test_obj.get([0, 1, 2, 3], properties=self.test_obj.property_names), tested - ) + tested2 = self.test_obj.get([0, 1, 2, 
3], properties=self.test_obj.property_names) + tested2 = pd.concat(df for _, df in tested2) + pdt.assert_frame_equal(tested2, tested) # tested columns tested = self.test_obj.get(ids, properties=["other2", "other1", "@source_node"]) @@ -302,7 +230,8 @@ def test_get(self): names=["population", "edge_ids"], ), ) - pdt.assert_frame_equal(tested, expected) + tested = pd.concat(df for _, df in tested) + pdt.assert_frame_equal(tested[expected.columns], expected) tested = self.test_obj.get( CircuitEdgeIds.from_dict({"default2": [0, 1, 2, 3]}), @@ -325,6 +254,7 @@ def test_get(self): names=["population", "edge_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) with pytest.raises(KeyError, match="'default'"): @@ -336,8 +266,6 @@ def test_get(self): ) expected = pd.DataFrame( { - "other2": np.array([np.NaN, np.NaN, np.NaN, np.NaN], dtype=float), - "other1": np.array([np.NaN, np.NaN, np.NaN, np.NaN], dtype=object), "@source_node": np.array([2, 0, 0, 2], dtype=int), }, index=pd.MultiIndex.from_tuples( @@ -350,6 +278,7 @@ def test_get(self): names=["population", "edge_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) tested = self.test_obj.get(ids, properties="@source_node") @@ -371,6 +300,7 @@ def test_get(self): names=["population", "edge_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) tested = self.test_obj.get(ids, properties="other2") @@ -392,13 +322,14 @@ def test_get(self): names=["population", "edge_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) with pytest.raises(BluepySnapError, match="Unknown properties required: {'unknown'}"): - self.test_obj.get(ids, properties=["other2", "unknown"]) + next(self.test_obj.get(ids, properties=["other2", "unknown"])) with pytest.raises(BluepySnapError, match="Unknown properties required: {'unknown'}"): - self.test_obj.get(ids, 
properties="unknown") + next(self.test_obj.get(ids, properties="unknown")) def test_afferent_nodes(self): assert self.test_obj.afferent_nodes(0) == CircuitNodeIds.from_arrays(["default"], [2]) @@ -466,8 +397,10 @@ def test_pathway_edges(self): target = CircuitNodeIds.from_dict({"default": [1, 2]}) expected_index = CircuitEdgeIds.from_dict({"default": [1, 2], "default2": [1, 2]}) + tested = self.test_obj.pathway_edges(source=source, target=target, properties=properties) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.pathway_edges(source=source, target=target, properties=properties), + tested, pd.DataFrame( [ [88.1862], @@ -483,8 +416,10 @@ def test_pathway_edges(self): properties = [Synapse.SOURCE_NODE_ID, "other1"] expected_index = CircuitEdgeIds.from_dict({"default": [1, 2], "default2": [1, 2]}) + tested = self.test_obj.pathway_edges(source=source, target=target, properties=properties) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.pathway_edges(source=source, target=target, properties=properties), + tested, pd.DataFrame( [ [0, np.nan], @@ -520,8 +455,10 @@ def test_pathway_edges(self): source = CircuitNodeId("default", 0) target = CircuitNodeId("default", 1) expected_index = CircuitEdgeIds.from_dict({"default": [1, 2], "default2": [1, 2]}) + tested = self.test_obj.pathway_edges(source=source, target=target, properties=properties) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.pathway_edges(source=source, target=target, properties=properties), + tested, pd.DataFrame( [ [0, 1], @@ -555,8 +492,10 @@ def test_afferent_edges(self): assert self.test_obj.afferent_edges(CircuitNodeId("default", 1), None) == expected properties = [Synapse.AXONAL_DELAY] + tested = self.test_obj.afferent_edges(1, properties) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.afferent_edges(1, properties), + tested, pd.DataFrame( [ [88.1862], @@ 
-577,10 +516,12 @@ def test_afferent_edges(self): expected_index = CircuitEdgeIds.from_dict( {"default": [0, 1, 2, 3], "default2": [0, 1, 2, 3]} ) + tested = self.test_obj.afferent_edges( + CircuitNodeIds.from_dict({"default": [0, 1]}), properties=properties + ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.afferent_edges( - CircuitNodeIds.from_dict({"default": [0, 1]}), properties=properties - ), + tested, pd.DataFrame( [ [2, np.nan], @@ -606,8 +547,10 @@ def test_efferent_edges(self): assert self.test_obj.efferent_edges(CircuitNodeId("default", 2), None) == expected properties = [Synapse.AXONAL_DELAY] + tested = self.test_obj.efferent_edges(2, properties) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.efferent_edges(2, properties), + tested, pd.DataFrame( [ [99.8945], @@ -625,8 +568,10 @@ def test_efferent_edges(self): properties = [Synapse.TARGET_NODE_ID, "other1"] expected_index = CircuitEdgeIds.from_dict({"default": [0, 3], "default2": [0, 3]}) + tested = self.test_obj.efferent_edges(2, properties) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.efferent_edges(2, properties), + tested, pd.DataFrame( [ [0, np.nan], @@ -644,15 +589,17 @@ def test_pair_edges(self): # no connection between 0 and 2 assert self.test_obj.pair_edges(0, 2, None) == CircuitEdgeIds.from_arrays([], []) actual = self.test_obj.pair_edges(0, 2, [Synapse.AXONAL_DELAY]) - assert actual.empty + assert next(actual, None) is None assert self.test_obj.pair_edges(2, 0, None) == CircuitEdgeIds.from_tuples( [("default", 0), ("default2", 0)] ) properties = [Synapse.AXONAL_DELAY] + tested = self.test_obj.pair_edges(2, 0, properties) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal( - self.test_obj.pair_edges(2, 0, properties), + tested, pd.DataFrame( [ [99.8945], @@ -756,7 +703,6 @@ def test_pickle(self, tmp_path): # trigger some cached properties, to makes sure they 
aren't being pickeld self.test_obj.size self.test_obj.property_names - self.test_obj.property_dtypes with open(pickle_path, "wb") as fd: pickle.dump(self.test_obj, fd) diff --git a/tests/test_nodes.py b/tests/test_nodes.py index ec70b043..84be8af7 100644 --- a/tests/test_nodes.py +++ b/tests/test_nodes.py @@ -79,60 +79,6 @@ def test_property_value(self): assert self.test_obj.property_values("mtype") == {"L2_X", "L7_X", "L9_Z", "L8_Y", "L6_Y"} assert self.test_obj.property_values("other2") == {10, 11, 12, 13} - def test_property_dtypes(self): - expected = pd.Series( - data=[ - dtype("int64"), - dtype("O"), - dtype("O"), - dtype("O"), - dtype("O"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("float64"), - dtype("O"), - dtype("int64"), - ], - index=[ - "layer", - "model_template", - "model_type", - "morphology", - "mtype", - "rotation_angle_xaxis", - "rotation_angle_yaxis", - "rotation_angle_zaxis", - "x", - "y", - "z", - "@dynamics:holding_current", - "other1", - "other2", - ], - ).sort_index() - pdt.assert_series_equal(self.test_obj.property_dtypes.sort_index(), expected) - - def test_property_dtypes_fail(self): - a = pd.Series( - data=[dtype("int64"), dtype("O")], index=["layer", "model_template"] - ).sort_index() - b = pd.Series( - data=[dtype("int32"), dtype("O")], index=["layer", "model_template"] - ).sort_index() - - with patch( - "bluepysnap.nodes.NodePopulation.property_dtypes", new_callable=PropertyMock - ) as mock: - mock.side_effect = [a, b] - circuit = Circuit(str(TEST_DATA_DIR / "circuit_config.json")) - test_obj = test_module.Nodes(circuit) - with pytest.raises(BluepySnapError): - test_obj.property_dtypes.sort_index() - def test_ids(self): np.random.seed(0) @@ -291,6 +237,7 @@ def test_ids(self): def test_get(self): # return all properties for all the ids tested = self.test_obj.get() + tested = pd.concat(df for _, df in tested) assert tested.shape == (self.test_obj.size, 
len(self.test_obj.property_names)) # put NaN for the undefined values : only values for default2 in dropna @@ -305,6 +252,7 @@ def test_get(self): # tested columns tested = self.test_obj.get(properties=["other2", "other1", "layer"]) + tested = pd.concat(df for _, df in tested) expected = pd.DataFrame( { "other2": np.array([np.NaN, np.NaN, np.NaN, 10, 11, 12, 13], dtype=float), @@ -324,7 +272,7 @@ def test_get(self): names=["population", "node_ids"], ), ) - pdt.assert_frame_equal(tested, expected) + pdt.assert_frame_equal(tested[expected.columns], expected) tested = self.test_obj.get( group={"population": "default2"}, properties=["other2", "other1", "layer"] @@ -345,6 +293,7 @@ def test_get(self): names=["population", "node_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) with pytest.raises(KeyError, match="'default'"): @@ -355,8 +304,6 @@ def test_get(self): ) expected = pd.DataFrame( { - "other2": np.array([np.NaN, np.NaN, np.NaN], dtype=float), - "other1": np.array([np.NaN, np.NaN, np.NaN], dtype=object), "layer": np.array([2, 6, 6], dtype=int), }, index=pd.MultiIndex.from_tuples( @@ -368,6 +315,7 @@ def test_get(self): names=["population", "node_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) tested = self.test_obj.get(properties="layer") @@ -388,6 +336,7 @@ def test_get(self): names=["population", "node_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) tested = self.test_obj.get(properties="other2") @@ -408,13 +357,14 @@ def test_get(self): names=["population", "node_ids"], ), ) + tested = pd.concat(df for _, df in tested) pdt.assert_frame_equal(tested, expected) with pytest.raises(BluepySnapError, match="Unknown properties required: {'unknown'}"): - self.test_obj.get(properties=["other2", "unknown"]) + next(self.test_obj.get(properties=["other2", "unknown"])) with pytest.raises(BluepySnapError, match="Unknown 
properties required: {'unknown'}"): - self.test_obj.get(properties="unknown") + next(self.test_obj.get(properties="unknown")) def test_functionality_with_separate_node_set(self): with pytest.raises(BluepySnapError, match="Undefined node set"): @@ -427,12 +377,11 @@ def test_functionality_with_separate_node_set(self): ) with pytest.raises(BluepySnapError, match="Undefined node set"): - self.test_obj.get("ExtraLayer2") + next(self.test_obj.get("ExtraLayer2")) - pdt.assert_frame_equal( - self.test_obj.get(node_sets["ExtraLayer2"]), - self.test_obj.get("Layer2"), - ) + tested = pd.concat(df for _, df in self.test_obj.get(node_sets["ExtraLayer2"])) + expected = pd.concat(df for _, df in self.test_obj.get("Layer2")) + pdt.assert_frame_equal(tested, expected) def test_pickle(self, tmp_path): pickle_path = tmp_path / "pickle.pkl" @@ -440,7 +389,6 @@ def test_pickle(self, tmp_path): # trigger some cached properties, to makes sure they aren't being pickeld self.test_obj.size self.test_obj.property_names - self.test_obj.property_dtypes with open(pickle_path, "wb") as fd: pickle.dump(self.test_obj, fd)