Browse Source

Add custom exposed type using dataclass

Toan Quach 1 year ago
parent
commit
a9cfde524c

+ 1 - 1
taipy/core/data/based_custom_exposed_type.py

@@ -30,5 +30,5 @@ class BasedCustomExposedType:
         return self.__column_names
 
     @property
-    def to_json(self):
+    def to_dict(self):
         return {col: getattr(self, col) for col in self.__column_names}

+ 13 - 9
taipy/core/data/csv.py

@@ -11,6 +11,7 @@
 
 import csv
 import os
+from dataclasses import asdict, is_dataclass
 from datetime import datetime, timedelta
 from os.path import isfile
 from typing import Any, Dict, List, Optional, Set
@@ -225,19 +226,22 @@ class CSVDataNode(DataNode, _AbstractFileDataNode, _AbstractTabularDataNode):
             return data
         elif exposed_type == self._EXPOSED_TYPE_NUMPY and isinstance(data, np.ndarray):
             return pd.DataFrame(data)
-        elif (
-            isinstance(data, list)
-            and not isinstance(exposed_type, str)
-            and all(isinstance(row, exposed_type) for row in data)
-        ):
-            return pd.DataFrame.from_records([row.to_dict() for row in data])
+        elif isinstance(data, list) and not isinstance(exposed_type, str):
+            if all(is_dataclass(row) for row in data):
+                return pd.DataFrame.from_records([asdict(row) for row in data])
+            # return pd.DataFrame.from_records([row.to_dict() for row in data])
         else:
             return pd.DataFrame(data)
 
     def _write(self, data: Any):
-        self.__convert_data_to_dataframe(data).to_csv(
-            self._path, index=False, encoding=self.properties[self.__ENCODING_KEY]
-        )
+        if self.properties[self.__HAS_HEADER_PROPERTY]:
+            self.__convert_data_to_dataframe(data).to_csv(
+                self._path, index=False, encoding=self.properties[self.__ENCODING_KEY]
+            )
+        else:
+            self.__convert_data_to_dataframe(data).to_csv(
+                self._path, index=False, encoding=self.properties[self.__ENCODING_KEY], header=None
+            )
 
     def write_with_column_names(self, data: Any, columns: Optional[List[str]] = None, job_id: Optional[JobId] = None):
         """Write a selection of columns.

+ 2 - 234
tests/core/data/test_csv_data_node.py

@@ -14,10 +14,8 @@ import pathlib
 from datetime import datetime
 from time import sleep
 
-import numpy as np
 import pandas as pd
 import pytest
-from pandas.testing import assert_frame_equal
 
 from taipy.config.common.scope import Scope
 from taipy.config.config import Config
@@ -25,8 +23,7 @@ from taipy.config.exceptions.exceptions import InvalidConfigurationId
 from taipy.core.data._data_manager import _DataManager
 from taipy.core.data.csv import CSVDataNode
 from taipy.core.data.data_node_id import DataNodeId
-from taipy.core.data.operator import JoinOperator, Operator
-from taipy.core.exceptions.exceptions import InvalidExposedType, NoData
+from taipy.core.exceptions.exceptions import InvalidExposedType
 
 
 @pytest.fixture(scope="function", autouse=True)
@@ -65,9 +62,7 @@ class TestCSVDataNode:
         assert dn.exposed_type == "pandas"
 
         with pytest.raises(InvalidConfigurationId):
-            dn = CSVDataNode(
-                "foo bar", Scope.SCENARIO, properties={"path": path, "has_header": False, "name": "super name"}
-            )
+            CSVDataNode("foo bar", Scope.SCENARIO, properties={"path": path, "has_header": False, "name": "super name"})
 
     def test_modin_deprecated_in_favor_of_pandas(self):
         path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/example.csv")
@@ -117,146 +112,6 @@ class TestCSVDataNode:
         dn = CSVDataNode("foo", Scope.SCENARIO, DataNodeId("dn_id"), properties=properties)
         assert os.path.exists(dn.path) is exists
 
-    def test_read_with_header_pandas(self):
-        not_existing_csv = CSVDataNode("foo", Scope.SCENARIO, properties={"path": "WRONG.csv", "has_header": True})
-        with pytest.raises(NoData):
-            assert not_existing_csv.read() is None
-            not_existing_csv.read_or_raise()
-
-        path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/example.csv")
-        # # Create CSVDataNode without exposed_type (Default is pandas.DataFrame)
-        csv_data_node_as_pandas = CSVDataNode("bar", Scope.SCENARIO, properties={"path": path})
-        data_pandas = csv_data_node_as_pandas.read()
-        assert isinstance(data_pandas, pd.DataFrame)
-        assert len(data_pandas) == 10
-        assert np.array_equal(data_pandas.to_numpy(), pd.read_csv(path).to_numpy())
-
-    def test_read_with_header_numpy(self):
-        path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/example.csv")
-        # Create CSVDataNode with numpy exposed_type
-        csv_data_node_as_numpy = CSVDataNode(
-            "bar", Scope.SCENARIO, properties={"path": path, "has_header": True, "exposed_type": "numpy"}
-        )
-        data_numpy = csv_data_node_as_numpy.read()
-        assert isinstance(data_numpy, np.ndarray)
-        assert len(data_numpy) == 10
-        assert np.array_equal(data_numpy, pd.read_csv(path).to_numpy())
-
-    def test_read_with_header_custom_exposed_type(self):
-        path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/example.csv")
-        csv_data_node_as_pandas = CSVDataNode("bar", Scope.SCENARIO, properties={"path": path})
-        data_pandas = csv_data_node_as_pandas.read()
-
-        path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/example.csv")
-        # Create the same CSVDataNode but with custom exposed_type
-        csv_data_node_as_custom_object = CSVDataNode(
-            "bar", Scope.SCENARIO, properties={"path": path, "exposed_type": MyCustomObject}
-        )
-        data_custom = csv_data_node_as_custom_object.read()
-        assert isinstance(data_custom, list)
-        assert len(data_custom) == 10
-
-        for (_, row_pandas), row_custom in zip(data_pandas.iterrows(), data_custom):
-            assert isinstance(row_custom, MyCustomObject)
-            assert row_pandas["id"] == row_custom.id
-            assert str(row_pandas["integer"]) == row_custom.integer
-            assert row_pandas["text"] == row_custom.text
-
-    def test_read_without_header(self):
-        not_existing_csv = CSVDataNode("foo", Scope.SCENARIO, properties={"path": "WRONG.csv", "has_header": False})
-        with pytest.raises(NoData):
-            assert not_existing_csv.read() is None
-            not_existing_csv.read_or_raise()
-
-        path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/example.csv")
-        # Create CSVDataNode without exposed_type (Default is pandas.DataFrame)
-        csv_data_node_as_pandas = CSVDataNode("bar", Scope.SCENARIO, properties={"path": path, "has_header": False})
-        data_pandas = csv_data_node_as_pandas.read()
-        assert isinstance(data_pandas, pd.DataFrame)
-        assert len(data_pandas) == 11
-        assert np.array_equal(data_pandas.to_numpy(), pd.read_csv(path, header=None).to_numpy())
-
-        # Create CSVDataNode with numpy exposed_type
-        csv_data_node_as_numpy = CSVDataNode(
-            "qux", Scope.SCENARIO, properties={"path": path, "has_header": False, "exposed_type": "numpy"}
-        )
-        data_numpy = csv_data_node_as_numpy.read()
-        assert isinstance(data_numpy, np.ndarray)
-        assert len(data_numpy) == 11
-        assert np.array_equal(data_numpy, pd.read_csv(path, header=None).to_numpy())
-
-        # Create the same CSVDataNode but with custom exposed_type
-        csv_data_node_as_custom_object = CSVDataNode(
-            "quux", Scope.SCENARIO, properties={"path": path, "has_header": False, "exposed_type": MyCustomObject}
-        )
-        data_custom = csv_data_node_as_custom_object.read()
-        assert isinstance(data_custom, list)
-        assert len(data_custom) == 11
-
-        for (_, row_pandas), row_custom in zip(data_pandas.iterrows(), data_custom):
-            assert isinstance(row_custom, MyCustomObject)
-            assert row_pandas[0] == row_custom.id
-            assert str(row_pandas[1]) == row_custom.integer
-            assert row_pandas[2] == row_custom.text
-
-    @pytest.mark.parametrize(
-        "content",
-        [
-            ([{"a": 11, "b": 22, "c": 33}, {"a": 44, "b": 55, "c": 66}]),
-            (pd.DataFrame([{"a": 11, "b": 22, "c": 33}, {"a": 44, "b": 55, "c": 66}])),
-            ([[11, 22, 33], [44, 55, 66]]),
-        ],
-    )
-    def test_append(self, csv_file, default_data_frame, content):
-        csv_dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": csv_file})
-        assert_frame_equal(csv_dn.read(), default_data_frame)
-
-        csv_dn.append(content)
-        assert_frame_equal(
-            csv_dn.read(),
-            pd.concat([default_data_frame, pd.DataFrame(content, columns=["a", "b", "c"])]).reset_index(drop=True),
-        )
-
-    @pytest.mark.parametrize(
-        "content,columns",
-        [
-            ([{"a": 11, "b": 22, "c": 33}, {"a": 44, "b": 55, "c": 66}], None),
-            ([[11, 22, 33], [44, 55, 66]], None),
-            ([[11, 22, 33], [44, 55, 66]], ["e", "f", "g"]),
-        ],
-    )
-    def test_write(self, csv_file, default_data_frame, content, columns):
-        csv_dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": csv_file})
-        assert np.array_equal(csv_dn.read().values, default_data_frame.values)
-        if not columns:
-            csv_dn.write(content)
-            df = pd.DataFrame(content)
-        else:
-            csv_dn.write_with_column_names(content, columns)
-            df = pd.DataFrame(content, columns=columns)
-        assert np.array_equal(csv_dn.read().values, df.values)
-
-        csv_dn.write(None)
-        assert len(csv_dn.read()) == 0
-
-    def test_write_with_different_encoding(self, csv_file):
-        data = pd.DataFrame([{"≥a": 1, "b": 2}])
-
-        utf8_dn = CSVDataNode("utf8_dn", Scope.SCENARIO, properties={"default_path": csv_file})
-        utf16_dn = CSVDataNode("utf16_dn", Scope.SCENARIO, properties={"default_path": csv_file, "encoding": "utf-16"})
-
-        # If a file is written with utf-8 encoding, it can only be read with utf-8, not utf-16 encoding
-        utf8_dn.write(data)
-        assert np.array_equal(utf8_dn.read(), data)
-        with pytest.raises(UnicodeError):
-            utf16_dn.read()
-
-        # If a file is written with utf-16 encoding, it can only be read with utf-16, not utf-8 encoding
-        utf16_dn.write(data)
-        assert np.array_equal(utf16_dn.read(), data)
-        with pytest.raises(UnicodeError):
-            utf8_dn.read()
-
     def test_set_path(self):
         dn = CSVDataNode("foo", Scope.SCENARIO, properties={"default_path": "foo.csv"})
         assert dn.path == "foo.csv"
@@ -280,93 +135,6 @@ class TestCSVDataNode:
         dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": path, "exposed_type": "pandas"})
         assert isinstance(dn.read(), pd.DataFrame)
 
-    def test_filter_pandas_exposed_type(self, csv_file):
-        dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": csv_file, "exposed_type": "pandas"})
-        dn.write(
-            [
-                {"foo": 1, "bar": 1},
-                {"foo": 1, "bar": 2},
-                {"foo": 1},
-                {"foo": 2, "bar": 2},
-                {"bar": 2},
-            ]
-        )
-
-        # Test datanode indexing and slicing
-        assert dn["foo"].equals(pd.Series([1, 1, 1, 2, None]))
-        assert dn["bar"].equals(pd.Series([1, 2, None, 2, 2]))
-        assert dn[:2].equals(pd.DataFrame([{"foo": 1.0, "bar": 1.0}, {"foo": 1.0, "bar": 2.0}]))
-
-        # Test filter data
-        filtered_by_filter_method = dn.filter(("foo", 1, Operator.EQUAL))
-        filtered_by_indexing = dn[dn["foo"] == 1]
-        expected_data = pd.DataFrame([{"foo": 1.0, "bar": 1.0}, {"foo": 1.0, "bar": 2.0}, {"foo": 1.0}])
-        assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
-        assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
-
-        filtered_by_filter_method = dn.filter(("foo", 1, Operator.NOT_EQUAL))
-        filtered_by_indexing = dn[dn["foo"] != 1]
-        expected_data = pd.DataFrame([{"foo": 2.0, "bar": 2.0}, {"bar": 2.0}])
-        assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
-        assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
-
-        filtered_by_filter_method = dn.filter(("bar", 2, Operator.EQUAL))
-        filtered_by_indexing = dn[dn["bar"] == 2]
-        expected_data = pd.DataFrame([{"foo": 1.0, "bar": 2.0}, {"foo": 2.0, "bar": 2.0}, {"bar": 2.0}])
-        assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
-        assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
-
-        filtered_by_filter_method = dn.filter([("bar", 1, Operator.EQUAL), ("bar", 2, Operator.EQUAL)], JoinOperator.OR)
-        filtered_by_indexing = dn[(dn["bar"] == 1) | (dn["bar"] == 2)]
-        expected_data = pd.DataFrame(
-            [
-                {"foo": 1.0, "bar": 1.0},
-                {"foo": 1.0, "bar": 2.0},
-                {"foo": 2.0, "bar": 2.0},
-                {"bar": 2.0},
-            ]
-        )
-        assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
-        assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
-
-    def test_filter_numpy_exposed_type(self, csv_file):
-        dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": csv_file, "exposed_type": "numpy"})
-        dn.write(
-            np.array(
-                [
-                    [1, 1],
-                    [1, 2],
-                    [1, 3],
-                    [2, 1],
-                    [2, 2],
-                    [2, 3],
-                ]
-            )
-        )
-
-        # Test datanode indexing and slicing
-        assert np.array_equal(dn[0], np.array([1, 1]))
-        assert np.array_equal(dn[1], np.array([1, 2]))
-        assert np.array_equal(dn[:3], np.array([[1, 1], [1, 2], [1, 3]]))
-        assert np.array_equal(dn[:, 0], np.array([1, 1, 1, 2, 2, 2]))
-        assert np.array_equal(dn[1:4, :1], np.array([[1], [1], [2]]))
-
-        # Test filter data
-        assert np.array_equal(dn.filter((0, 1, Operator.EQUAL)), np.array([[1, 1], [1, 2], [1, 3]]))
-        assert np.array_equal(dn[dn[:, 0] == 1], np.array([[1, 1], [1, 2], [1, 3]]))
-
-        assert np.array_equal(dn.filter((0, 1, Operator.NOT_EQUAL)), np.array([[2, 1], [2, 2], [2, 3]]))
-        assert np.array_equal(dn[dn[:, 0] != 1], np.array([[2, 1], [2, 2], [2, 3]]))
-
-        assert np.array_equal(dn.filter((1, 2, Operator.EQUAL)), np.array([[1, 2], [2, 2]]))
-        assert np.array_equal(dn[dn[:, 1] == 2], np.array([[1, 2], [2, 2]]))
-
-        assert np.array_equal(
-            dn.filter([(1, 1, Operator.EQUAL), (1, 2, Operator.EQUAL)], JoinOperator.OR),
-            np.array([[1, 1], [1, 2], [2, 1], [2, 2]]),
-        )
-        assert np.array_equal(dn[(dn[:, 1] == 1) | (dn[:, 1] == 2)], np.array([[1, 1], [1, 2], [2, 1], [2, 2]]))
-
     def test_raise_error_invalid_exposed_type(self):
         path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/example.csv")
         with pytest.raises(InvalidExposedType):

+ 126 - 0
tests/core/data/test_filter_csv_data_node.py

@@ -0,0 +1,126 @@
+# Copyright 2021-2024 Avaiga Private Limited
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+#        http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
+# an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations under the License.
+
+import os
+import pathlib
+
+import numpy as np
+import pandas as pd
+import pytest
+from pandas.testing import assert_frame_equal
+
+from taipy.config.common.scope import Scope
+from taipy.core.data.csv import CSVDataNode
+from taipy.core.data.operator import JoinOperator, Operator
+
+
+@pytest.fixture(scope="function", autouse=True)
+def cleanup():
+    yield
+    path = os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/temp.csv")
+    if os.path.isfile(path):
+        os.remove(path)
+
+
+class MyCustomObject:
+    def __init__(self, id, integer, text):
+        self.id = id
+        self.integer = integer
+        self.text = text
+
+
+def test_filter_pandas_exposed_type(csv_file):
+    dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": csv_file, "exposed_type": "pandas"})
+    dn.write(
+        [
+            {"foo": 1, "bar": 1},
+            {"foo": 1, "bar": 2},
+            {"foo": 1},
+            {"foo": 2, "bar": 2},
+            {"bar": 2},
+        ]
+    )
+
+    # Test datanode indexing and slicing
+    assert dn["foo"].equals(pd.Series([1, 1, 1, 2, None]))
+    assert dn["bar"].equals(pd.Series([1, 2, None, 2, 2]))
+    assert dn[:2].equals(pd.DataFrame([{"foo": 1.0, "bar": 1.0}, {"foo": 1.0, "bar": 2.0}]))
+
+    # Test filter data
+    filtered_by_filter_method = dn.filter(("foo", 1, Operator.EQUAL))
+    filtered_by_indexing = dn[dn["foo"] == 1]
+    expected_data = pd.DataFrame([{"foo": 1.0, "bar": 1.0}, {"foo": 1.0, "bar": 2.0}, {"foo": 1.0}])
+    assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
+    assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
+
+    filtered_by_filter_method = dn.filter(("foo", 1, Operator.NOT_EQUAL))
+    filtered_by_indexing = dn[dn["foo"] != 1]
+    expected_data = pd.DataFrame([{"foo": 2.0, "bar": 2.0}, {"bar": 2.0}])
+    assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
+    assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
+
+    filtered_by_filter_method = dn.filter(("bar", 2, Operator.EQUAL))
+    filtered_by_indexing = dn[dn["bar"] == 2]
+    expected_data = pd.DataFrame([{"foo": 1.0, "bar": 2.0}, {"foo": 2.0, "bar": 2.0}, {"bar": 2.0}])
+    assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
+    assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
+
+    filtered_by_filter_method = dn.filter([("bar", 1, Operator.EQUAL), ("bar", 2, Operator.EQUAL)], JoinOperator.OR)
+    filtered_by_indexing = dn[(dn["bar"] == 1) | (dn["bar"] == 2)]
+    expected_data = pd.DataFrame(
+        [
+            {"foo": 1.0, "bar": 1.0},
+            {"foo": 1.0, "bar": 2.0},
+            {"foo": 2.0, "bar": 2.0},
+            {"bar": 2.0},
+        ]
+    )
+    assert_frame_equal(filtered_by_filter_method.reset_index(drop=True), expected_data)
+    assert_frame_equal(filtered_by_indexing.reset_index(drop=True), expected_data)
+
+
+def test_filter_numpy_exposed_type(csv_file):
+    dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": csv_file, "exposed_type": "numpy"})
+    dn.write(
+        np.array(
+            [
+                [1, 1],
+                [1, 2],
+                [1, 3],
+                [2, 1],
+                [2, 2],
+                [2, 3],
+            ]
+        )
+    )
+
+    # Test datanode indexing and slicing
+    assert np.array_equal(dn[0], np.array([1, 1]))
+    assert np.array_equal(dn[1], np.array([1, 2]))
+    assert np.array_equal(dn[:3], np.array([[1, 1], [1, 2], [1, 3]]))
+    assert np.array_equal(dn[:, 0], np.array([1, 1, 1, 2, 2, 2]))
+    assert np.array_equal(dn[1:4, :1], np.array([[1], [1], [2]]))
+
+    # Test filter data
+    assert np.array_equal(dn.filter((0, 1, Operator.EQUAL)), np.array([[1, 1], [1, 2], [1, 3]]))
+    assert np.array_equal(dn[dn[:, 0] == 1], np.array([[1, 1], [1, 2], [1, 3]]))
+
+    assert np.array_equal(dn.filter((0, 1, Operator.NOT_EQUAL)), np.array([[2, 1], [2, 2], [2, 3]]))
+    assert np.array_equal(dn[dn[:, 0] != 1], np.array([[2, 1], [2, 2], [2, 3]]))
+
+    assert np.array_equal(dn.filter((1, 2, Operator.EQUAL)), np.array([[1, 2], [2, 2]]))
+    assert np.array_equal(dn[dn[:, 1] == 2], np.array([[1, 2], [2, 2]]))
+
+    assert np.array_equal(
+        dn.filter([(1, 1, Operator.EQUAL), (1, 2, Operator.EQUAL)], JoinOperator.OR),
+        np.array([[1, 1], [1, 2], [2, 1], [2, 2]]),
+    )
+    assert np.array_equal(dn[(dn[:, 1] == 1) | (dn[:, 1] == 2)], np.array([[1, 1], [1, 2], [2, 1], [2, 2]]))

+ 125 - 0
tests/core/data/test_read_csv_data_node.py

@@ -0,0 +1,125 @@
+# Copyright 2021-2024 Avaiga Private Limited
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+#        http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
+# an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations under the License.
+
+import dataclasses
+import os
+import pathlib
+
+import numpy as np
+import pandas as pd
+import pytest
+
+from taipy.config.common.scope import Scope
+from taipy.core.data.csv import CSVDataNode
+from taipy.core.exceptions.exceptions import NoData
+
+DATA_SAMPLE_PATH = "data_sample/example.csv"
+
+
+@dataclasses.dataclass
+class MyCustomObject:
+    id: int
+    integer: int
+    text: str
+
+
+def test_raise_no_data_with_header():
+    not_existing_csv = CSVDataNode("foo", Scope.SCENARIO, properties={"path": "WRONG.csv", "has_header": True})
+    with pytest.raises(NoData):
+        assert not_existing_csv.read() is None
+        not_existing_csv.read_or_raise()
+
+
+def test_read_with_header_pandas():
+    path = os.path.join(pathlib.Path(__file__).parent.resolve(), DATA_SAMPLE_PATH)
+
+    csv_data_node_as_pandas = CSVDataNode("bar", Scope.SCENARIO, properties={"path": path})
+    data_pandas = csv_data_node_as_pandas.read()
+    assert isinstance(data_pandas, pd.DataFrame)
+    assert len(data_pandas) == 10
+    assert np.array_equal(data_pandas.to_numpy(), pd.read_csv(path).to_numpy())
+
+
+def test_read_with_header_numpy():
+    path = os.path.join(pathlib.Path(__file__).parent.resolve(), DATA_SAMPLE_PATH)
+
+    csv_data_node_as_numpy = CSVDataNode(
+        "bar", Scope.SCENARIO, properties={"path": path, "has_header": True, "exposed_type": "numpy"}
+    )
+    data_numpy = csv_data_node_as_numpy.read()
+    assert isinstance(data_numpy, np.ndarray)
+    assert len(data_numpy) == 10
+    assert np.array_equal(data_numpy, pd.read_csv(path).to_numpy())
+
+
+def test_read_with_header_custom_exposed_type():
+    path = os.path.join(pathlib.Path(__file__).parent.resolve(), DATA_SAMPLE_PATH)
+    data_pandas = pd.read_csv(path)
+
+    csv_data_node_as_custom_object = CSVDataNode(
+        "bar", Scope.SCENARIO, properties={"path": path, "exposed_type": MyCustomObject}
+    )
+    data_custom = csv_data_node_as_custom_object.read()
+    assert isinstance(data_custom, list)
+    assert len(data_custom) == 10
+
+    for (_, row_pandas), row_custom in zip(data_pandas.iterrows(), data_custom):
+        assert isinstance(row_custom, MyCustomObject)
+        assert row_pandas["id"] == row_custom.id
+        assert str(row_pandas["integer"]) == row_custom.integer
+        assert row_pandas["text"] == row_custom.text
+
+
+def test_raise_no_data_without_header():
+    not_existing_csv = CSVDataNode("foo", Scope.SCENARIO, properties={"path": "WRONG.csv", "has_header": False})
+    with pytest.raises(NoData):
+        assert not_existing_csv.read() is None
+        not_existing_csv.read_or_raise()
+
+
+def test_read_without_header_pandas():
+    path = os.path.join(pathlib.Path(__file__).parent.resolve(), DATA_SAMPLE_PATH)
+
+    csv_data_node_as_pandas = CSVDataNode("bar", Scope.SCENARIO, properties={"path": path, "has_header": False})
+    data_pandas = csv_data_node_as_pandas.read()
+    assert isinstance(data_pandas, pd.DataFrame)
+    assert len(data_pandas) == 11
+    assert np.array_equal(data_pandas.to_numpy(), pd.read_csv(path, header=None).to_numpy())
+
+
+def test_read_without_header_numpy():
+    path = os.path.join(pathlib.Path(__file__).parent.resolve(), DATA_SAMPLE_PATH)
+
+    csv_data_node_as_numpy = CSVDataNode(
+        "qux", Scope.SCENARIO, properties={"path": path, "has_header": False, "exposed_type": "numpy"}
+    )
+    data_numpy = csv_data_node_as_numpy.read()
+    assert isinstance(data_numpy, np.ndarray)
+    assert len(data_numpy) == 11
+    assert np.array_equal(data_numpy, pd.read_csv(path, header=None).to_numpy())
+
+
+def test_read_without_header_custom_exposed_type():
+    path = os.path.join(pathlib.Path(__file__).parent.resolve(), DATA_SAMPLE_PATH)
+
+    csv_data_node_as_custom_object = CSVDataNode(
+        "quux", Scope.SCENARIO, properties={"path": path, "has_header": False, "exposed_type": MyCustomObject}
+    )
+    data_custom = csv_data_node_as_custom_object.read()
+    assert isinstance(data_custom, list)
+    assert len(data_custom) == 11
+
+    data_pandas = pd.read_csv(path, header=None)
+    for (_, row_pandas), row_custom in zip(data_pandas.iterrows(), data_custom):
+        assert isinstance(row_custom, MyCustomObject)
+        assert row_pandas[0] == row_custom.id
+        assert str(row_pandas[1]) == row_custom.integer
+        assert row_pandas[2] == row_custom.text

+ 180 - 0
tests/core/data/test_write_csv_data_node.py

@@ -0,0 +1,180 @@
+# Copyright 2021-2024 Avaiga Private Limited
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+#        http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
+# an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations under the License.
+
+import dataclasses
+import os
+import pathlib
+
+import numpy as np
+import pandas as pd
+import pytest
+from pandas.testing import assert_frame_equal
+
+from taipy.config.common.scope import Scope
+from taipy.core.data.csv import CSVDataNode
+
+
+@pytest.fixture(scope="function")
+def tmp_csv_file():
+    return os.path.join(pathlib.Path(__file__).parent.resolve(), "data_sample/temp.csv")
+
+
+@pytest.fixture(scope="function", autouse=True)
+def cleanup(tmp_csv_file):
+    yield
+    if os.path.isfile(tmp_csv_file):
+        os.remove(tmp_csv_file)
+
+
+@dataclasses.dataclass
+class MyCustomObject:
+    id: int
+    integer: int
+    text: str
+
+    def __eq__(self, val) -> bool:
+        return self.id == val.id and self.integer == val.integer and self.text == val.text
+
+    def __post_init__(self):
+        for field in dataclasses.fields(self):
+            value = getattr(self, field.name)
+            if not isinstance(value, field.type):
+                setattr(self, field.name, field.type(value))
+
+
+@pytest.mark.parametrize(
+    "content",
+    [
+        ([{"a": 11, "b": 22, "c": 33}, {"a": 44, "b": 55, "c": 66}]),
+        (pd.DataFrame([{"a": 11, "b": 22, "c": 33}, {"a": 44, "b": 55, "c": 66}])),
+        ([[11, 22, 33], [44, 55, 66]]),
+    ],
+)
+def test_append(csv_file, default_data_frame, content):
+    csv_dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": csv_file})
+    assert_frame_equal(csv_dn.read(), default_data_frame)
+
+    csv_dn.append(content)
+    assert_frame_equal(
+        csv_dn.read(),
+        pd.concat([default_data_frame, pd.DataFrame(content, columns=["a", "b", "c"])]).reset_index(drop=True),
+    )
+
+
+def test_write_with_header_pandas(tmp_csv_file):
+    csv_dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": tmp_csv_file})
+
+    df = pd.DataFrame([{"a": 1, "b": 2, "c": 3}, {"a": 4, "b": 5, "c": 6}])
+    csv_dn.write(df)
+    assert pd.DataFrame.equals(csv_dn.read(), df)
+
+    csv_dn.write(df["a"])
+    assert pd.DataFrame.equals(csv_dn.read(), df[["a"]])
+
+    series = pd.Series([1, 2, 3])
+    csv_dn.write(series)
+    assert np.array_equal(csv_dn.read().to_numpy(), pd.DataFrame(series).to_numpy())
+
+    csv_dn.write(None)
+    assert csv_dn.read().empty
+
+
+def test_write_with_header_numpy(tmp_csv_file):
+    csv_dn = CSVDataNode("bar", Scope.SCENARIO, properties={"path": tmp_csv_file, "exposed_type": "numpy"})
+
+    arr = np.array([[1], [2], [3], [4], [5]])
+    csv_dn.write(arr)
+    assert np.array_equal(csv_dn.read(), arr)
+
+    arr = arr[0:3]
+    csv_dn.write(arr)
+    assert np.array_equal(csv_dn.read(), arr)
+
+    csv_dn.write(None)
+    assert csv_dn.read().size == 0
+
+
+def test_write_with_header_custom_exposed_type(tmp_csv_file):
+    csv_dn = CSVDataNode("bar", Scope.SCENARIO, properties={"path": tmp_csv_file, "exposed_type": MyCustomObject})
+
+    data = [MyCustomObject(0, 1, "hi"), MyCustomObject(1, 2, "world"), MyCustomObject(2, 3, "text")]
+    csv_dn.write(data)
+    assert all(actual == expected for actual, expected in zip(csv_dn.read(), data))
+
+    csv_dn.write(None)
+    assert csv_dn.read() == []
+
+
+def test_write_without_header_pandas(tmp_csv_file):
+    csv_dn = CSVDataNode("foo", Scope.SCENARIO, properties={"path": tmp_csv_file, "has_header": False})
+
+    df = pd.DataFrame([*zip([1, 2, 3], [4, 5, 6])])
+    csv_dn.write(df)
+    assert pd.DataFrame.equals(csv_dn.read(), df)
+
+    csv_dn.write(df[0])
+    assert pd.DataFrame.equals(csv_dn.read(), df[[0]])
+
+    series = pd.Series([1, 2, 3])
+    csv_dn.write(series)
+    assert np.array_equal(csv_dn.read().to_numpy(), pd.DataFrame(series).to_numpy())
+
+    csv_dn.write(None)
+    assert csv_dn.read().empty
+
+
+def test_write_without_header_numpy(tmp_csv_file):
+    csv_dn = CSVDataNode(
+        "bar", Scope.SCENARIO, properties={"path": tmp_csv_file, "exposed_type": "numpy", "has_header": False}
+    )
+
+    arr = np.array([[1], [2], [3], [4], [5]])
+    csv_dn.write(arr)
+    assert np.array_equal(csv_dn.read(), arr)
+
+    arr = arr[0:3]
+    csv_dn.write(arr)
+    assert np.array_equal(csv_dn.read(), arr)
+
+    csv_dn.write(None)
+    assert csv_dn.read().size == 0
+
+
+def test_write_without_header_custom_exposed_type(tmp_csv_file):
+    csv_dn = CSVDataNode(
+        "bar", Scope.SCENARIO, properties={"path": tmp_csv_file, "exposed_type": MyCustomObject, "has_header": False}
+    )
+
+    data = [MyCustomObject(0, 1, "hi"), MyCustomObject(1, 2, "world"), MyCustomObject(2, 3, "text")]
+    csv_dn.write(data)
+    assert all(actual == expected for actual, expected in zip(csv_dn.read(), data))
+
+    csv_dn.write(None)
+    assert csv_dn.read() == []
+
+
+def test_write_with_different_encoding(csv_file):
+    data = pd.DataFrame([{"≥a": 1, "b": 2}])
+
+    utf8_dn = CSVDataNode("utf8_dn", Scope.SCENARIO, properties={"default_path": csv_file})
+    utf16_dn = CSVDataNode("utf16_dn", Scope.SCENARIO, properties={"default_path": csv_file, "encoding": "utf-16"})
+
+    # If a file is written with utf-8 encoding, it can only be read with utf-8, not utf-16 encoding
+    utf8_dn.write(data)
+    assert np.array_equal(utf8_dn.read(), data)
+    with pytest.raises(UnicodeError):
+        utf16_dn.read()
+
+    # If a file is written with utf-16 encoding, it can only be read with utf-16, not utf-8 encoding
+    utf16_dn.write(data)
+    assert np.array_equal(utf16_dn.read(), data)
+    with pytest.raises(UnicodeError):
+        utf8_dn.read()