test_sequence_manager.py 37 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899
  1. # Copyright 2021-2025 Avaiga Private Limited
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
  4. # the License. You may obtain a copy of the License at
  5. #
  6. # http://www.apache.org/licenses/LICENSE-2.0
  7. #
  8. # Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
  9. # an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
  10. # specific language governing permissions and limitations under the License.
  11. from typing import Callable, Iterable, Optional
  12. from unittest import mock
  13. from unittest.mock import ANY
  14. import pytest
  15. from taipy import Scope
  16. from taipy.common.config import Config
  17. from taipy.core._orchestrator._orchestrator import _Orchestrator
  18. from taipy.core._version._version_manager import _VersionManager
  19. from taipy.core.common import _utils
  20. from taipy.core.common._utils import _Subscriber
  21. from taipy.core.data._data_manager import _DataManager
  22. from taipy.core.data.in_memory import InMemoryDataNode
  23. from taipy.core.exceptions.exceptions import (
  24. InvalidSequenceId,
  25. ModelNotFound,
  26. NonExistingSequence,
  27. SequenceAlreadyExists,
  28. SequenceBelongsToNonExistingScenario,
  29. )
  30. from taipy.core.job._job_manager import _JobManager
  31. from taipy.core.scenario._scenario_manager import _ScenarioManager
  32. from taipy.core.scenario.scenario import Scenario
  33. from taipy.core.sequence._sequence_manager import _SequenceManager
  34. from taipy.core.sequence._sequence_manager_factory import _SequenceManagerFactory
  35. from taipy.core.sequence.sequence import Sequence
  36. from taipy.core.sequence.sequence_id import SequenceId
  37. from taipy.core.task._task_manager import _TaskManager
  38. from taipy.core.task.task import Task
  39. from taipy.core.task.task_id import TaskId
  40. from tests.core.utils.NotifyMock import NotifyMock
  41. def test_breakdown_sequence_id():
  42. with pytest.raises(InvalidSequenceId):
  43. _SequenceManager._breakdown_sequence_id("scenario_id")
  44. with pytest.raises(InvalidSequenceId):
  45. _SequenceManager._breakdown_sequence_id("sequence_id")
  46. with pytest.raises(InvalidSequenceId):
  47. _SequenceManager._breakdown_sequence_id("SEQUENCE_sequence_id")
  48. with pytest.raises(InvalidSequenceId):
  49. _SequenceManager._breakdown_sequence_id("SCENARIO_scenario_id")
  50. with pytest.raises(InvalidSequenceId):
  51. _SequenceManager._breakdown_sequence_id("sequence_SCENARIO_scenario_id")
  52. with pytest.raises(InvalidSequenceId):
  53. _SequenceManager._breakdown_sequence_id("SEQUENCE_sequence_scenario_id")
  54. sequence_name, scenario_id = _SequenceManager._breakdown_sequence_id("SEQUENCE_sequence_SCENARIO_scenario")
  55. assert sequence_name == "sequence" and scenario_id == "SCENARIO_scenario"
  56. sequence_name, scenario_id = _SequenceManager._breakdown_sequence_id("SEQUENCEsequenceSCENARIO_scenario")
  57. assert sequence_name == "sequence" and scenario_id == "SCENARIO_scenario"
  58. def test_raise_sequence_does_not_belong_to_scenario():
  59. with pytest.raises(SequenceBelongsToNonExistingScenario):
  60. sequence = Sequence({"name": "sequence_name"}, [], "SEQUENCE_sequence_name_SCENARIO_scenario_id")
  61. _SequenceManager._update(sequence)
  62. def __init():
  63. input_dn = InMemoryDataNode("foo", Scope.SCENARIO)
  64. output_dn = InMemoryDataNode("foo", Scope.SCENARIO)
  65. _DataManager._repository._save(input_dn)
  66. _DataManager._repository._save(output_dn)
  67. task = Task("task", {}, print, [input_dn], [output_dn], TaskId("Task_task_id"))
  68. _TaskManager._repository._save(task)
  69. scenario = Scenario("scenario", {task}, {}, set())
  70. _ScenarioManager._repository._save(scenario)
  71. return scenario, task
  72. def test_save_and_get_sequence_no_existing_sequence():
  73. scenario, _ = __init()
  74. sequence_name_1 = "p1"
  75. sequence_id_1 = SequenceId(f"SEQUENCE_{sequence_name_1}_{scenario.id}")
  76. sequence_name_2 = "p2"
  77. sequence_id_2 = SequenceId(f"SEQUENCE_{sequence_name_2}_{scenario.id}")
  78. assert _SequenceManager._get(sequence_id_1) is None
  79. assert _SequenceManager._get(sequence_id_2) is None
  80. assert _SequenceManager._get("sequence") is None
  81. def test_save_and_get():
  82. scenario, task = __init()
  83. sequence_name_1 = "p1"
  84. sequence_id_1 = SequenceId(f"SEQUENCE_{sequence_name_1}_{scenario.id}")
  85. sequence_name_2 = "p2"
  86. sequence_id_2 = SequenceId(f"SEQUENCE_{sequence_name_2}_{scenario.id}")
  87. scenario.add_sequences({sequence_name_1: []})
  88. sequence_1 = scenario.sequences[sequence_name_1]
  89. assert _SequenceManager._get(sequence_id_1).id == sequence_1.id
  90. assert len(_SequenceManager._get(sequence_id_1).tasks) == 0
  91. assert _SequenceManager._get(sequence_1).id == sequence_1.id
  92. assert len(_SequenceManager._get(sequence_1).tasks) == 0
  93. assert _SequenceManager._get(sequence_id_2) is None
  94. # Save a second sequence. Now, we expect to have a total of two sequences stored
  95. scenario.add_sequences({sequence_name_2: [task]})
  96. sequence_2 = scenario.sequences[sequence_name_2]
  97. assert _SequenceManager._get(sequence_id_1).id == sequence_1.id
  98. assert len(_SequenceManager._get(sequence_id_1).tasks) == 0
  99. assert _SequenceManager._get(sequence_1).id == sequence_1.id
  100. assert len(_SequenceManager._get(sequence_1).tasks) == 0
  101. assert _SequenceManager._get(sequence_id_2).id == sequence_2.id
  102. assert len(_SequenceManager._get(sequence_id_2).tasks) == 1
  103. assert _SequenceManager._get(sequence_2).id == sequence_2.id
  104. assert len(_SequenceManager._get(sequence_2).tasks) == 1
  105. assert _TaskManager._get(task.id).id == task.id
  106. # We save the first sequence again. We expect an exception and nothing to change
  107. with pytest.raises(SequenceAlreadyExists):
  108. scenario.add_sequence(sequence_name_1, [])
  109. sequence_1 = scenario.sequences[sequence_name_1]
  110. assert _SequenceManager._get(sequence_id_1).id == sequence_1.id
  111. assert len(_SequenceManager._get(sequence_id_1).tasks) == 0
  112. assert _SequenceManager._get(sequence_1).id == sequence_1.id
  113. assert len(_SequenceManager._get(sequence_1).tasks) == 0
  114. assert _SequenceManager._get(sequence_id_2).id == sequence_2.id
  115. assert len(_SequenceManager._get(sequence_id_2).tasks) == 1
  116. assert _SequenceManager._get(sequence_2).id == sequence_2.id
  117. assert len(_SequenceManager._get(sequence_2).tasks) == 1
  118. assert _TaskManager._get(task.id).id == task.id
  119. def test_task_parent_id_set_only_when_create():
  120. scenario, task = __init()
  121. sequence_name_1 = "p1"
  122. with mock.patch("taipy.core.task._task_manager._TaskManager._update") as mck:
  123. scenario.add_sequences({sequence_name_1: [task]})
  124. mck.assert_called_once()
  125. with mock.patch("taipy.core.task._task_manager._TaskManager._update") as mck:
  126. scenario.sequences[sequence_name_1]
  127. mck.assert_not_called()
  128. def test_get_all_on_multiple_versions_environment():
  129. # Create 5 sequences from Scenario with 2 versions each
  130. for version in range(1, 3):
  131. for i in range(5):
  132. _ScenarioManager._repository._save(
  133. Scenario(
  134. f"config_id_{i+version}",
  135. [],
  136. {},
  137. [],
  138. f"SCENARIO_id_{i}_v{version}",
  139. version=f"{version}.0",
  140. sequences={"sequence": {}},
  141. )
  142. )
  143. _VersionManager._set_experiment_version("1.0")
  144. assert len(_SequenceManager._get_all()) == 5
  145. assert (
  146. len(_SequenceManager._get_all_by(filters=[{"version": "1.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 1
  147. )
  148. assert (
  149. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 0
  150. )
  151. _VersionManager._set_experiment_version("2.0")
  152. assert len(_SequenceManager._get_all()) == 5
  153. assert (
  154. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 0
  155. )
  156. assert (
  157. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v2"}])) == 1
  158. )
  159. _VersionManager._set_development_version("1.0")
  160. assert len(_SequenceManager._get_all()) == 5
  161. assert (
  162. len(_SequenceManager._get_all_by(filters=[{"version": "1.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 1
  163. )
  164. assert (
  165. len(_SequenceManager._get_all_by(filters=[{"version": "1.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v2"}])) == 0
  166. )
  167. _VersionManager._set_development_version("2.0")
  168. assert len(_SequenceManager._get_all()) == 5
  169. assert (
  170. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 0
  171. )
  172. assert (
  173. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v2"}])) == 1
  174. )
  175. def test_is_submittable():
  176. dn = InMemoryDataNode("dn", Scope.SCENARIO, properties={"default_data": 10})
  177. _DataManager._repository._save(dn)
  178. task = Task("task", {}, print, [dn])
  179. _TaskManager._repository._save(task)
  180. scenario = Scenario("scenario", {task}, {}, set())
  181. _ScenarioManager._repository._save(scenario)
  182. rc = _SequenceManager._is_submittable("some_sequence")
  183. assert not rc
  184. assert "Entity 'some_sequence' does not exist in the repository." in rc.reasons
  185. scenario.add_sequences({"sequence": [task]})
  186. sequence = scenario.sequences["sequence"]
  187. assert len(_SequenceManager._get_all()) == 1
  188. assert _SequenceManager._is_submittable(sequence)
  189. assert _SequenceManager._is_submittable(sequence.id)
  190. assert not _SequenceManager._is_submittable("Sequence_temp")
  191. assert not _SequenceManager._is_submittable("SEQUENCE_temp_SCENARIO_scenario")
  192. scenario.dn.edit_in_progress = True
  193. assert not _SequenceManager._is_submittable(sequence)
  194. assert not _SequenceManager._is_submittable(sequence.id)
  195. scenario.dn.edit_in_progress = False
  196. assert _SequenceManager._is_submittable(sequence)
  197. assert _SequenceManager._is_submittable(sequence.id)
  198. def test_submit():
  199. data_node_1 = InMemoryDataNode("foo", Scope.SCENARIO, "s1")
  200. data_node_2 = InMemoryDataNode("bar", Scope.SCENARIO, "s2")
  201. data_node_3 = InMemoryDataNode("baz", Scope.SCENARIO, "s3")
  202. data_node_4 = InMemoryDataNode("qux", Scope.SCENARIO, "s4")
  203. data_node_5 = InMemoryDataNode("quux", Scope.SCENARIO, "s5")
  204. data_node_6 = InMemoryDataNode("quuz", Scope.SCENARIO, "s6")
  205. data_node_7 = InMemoryDataNode("corge", Scope.SCENARIO, "s7")
  206. _DataManager._repository._save(data_node_1)
  207. _DataManager._repository._save(data_node_2)
  208. _DataManager._repository._save(data_node_3)
  209. _DataManager._repository._save(data_node_4)
  210. _DataManager._repository._save(data_node_5)
  211. _DataManager._repository._save(data_node_6)
  212. _DataManager._repository._save(data_node_7)
  213. task_1 = Task(
  214. "grault",
  215. {},
  216. print,
  217. [data_node_1, data_node_2],
  218. [data_node_3, data_node_4],
  219. TaskId("t1"),
  220. )
  221. task_2 = Task("garply", {}, print, [data_node_3], [data_node_5], TaskId("t2"))
  222. task_3 = Task("waldo", {}, print, [data_node_5, data_node_4], [data_node_6], TaskId("t3"))
  223. task_4 = Task("fred", {}, print, [data_node_4], [data_node_7], TaskId("t4"))
  224. _TaskManager._repository._save(task_1)
  225. _TaskManager._repository._save(task_2)
  226. _TaskManager._repository._save(task_3)
  227. _TaskManager._repository._save(task_4)
  228. scenario = Scenario("sce", {task_1, task_2, task_3, task_4}, {})
  229. sequence_name = "sequence"
  230. sequence_id = Sequence._new_id(sequence_name, scenario.id)
  231. class MockOrchestrator(_Orchestrator):
  232. submit_calls = []
  233. @classmethod
  234. def _lock_dn_output_and_create_job(
  235. cls,
  236. task: Task,
  237. submit_id: str,
  238. submit_entity_id: str,
  239. callbacks: Optional[Iterable[Callable]] = None,
  240. force: bool = False,
  241. ):
  242. cls.submit_calls.append(task)
  243. return super()._lock_dn_output_and_create_job(task, submit_id, submit_entity_id, callbacks, force)
  244. with mock.patch("taipy.core.task._task_manager._TaskManager._orchestrator", new=MockOrchestrator):
  245. # sequence does not exist. We expect an exception to be raised
  246. with pytest.raises(NonExistingSequence):
  247. _SequenceManager._submit(sequence_id)
  248. _ScenarioManager._repository._save(scenario)
  249. scenario.add_sequences({sequence_name: [task_4, task_2, task_1, task_3]})
  250. # sequence, and tasks does exist. We expect the tasks to be submitted
  251. # in a specific order
  252. sequence = scenario.sequences[sequence_name]
  253. _SequenceManager._submit(sequence.id)
  254. calls_ids = [t.id for t in _TaskManager._orchestrator().submit_calls]
  255. tasks_ids = [task_1.id, task_2.id, task_4.id, task_3.id]
  256. assert calls_ids == tasks_ids
  257. _SequenceManager._submit(sequence)
  258. calls_ids = [t.id for t in _TaskManager._orchestrator().submit_calls]
  259. tasks_ids = tasks_ids * 2
  260. assert set(calls_ids) == set(tasks_ids)
  261. def test_assign_sequence_as_parent_of_task():
  262. dn_config_1 = Config.configure_data_node("dn_1", "in_memory", scope=Scope.SCENARIO)
  263. dn_config_2 = Config.configure_data_node("dn_2", "in_memory", scope=Scope.SCENARIO)
  264. dn_config_3 = Config.configure_data_node("dn_3", "in_memory", scope=Scope.SCENARIO)
  265. task_config_1 = Config.configure_task("task_1", print, [dn_config_1], [dn_config_2])
  266. task_config_2 = Config.configure_task("task_2", print, [dn_config_2], [dn_config_3])
  267. task_config_3 = Config.configure_task("task_3", print, [dn_config_2], [dn_config_3])
  268. tasks = _TaskManager._bulk_get_or_create([task_config_1, task_config_2, task_config_3], "scenario_id")
  269. sequence_1 = _SequenceManager._create("sequence_1", [tasks[0], tasks[1]], scenario_id="scenario_id")
  270. sequence_2 = _SequenceManager._create("sequence_2", [tasks[0], tasks[2]], scenario_id="scenario_id")
  271. tasks_1 = list(sequence_1.tasks.values())
  272. tasks_2 = list(sequence_2.tasks.values())
  273. assert len(tasks_1) == 2
  274. assert len(tasks_2) == 2
  275. assert tasks_1[0].parent_ids == {sequence_1.id, sequence_2.id}
  276. assert tasks_2[0].parent_ids == {sequence_1.id, sequence_2.id}
  277. assert tasks_1[1].parent_ids == {sequence_1.id}
  278. assert tasks_2[1].parent_ids == {sequence_2.id}
  279. g = 0
  280. def mock_function_no_input_no_output():
  281. global g
  282. g += 1
  283. def mock_function_one_input_no_output(inp):
  284. global g
  285. g += inp
  286. def mock_function_no_input_one_output():
  287. global g
  288. return g
  289. def test_submit_sequence_from_tasks_with_one_or_no_input_output():
  290. # test no input and no output Task
  291. task_no_input_no_output = Task("task_no_input_no_output", {}, mock_function_no_input_no_output)
  292. scenario_1 = Scenario("scenario_1", {task_no_input_no_output}, {})
  293. _TaskManager._repository._save(task_no_input_no_output)
  294. _ScenarioManager._repository._save(scenario_1)
  295. scenario_1.add_sequences({"my_sequence_1": [task_no_input_no_output]})
  296. sequence_1 = scenario_1.sequences["my_sequence_1"]
  297. assert len(sequence_1._get_sorted_tasks()) == 1
  298. _SequenceManager._submit(sequence_1)
  299. assert g == 1
  300. # test one input and no output Task
  301. data_node_input = InMemoryDataNode("input_dn", Scope.SCENARIO, properties={"default_data": 2})
  302. task_one_input_no_output = Task(
  303. "task_one_input_no_output", {}, mock_function_one_input_no_output, input=[data_node_input]
  304. )
  305. scenario_2 = Scenario("scenario_2", {task_one_input_no_output}, {})
  306. _DataManager._repository._save(data_node_input)
  307. data_node_input.unlock_edit()
  308. _TaskManager._repository._save(task_one_input_no_output)
  309. _ScenarioManager._repository._save(scenario_2)
  310. scenario_2.add_sequences({"my_sequence_2": [task_one_input_no_output]})
  311. sequence_2 = scenario_2.sequences["my_sequence_2"]
  312. assert len(sequence_2._get_sorted_tasks()) == 1
  313. _SequenceManager._submit(sequence_2)
  314. assert g == 3
  315. # test no input and one output Task
  316. data_node_output = InMemoryDataNode("output_dn", Scope.SCENARIO, properties={"default_data": None})
  317. task_no_input_one_output = Task(
  318. "task_no_input_one_output", {}, mock_function_no_input_one_output, output=[data_node_output]
  319. )
  320. scenario_3 = Scenario("scenario_3", {task_no_input_one_output}, {})
  321. _DataManager._repository._save(data_node_output)
  322. assert data_node_output.read() is None
  323. _TaskManager._repository._save(task_no_input_one_output)
  324. _ScenarioManager._repository._save(scenario_3)
  325. scenario_3.add_sequences({"my_sequence_3": [task_no_input_one_output]})
  326. sequence_3 = scenario_3.sequences["my_sequence_3"]
  327. assert len(sequence_2._get_sorted_tasks()) == 1
  328. _SequenceManager._submit(sequence_3)
  329. assert data_node_output.read() == 3
  330. def mult_by_two(nb: int):
  331. return nb * 2
  332. def mult_by_3(nb: int):
  333. return nb * 3
  334. def test_get_or_create_data():
  335. # only create intermediate data node once
  336. dn_config_1 = Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)
  337. dn_config_2 = Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0)
  338. dn_config_6 = Config.configure_data_node("baz", "in_memory", Scope.SCENARIO, default_data=0)
  339. task_config_mult_by_two = Config.configure_task("mult_by_two", mult_by_two, [dn_config_1], dn_config_2)
  340. task_config_mult_by_3 = Config.configure_task("mult_by_3", mult_by_3, [dn_config_2], dn_config_6)
  341. # dn_1 ---> mult_by_two ---> dn_2 ---> mult_by_3 ---> dn_6
  342. scenario_config = Config.configure_scenario("scenario", [task_config_mult_by_two, task_config_mult_by_3])
  343. assert len(_DataManager._get_all()) == 0
  344. assert len(_TaskManager._get_all()) == 0
  345. scenario = _ScenarioManager._create(scenario_config)
  346. scenario.add_sequences({"by_6": list(scenario.tasks.values())})
  347. sequence = scenario.sequences["by_6"]
  348. assert sequence.properties["name"] == "by_6"
  349. assert len(_DataManager._get_all()) == 3
  350. assert len(_TaskManager._get_all()) == 2
  351. assert len(sequence._get_sorted_tasks()) == 2
  352. assert sequence.foo.read() == 1
  353. assert sequence.bar.read() == 0
  354. assert sequence.baz.read() == 0
  355. assert sequence._get_sorted_tasks()[0][0].config_id == task_config_mult_by_two.id
  356. assert sequence._get_sorted_tasks()[1][0].config_id == task_config_mult_by_3.id
  357. _SequenceManager._submit(sequence.id)
  358. assert sequence.foo.read() == 1
  359. assert sequence.bar.read() == 2
  360. assert sequence.baz.read() == 6
  361. sequence.foo.write("new data value")
  362. assert sequence.foo.read() == "new data value"
  363. assert sequence.bar.read() == 2
  364. assert sequence.baz.read() == 6
  365. sequence.bar.write(7)
  366. assert sequence.foo.read() == "new data value"
  367. assert sequence.bar.read() == 7
  368. assert sequence.baz.read() == 6
  369. with pytest.raises(AttributeError):
  370. sequence.WRONG.write(7)
  371. def notify1(*args, **kwargs): ...
  372. def notify2(*args, **kwargs): ...
  373. def notify_multi_param(*args, **kwargs): ...
  374. def test_sequence_notification_subscribe(mocker):
  375. mocker.patch("taipy.core._entity._reload._Reloader._reload", side_effect=lambda m, o: o)
  376. task_configs = [
  377. Config.configure_task(
  378. "mult_by_two",
  379. mult_by_two,
  380. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  381. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  382. )
  383. ]
  384. tasks = _TaskManager._bulk_get_or_create(task_configs=task_configs)
  385. scenario = Scenario("scenario", set(tasks), {}, sequences={"by_1": {"tasks": tasks}})
  386. _ScenarioManager._repository._save(scenario)
  387. sequence = scenario.sequences["by_1"]
  388. notify_1 = NotifyMock(sequence)
  389. notify_1.__name__ = "notify_1"
  390. notify_1.__module__ = "notify_1"
  391. notify_2 = NotifyMock(sequence)
  392. notify_2.__name__ = "notify_2"
  393. notify_2.__module__ = "notify_2"
  394. # Mocking this because NotifyMock is a class that does not loads correctly when getting the sequence
  395. # from the storage.
  396. mocker.patch.object(
  397. _utils,
  398. "_load_fct",
  399. side_effect=[notify_1, notify_1, notify_2, notify_2, notify_2, notify_2],
  400. )
  401. # test subscription
  402. callback = mock.MagicMock()
  403. _SequenceManager._submit(sequence.id, [callback])
  404. callback.assert_called()
  405. # test sequence subscribe notification
  406. _SequenceManager._subscribe(callback=notify_1, sequence=sequence)
  407. _SequenceManager._submit(sequence.id)
  408. notify_1.assert_called_3_times()
  409. notify_1.reset()
  410. # test sequence unsubscribe notification
  411. # test subscribe notification only on new job
  412. _SequenceManager._unsubscribe(callback=notify_1, sequence=sequence)
  413. _SequenceManager._subscribe(callback=notify_2, sequence=sequence)
  414. _SequenceManager._submit(sequence)
  415. notify_1.assert_not_called()
  416. notify_2.assert_called_3_times()
  417. def test_sequence_notification_subscribe_multi_param(mocker):
  418. mocker.patch("taipy.core._entity._reload._Reloader._reload", side_effect=lambda m, o: o)
  419. task_configs = [
  420. Config.configure_task(
  421. "mult_by_two",
  422. mult_by_two,
  423. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  424. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  425. )
  426. ]
  427. tasks = _TaskManager._bulk_get_or_create(task_configs)
  428. scenario = Scenario("scenario", set(tasks), {}, sequences={"by_6": {"tasks": tasks}})
  429. _ScenarioManager._repository._save(scenario)
  430. sequence = scenario.sequences["by_6"]
  431. notify = mocker.Mock()
  432. # test sequence subscribe notification
  433. _SequenceManager._subscribe(callback=notify, params=["foobar", 123, 1.2], sequence=sequence)
  434. mocker.patch.object(_SequenceManager, "_get", return_value=sequence)
  435. _SequenceManager._submit(sequence.id)
  436. # as the callback is called with Sequence/Scenario and Job objects
  437. # we can assert that is called with params plus a sequence object that we know
  438. # of and a job object that is represented by ANY in this case
  439. notify.assert_called_with("foobar", 123, 1.2, sequence, ANY)
  440. def test_sequence_notification_unsubscribe(mocker):
  441. mocker.patch("taipy.core._entity._reload._Reloader._reload", side_effect=lambda m, o: o)
  442. task_configs = [
  443. Config.configure_task(
  444. "mult_by_two",
  445. mult_by_two,
  446. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  447. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  448. )
  449. ]
  450. tasks = _TaskManager._bulk_get_or_create(task_configs)
  451. scenario = Scenario("scenario", set(tasks), {}, sequences={"by_6": {"tasks": tasks}})
  452. _ScenarioManager._repository._save(scenario)
  453. sequence = scenario.sequences["by_6"]
  454. notify_1 = notify1
  455. notify_2 = notify2
  456. _SequenceManager._subscribe(callback=notify_1, sequence=sequence)
  457. _SequenceManager._unsubscribe(callback=notify_1, sequence=sequence)
  458. _SequenceManager._subscribe(callback=notify_2, sequence=sequence)
  459. _SequenceManager._submit(sequence.id)
  460. with pytest.raises(ValueError):
  461. _SequenceManager._unsubscribe(callback=notify_1, sequence=sequence)
  462. _SequenceManager._unsubscribe(callback=notify_2, sequence=sequence)
  463. def test_sequence_notification_unsubscribe_multi_param():
  464. task_configs = [
  465. Config.configure_task(
  466. "mult_by_two",
  467. mult_by_two,
  468. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  469. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  470. )
  471. ]
  472. tasks = _TaskManager._bulk_get_or_create(task_configs)
  473. scenario = Scenario("scenario", tasks, {}, sequences={"by_6": {"tasks": tasks}})
  474. _ScenarioManager._repository._save(scenario)
  475. sequence = scenario.sequences["by_6"]
  476. _SequenceManager._subscribe(callback=notify_multi_param, params=["foobar", 123, 0], sequence=sequence)
  477. _SequenceManager._subscribe(callback=notify_multi_param, params=["foobar", 123, 1], sequence=sequence)
  478. _SequenceManager._subscribe(callback=notify_multi_param, params=["foobar", 123, 2], sequence=sequence)
  479. assert len(sequence.subscribers) == 3
  480. sequence.unsubscribe(notify_multi_param)
  481. assert len(sequence.subscribers) == 2
  482. assert _Subscriber(notify_multi_param, ["foobar", 123, 0]) not in sequence.subscribers
  483. sequence.unsubscribe(notify_multi_param, ["foobar", 123, 2])
  484. assert len(sequence.subscribers) == 1
  485. assert _Subscriber(notify_multi_param, ["foobar", 123, 2]) not in sequence.subscribers
  486. with pytest.raises(ValueError):
  487. sequence.unsubscribe(notify_multi_param, ["foobar", 123, 10000])
  488. def test_sequence_notification_subscribe_all():
  489. task_configs = [
  490. Config.configure_task(
  491. "mult_by_two",
  492. mult_by_two,
  493. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  494. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  495. )
  496. ]
  497. tasks = _TaskManager._bulk_get_or_create(task_configs)
  498. scenario = Scenario("scenario", tasks, {}, sequences={"by_6": {"tasks": tasks}, "other_sequence": {"tasks": tasks}})
  499. _ScenarioManager._repository._save(scenario)
  500. sequence = scenario.sequences["by_6"]
  501. other_sequence = scenario.sequences["other_sequence"]
  502. notify_1 = NotifyMock(sequence)
  503. _SequenceManager._subscribe(notify_1)
  504. assert len(_SequenceManager._get(sequence.id).subscribers) == 1
  505. assert len(_SequenceManager._get(other_sequence.id).subscribers) == 1
  506. def test_delete():
  507. sequence_id = "SEQUENCE_sequence_SCENARIO_scenario_id_1"
  508. with pytest.raises(ModelNotFound):
  509. _SequenceManager._delete(sequence_id)
  510. scenario_1 = Scenario("scenario_1", set(), {}, scenario_id="SCENARIO_scenario_id_1")
  511. scenario_2 = Scenario("scenario_2", set(), {}, scenario_id="SCENARIO_scenario_id_2")
  512. _ScenarioManager._repository._save(scenario_1)
  513. _ScenarioManager._repository._save(scenario_2)
  514. with pytest.raises(ModelNotFound):
  515. _SequenceManager._delete(SequenceId(sequence_id))
  516. scenario_1.add_sequences({"sequence": []})
  517. assert len(_SequenceManager._get_all()) == 1
  518. _SequenceManager._delete(SequenceId(sequence_id))
  519. assert len(_SequenceManager._get_all()) == 0
  520. scenario_1.add_sequences({"sequence": [], "sequence_1": []})
  521. assert len(_SequenceManager._get_all()) == 2
  522. _SequenceManager._delete(SequenceId(sequence_id))
  523. assert len(_SequenceManager._get_all()) == 1
  524. with pytest.raises(SequenceAlreadyExists):
  525. scenario_1.add_sequences({"sequence_1": [], "sequence_2": [], "sequence_3": []})
  526. scenario_1.add_sequences({"sequence_2": [], "sequence_3": []})
  527. scenario_2.add_sequences({"sequence_1_2": [], "sequence_2_2": []})
  528. assert len(_SequenceManager._get_all()) == 5
  529. _SequenceManager._delete_all()
  530. assert len(_SequenceManager._get_all()) == 0
  531. scenario_1.add_sequences({"sequence_1": [], "sequence_2": [], "sequence_3": [], "sequence_4": []})
  532. scenario_2.add_sequences({"sequence_1_2": [], "sequence_2_2": []})
  533. assert len(_SequenceManager._get_all()) == 6
  534. _SequenceManager._delete_many(
  535. [
  536. "SEQUENCE_sequence_1_SCENARIO_scenario_id_1",
  537. "SEQUENCE_sequence_2_SCENARIO_scenario_id_1",
  538. "SEQUENCE_sequence_1_2_SCENARIO_scenario_id_2",
  539. ]
  540. )
  541. assert len(_SequenceManager._get_all()) == 3
  542. with pytest.raises(ModelNotFound):
  543. _SequenceManager._delete_many(
  544. ["SEQUENCE_sequence_1_SCENARIO_scenario_id_1", "SEQUENCE_sequence_2_SCENARIO_scenario_id_1"]
  545. )
  546. def test_delete_version():
  547. scenario_1_0 = Scenario(
  548. "scenario_config",
  549. [],
  550. {},
  551. scenario_id="SCENARIO_id_1_v1_0",
  552. version="1.0",
  553. sequences={"sequence_1": {}, "sequence_2": {}},
  554. )
  555. scenario_1_1 = Scenario(
  556. "scenario_config",
  557. [],
  558. {},
  559. scenario_id="SCENARIO_id_1_v1_1",
  560. version="1.1",
  561. sequences={"sequence_1": {}, "sequence_2": {}},
  562. )
  563. _ScenarioManager._repository._save(scenario_1_0)
  564. _ScenarioManager._repository._save(scenario_1_1)
  565. _VersionManager._set_experiment_version("1.1")
  566. assert len(_ScenarioManager._get_all()) == 1
  567. assert len(_SequenceManager._get_all()) == 2
  568. _VersionManager._set_experiment_version("1.0")
  569. assert len(_ScenarioManager._get_all()) == 1
  570. assert len(_SequenceManager._get_all()) == 2
  571. _SequenceManager._delete_by_version("1.0")
  572. assert len(_ScenarioManager._get_all()) == 1
  573. assert len(_SequenceManager._get_all()) == 0
  574. assert len(scenario_1_0.sequences) == 0
  575. assert len(scenario_1_1.sequences) == 2
  576. _VersionManager._set_experiment_version("1.1")
  577. assert len(_ScenarioManager._get_all()) == 1
  578. assert len(_SequenceManager._get_all()) == 2
  579. assert len(scenario_1_0.sequences) == 0
  580. assert len(scenario_1_1.sequences) == 2
  581. _SequenceManager._delete_by_version("1.1")
  582. assert len(_ScenarioManager._get_all()) == 1
  583. assert len(_SequenceManager._get_all()) == 0
  584. def test_exists():
  585. scenario = Scenario("scenario", [], {}, scenario_id="SCENARIO_scenario", sequences={"sequence": {}})
  586. _ScenarioManager._repository._save(scenario)
  587. assert len(_ScenarioManager._get_all()) == 1
  588. assert len(_SequenceManager._get_all()) == 1
  589. assert not _SequenceManager._exists("SEQUENCE_sequence_not_exist_SCENARIO_scenario")
  590. assert not _SequenceManager._exists("SEQUENCE_sequence_SCENARIO_scenario_id")
  591. assert _SequenceManager._exists("SEQUENCE_sequence_SCENARIO_scenario")
  592. assert _SequenceManager._exists(scenario.sequences["sequence"])
  593. def test_hard_delete_one_single_sequence_with_scenario_data_nodes():
  594. dn_input_config = Config.configure_data_node("my_input", "in_memory", scope=Scope.SCENARIO, default_data="testing")
  595. dn_output_config = Config.configure_data_node("my_output", "in_memory", scope=Scope.SCENARIO)
  596. task_config = Config.configure_task("task_config", print, dn_input_config, dn_output_config)
  597. tasks = _TaskManager._bulk_get_or_create([task_config])
  598. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  599. _ScenarioManager._repository._save(scenario)
  600. sequence = scenario.sequences["sequence"]
  601. sequence.submit()
  602. assert len(_ScenarioManager._get_all()) == 1
  603. assert len(_SequenceManager._get_all()) == 1
  604. assert len(_TaskManager._get_all()) == 1
  605. assert len(_DataManager._get_all()) == 2
  606. assert len(_JobManager._get_all()) == 1
  607. _SequenceManager._hard_delete(sequence.id)
  608. assert len(_ScenarioManager._get_all()) == 1
  609. assert len(_SequenceManager._get_all()) == 0
  610. assert len(_TaskManager._get_all()) == 1
  611. assert len(_DataManager._get_all()) == 2
  612. assert len(_JobManager._get_all()) == 1
  613. def test_hard_delete_one_single_sequence_with_cycle_data_nodes():
  614. dn_input_config = Config.configure_data_node("my_input", "in_memory", scope=Scope.CYCLE, default_data="testing")
  615. dn_output_config = Config.configure_data_node("my_output", "in_memory", scope=Scope.CYCLE)
  616. task_config = Config.configure_task("task_config", print, dn_input_config, dn_output_config)
  617. tasks = _TaskManager._bulk_get_or_create([task_config])
  618. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  619. _ScenarioManager._repository._save(scenario)
  620. sequence = scenario.sequences["sequence"]
  621. sequence.submit()
  622. assert len(_ScenarioManager._get_all()) == 1
  623. assert len(_SequenceManager._get_all()) == 1
  624. assert len(_TaskManager._get_all()) == 1
  625. assert len(_DataManager._get_all()) == 2
  626. assert len(_JobManager._get_all()) == 1
  627. _SequenceManager._hard_delete(sequence.id)
  628. assert len(_ScenarioManager._get_all()) == 1
  629. assert len(_SequenceManager._get_all()) == 0
  630. assert len(_TaskManager._get_all()) == 1
  631. assert len(_DataManager._get_all()) == 2
  632. assert len(_JobManager._get_all()) == 1
  633. def test_hard_delete_shared_entities():
  634. input_dn = Config.configure_data_node("my_input", "in_memory", default_data="testing")
  635. intermediate_dn = Config.configure_data_node("my_inter", "in_memory")
  636. output_dn = Config.configure_data_node("my_output", "in_memory")
  637. task_1 = Config.configure_task("task_1", print, input_dn, intermediate_dn)
  638. task_2 = Config.configure_task("task_2", print, intermediate_dn, output_dn)
  639. scenario_config = Config.configure_scenario("sc", [task_1, task_2])
  640. import taipy as tp
  641. scenario_1 = tp.create_scenario(scenario_config, name="scenario_1")
  642. scenario_1.add_sequence("sequence", [scenario_1.task_1, scenario_1.task_2])
  643. scenario_2 = tp.create_scenario(scenario_config, name="scenario_2")
  644. scenario_2.add_sequence("sequence", [scenario_2.task_1, scenario_2.task_2])
  645. sequence_1 = scenario_1.sequences["sequence"]
  646. sequence_2 = scenario_2.sequences["sequence"]
  647. _SequenceManager._submit(sequence_1.id)
  648. _SequenceManager._submit(sequence_2.id)
  649. assert len(_ScenarioManager._get_all()) == 2
  650. assert len(_SequenceManager._get_all()) == 2
  651. assert len(_TaskManager._get_all()) == 4
  652. assert len(_DataManager._get_all()) == 6
  653. assert len(_JobManager._get_all()) == 4
  654. _SequenceManager._hard_delete(sequence_1.id)
  655. assert len(_ScenarioManager._get_all()) == 2
  656. assert len(_SequenceManager._get_all()) == 1
  657. assert len(_TaskManager._get_all()) == 4
  658. assert len(_DataManager._get_all()) == 6
  659. assert len(_JobManager._get_all()) == 4
  660. def my_print(a, b):
  661. print(a + b) # noqa: T201
  662. def test_submit_task_with_input_dn_wrong_file_path(caplog):
  663. csv_dn_cfg = Config.configure_csv_data_node("wrong_csv_file_path", default_path="wrong_path.csv")
  664. pickle_dn_cfg = Config.configure_pickle_data_node("wrong_pickle_file_path", default_path="wrong_path.pickle")
  665. parquet_dn_cfg = Config.configure_parquet_data_node("wrong_parquet_file_path", default_path="wrong_path.parquet")
  666. json_dn_cfg = Config.configure_parquet_data_node("wrong_json_file_path", default_path="wrong_path.json")
  667. task_cfg = Config.configure_task("task", my_print, [csv_dn_cfg, pickle_dn_cfg], parquet_dn_cfg)
  668. task_2_cfg = Config.configure_task("task2", my_print, [csv_dn_cfg, parquet_dn_cfg], json_dn_cfg)
  669. tasks = _TaskManager._bulk_get_or_create([task_cfg, task_2_cfg])
  670. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  671. _ScenarioManager._repository._save(scenario)
  672. sequence = scenario.sequences["sequence"]
  673. pip_manager = _SequenceManagerFactory._build_manager()
  674. pip_manager._submit(sequence)
  675. stdout = caplog.text
  676. expected_outputs = [
  677. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  678. f"path : {input_dn.path} "
  679. for input_dn in sequence.get_inputs()
  680. ]
  681. not_expected_outputs = [
  682. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  683. f"path : {input_dn.path} "
  684. for input_dn in sequence.data_nodes.values()
  685. if input_dn not in sequence.get_inputs()
  686. ]
  687. assert all(expected_output in stdout for expected_output in expected_outputs)
  688. assert all(expected_output not in stdout for expected_output in not_expected_outputs)
  689. def test_submit_task_with_one_input_dn_wrong_file_path(caplog):
  690. csv_dn_cfg = Config.configure_csv_data_node("wrong_csv_file_path", default_path="wrong_path.csv")
  691. pickle_dn_cfg = Config.configure_pickle_data_node("wrong_pickle_file_path", default_data="value")
  692. parquet_dn_cfg = Config.configure_parquet_data_node("wrong_parquet_file_path", default_path="wrong_path.parquet")
  693. json_dn_cfg = Config.configure_parquet_data_node("wrong_json_file_path", default_path="wrong_path.json")
  694. task_cfg = Config.configure_task("task", my_print, [csv_dn_cfg, pickle_dn_cfg], parquet_dn_cfg)
  695. task_2_cfg = Config.configure_task("task2", my_print, [csv_dn_cfg, parquet_dn_cfg], json_dn_cfg)
  696. tasks = _TaskManager._bulk_get_or_create([task_cfg, task_2_cfg])
  697. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  698. _ScenarioManager._repository._save(scenario)
  699. sequence = scenario.sequences["sequence"]
  700. pip_manager = _SequenceManagerFactory._build_manager()
  701. pip_manager._submit(sequence)
  702. stdout = caplog.text
  703. expected_outputs = [
  704. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  705. f"path : {input_dn.path} "
  706. for input_dn in sequence.get_inputs()
  707. if input_dn.config_id == "wrong_csv_file_path"
  708. ]
  709. not_expected_outputs = [
  710. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  711. f"path : {input_dn.path} "
  712. for input_dn in sequence.data_nodes.values()
  713. if input_dn.config_id != "wrong_csv_file_path"
  714. ]
  715. assert all(expected_output in stdout for expected_output in expected_outputs)
  716. assert all(expected_output not in stdout for expected_output in not_expected_outputs)