test_sequence_manager.py 39 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976
  1. # Copyright 2023 Avaiga Private Limited
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
  4. # the License. You may obtain a copy of the License at
  5. #
  6. # http://www.apache.org/licenses/LICENSE-2.0
  7. #
  8. # Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
  9. # an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
  10. # specific language governing permissions and limitations under the License.
  11. import json
  12. from pathlib import Path
  13. from typing import Callable, Iterable, Optional
  14. from unittest import mock
  15. from unittest.mock import ANY
  16. import pytest
  17. from taipy.config.common.scope import Scope
  18. from taipy.config.config import Config
  19. from taipy.core._orchestrator._orchestrator import _Orchestrator
  20. from taipy.core._orchestrator._orchestrator_factory import _OrchestratorFactory
  21. from taipy.core._version._version_manager import _VersionManager
  22. from taipy.core.common import _utils
  23. from taipy.core.common._utils import _Subscriber
  24. from taipy.core.config.job_config import JobConfig
  25. from taipy.core.data._data_manager import _DataManager
  26. from taipy.core.data.in_memory import InMemoryDataNode
  27. from taipy.core.exceptions.exceptions import (
  28. InvalidSequenceId,
  29. ModelNotFound,
  30. NonExistingSequence,
  31. SequenceBelongsToNonExistingScenario,
  32. )
  33. from taipy.core.job._job_manager import _JobManager
  34. from taipy.core.scenario._scenario_manager import _ScenarioManager
  35. from taipy.core.scenario.scenario import Scenario
  36. from taipy.core.sequence._sequence_manager import _SequenceManager
  37. from taipy.core.sequence._sequence_manager_factory import _SequenceManagerFactory
  38. from taipy.core.sequence.sequence import Sequence
  39. from taipy.core.sequence.sequence_id import SequenceId
  40. from taipy.core.task._task_manager import _TaskManager
  41. from taipy.core.task.task import Task
  42. from taipy.core.task.task_id import TaskId
  43. from tests.core.utils.NotifyMock import NotifyMock
  44. def test_breakdown_sequence_id():
  45. with pytest.raises(InvalidSequenceId):
  46. _SequenceManager._breakdown_sequence_id("scenario_id")
  47. with pytest.raises(InvalidSequenceId):
  48. _SequenceManager._breakdown_sequence_id("sequence_id")
  49. with pytest.raises(InvalidSequenceId):
  50. _SequenceManager._breakdown_sequence_id("SEQUENCE_sequence_id")
  51. with pytest.raises(InvalidSequenceId):
  52. _SequenceManager._breakdown_sequence_id("SCENARIO_scenario_id")
  53. with pytest.raises(InvalidSequenceId):
  54. _SequenceManager._breakdown_sequence_id("sequence_SCENARIO_scenario_id")
  55. with pytest.raises(InvalidSequenceId):
  56. _SequenceManager._breakdown_sequence_id("SEQUENCE_sequence_scenario_id")
  57. sequence_name, scenario_id = _SequenceManager._breakdown_sequence_id("SEQUENCE_sequence_SCENARIO_scenario")
  58. assert sequence_name == "sequence" and scenario_id == "SCENARIO_scenario"
  59. sequence_name, scenario_id = _SequenceManager._breakdown_sequence_id("SEQUENCEsequenceSCENARIO_scenario")
  60. assert sequence_name == "sequence" and scenario_id == "SCENARIO_scenario"
  61. def test_raise_sequence_does_not_belong_to_scenario():
  62. with pytest.raises(SequenceBelongsToNonExistingScenario):
  63. sequence = Sequence({"name": "sequence_name"}, [], "SEQUENCE_sequence_name_SCENARIO_scenario_id")
  64. _SequenceManager._set(sequence)
  65. def __init():
  66. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  67. _OrchestratorFactory._build_dispatcher()
  68. input_dn = InMemoryDataNode("foo", Scope.SCENARIO)
  69. output_dn = InMemoryDataNode("foo", Scope.SCENARIO)
  70. task = Task("task", {}, print, [input_dn], [output_dn], TaskId("task_id"))
  71. scenario = Scenario("scenario", set([task]), {}, set())
  72. _ScenarioManager._set(scenario)
  73. return scenario, task
  74. def test_set_and_get_sequence_no_existing_sequence():
  75. scenario, task = __init()
  76. sequence_name_1 = "p1"
  77. sequence_id_1 = SequenceId(f"SEQUENCE_{sequence_name_1}_{scenario.id}")
  78. sequence_name_2 = "p2"
  79. sequence_id_2 = SequenceId(f"SEQUENCE_{sequence_name_2}_{scenario.id}")
  80. assert _SequenceManager._get(sequence_id_1) is None
  81. assert _SequenceManager._get(sequence_id_2) is None
  82. assert _SequenceManager._get("sequence") is None
  83. def test_set_and_get():
  84. scenario, task = __init()
  85. sequence_name_1 = "p1"
  86. sequence_id_1 = SequenceId(f"SEQUENCE_{sequence_name_1}_{scenario.id}")
  87. sequence_name_2 = "p2"
  88. sequence_id_2 = SequenceId(f"SEQUENCE_{sequence_name_2}_{scenario.id}")
  89. scenario.add_sequences({sequence_name_1: []})
  90. sequence_1 = scenario.sequences[sequence_name_1]
  91. assert _SequenceManager._get(sequence_id_1).id == sequence_1.id
  92. assert len(_SequenceManager._get(sequence_id_1).tasks) == 0
  93. assert _SequenceManager._get(sequence_1).id == sequence_1.id
  94. assert len(_SequenceManager._get(sequence_1).tasks) == 0
  95. assert _SequenceManager._get(sequence_id_2) is None
  96. # Save a second sequence. Now, we expect to have a total of two sequences stored
  97. _TaskManager._set(task)
  98. scenario.add_sequences({sequence_name_2: [task]})
  99. sequence_2 = scenario.sequences[sequence_name_2]
  100. assert _SequenceManager._get(sequence_id_1).id == sequence_1.id
  101. assert len(_SequenceManager._get(sequence_id_1).tasks) == 0
  102. assert _SequenceManager._get(sequence_1).id == sequence_1.id
  103. assert len(_SequenceManager._get(sequence_1).tasks) == 0
  104. assert _SequenceManager._get(sequence_id_2).id == sequence_2.id
  105. assert len(_SequenceManager._get(sequence_id_2).tasks) == 1
  106. assert _SequenceManager._get(sequence_2).id == sequence_2.id
  107. assert len(_SequenceManager._get(sequence_2).tasks) == 1
  108. assert _TaskManager._get(task.id).id == task.id
  109. # We save the first sequence again. We expect nothing to change
  110. scenario.add_sequence(sequence_name_1, [])
  111. sequence_1 = scenario.sequences[sequence_name_1]
  112. assert _SequenceManager._get(sequence_id_1).id == sequence_1.id
  113. assert len(_SequenceManager._get(sequence_id_1).tasks) == 0
  114. assert _SequenceManager._get(sequence_1).id == sequence_1.id
  115. assert len(_SequenceManager._get(sequence_1).tasks) == 0
  116. assert _SequenceManager._get(sequence_id_2).id == sequence_2.id
  117. assert len(_SequenceManager._get(sequence_id_2).tasks) == 1
  118. assert _SequenceManager._get(sequence_2).id == sequence_2.id
  119. assert len(_SequenceManager._get(sequence_2).tasks) == 1
  120. assert _TaskManager._get(task.id).id == task.id
  121. # We save a third sequence with same name as the first one.
  122. # We expect the first sequence to be updated
  123. scenario.add_sequences({sequence_name_1: [task]})
  124. sequence_3 = scenario.sequences[sequence_name_1]
  125. assert _SequenceManager._get(sequence_id_1).id == sequence_1.id
  126. assert _SequenceManager._get(sequence_id_1).id == sequence_3.id
  127. assert len(_SequenceManager._get(sequence_id_1).tasks) == 1
  128. assert _SequenceManager._get(sequence_1).id == sequence_1.id
  129. assert len(_SequenceManager._get(sequence_1).tasks) == 1
  130. assert _SequenceManager._get(sequence_id_2).id == sequence_2.id
  131. assert len(_SequenceManager._get(sequence_id_2).tasks) == 1
  132. assert _SequenceManager._get(sequence_2).id == sequence_2.id
  133. assert len(_SequenceManager._get(sequence_2).tasks) == 1
  134. assert _TaskManager._get(task.id).id == task.id
  135. def test_get_all_on_multiple_versions_environment():
  136. # Create 5 sequences from Scenario with 2 versions each
  137. for version in range(1, 3):
  138. for i in range(5):
  139. _ScenarioManager._set(
  140. Scenario(
  141. f"config_id_{i+version}",
  142. [],
  143. {},
  144. [],
  145. f"SCENARIO_id_{i}_v{version}",
  146. version=f"{version}.0",
  147. sequences={"sequence": {}},
  148. )
  149. )
  150. _VersionManager._set_experiment_version("1.0")
  151. assert len(_SequenceManager._get_all()) == 5
  152. assert (
  153. len(_SequenceManager._get_all_by(filters=[{"version": "1.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 1
  154. )
  155. assert (
  156. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 0
  157. )
  158. _VersionManager._set_experiment_version("2.0")
  159. assert len(_SequenceManager._get_all()) == 5
  160. assert (
  161. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 0
  162. )
  163. assert (
  164. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v2"}])) == 1
  165. )
  166. _VersionManager._set_development_version("1.0")
  167. assert len(_SequenceManager._get_all()) == 5
  168. assert (
  169. len(_SequenceManager._get_all_by(filters=[{"version": "1.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 1
  170. )
  171. assert (
  172. len(_SequenceManager._get_all_by(filters=[{"version": "1.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v2"}])) == 0
  173. )
  174. _VersionManager._set_development_version("2.0")
  175. assert len(_SequenceManager._get_all()) == 5
  176. assert (
  177. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v1"}])) == 0
  178. )
  179. assert (
  180. len(_SequenceManager._get_all_by(filters=[{"version": "2.0", "id": "SEQUENCE_sequence_SCENARIO_id_1_v2"}])) == 1
  181. )
  182. def test_is_submittable():
  183. dn = InMemoryDataNode("dn", Scope.SCENARIO, properties={"default_data": 10})
  184. task = Task("task", {}, print, [dn])
  185. scenario = Scenario("scenario", set([task]), {}, set())
  186. _ScenarioManager._set(scenario)
  187. scenario.add_sequences({"sequence": [task]})
  188. sequence = scenario.sequences["sequence"]
  189. assert len(_SequenceManager._get_all()) == 1
  190. assert _SequenceManager._is_submittable(sequence)
  191. assert _SequenceManager._is_submittable(sequence.id)
  192. assert not _SequenceManager._is_submittable("Sequence_temp")
  193. assert not _SequenceManager._is_submittable("SEQUENCE_temp_SCENARIO_scenario")
  194. scenario.dn.edit_in_progress = True
  195. assert not _SequenceManager._is_submittable(sequence)
  196. assert not _SequenceManager._is_submittable(sequence.id)
  197. scenario.dn.edit_in_progress = False
  198. assert _SequenceManager._is_submittable(sequence)
  199. assert _SequenceManager._is_submittable(sequence.id)
  200. def test_submit():
  201. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  202. _OrchestratorFactory._build_dispatcher()
  203. data_node_1 = InMemoryDataNode("foo", Scope.SCENARIO, "s1")
  204. data_node_2 = InMemoryDataNode("bar", Scope.SCENARIO, "s2")
  205. data_node_3 = InMemoryDataNode("baz", Scope.SCENARIO, "s3")
  206. data_node_4 = InMemoryDataNode("qux", Scope.SCENARIO, "s4")
  207. data_node_5 = InMemoryDataNode("quux", Scope.SCENARIO, "s5")
  208. data_node_6 = InMemoryDataNode("quuz", Scope.SCENARIO, "s6")
  209. data_node_7 = InMemoryDataNode("corge", Scope.SCENARIO, "s7")
  210. task_1 = Task(
  211. "grault",
  212. {},
  213. print,
  214. [data_node_1, data_node_2],
  215. [data_node_3, data_node_4],
  216. TaskId("t1"),
  217. )
  218. task_2 = Task("garply", {}, print, [data_node_3], [data_node_5], TaskId("t2"))
  219. task_3 = Task("waldo", {}, print, [data_node_5, data_node_4], [data_node_6], TaskId("t3"))
  220. task_4 = Task("fred", {}, print, [data_node_4], [data_node_7], TaskId("t4"))
  221. scenario = Scenario("sce", {task_1, task_2, task_3, task_4}, {})
  222. sequence_name = "sequence"
  223. sequence_id = Sequence._new_id(sequence_name, scenario.id)
  224. class MockOrchestrator(_Orchestrator):
  225. submit_calls = []
  226. @classmethod
  227. def _lock_dn_output_and_create_job(
  228. cls,
  229. task: Task,
  230. submit_id: str,
  231. submit_entity_id: str,
  232. callbacks: Optional[Iterable[Callable]] = None,
  233. force: bool = False,
  234. ):
  235. cls.submit_calls.append(task)
  236. return super()._lock_dn_output_and_create_job(task, submit_id, submit_entity_id, callbacks, force)
  237. with mock.patch("taipy.core.task._task_manager._TaskManager._orchestrator", new=MockOrchestrator):
  238. # sequence does not exists. We expect an exception to be raised
  239. with pytest.raises(NonExistingSequence):
  240. _SequenceManager._submit(sequence_id)
  241. _ScenarioManager._set(scenario)
  242. scenario.add_sequences({sequence_name: [task_4, task_2, task_1, task_3]})
  243. # sequence, and tasks does exist. We expect the tasks to be submitted
  244. # in a specific order
  245. _TaskManager._set(task_1)
  246. _TaskManager._set(task_2)
  247. _TaskManager._set(task_3)
  248. _TaskManager._set(task_4)
  249. sequence = scenario.sequences[sequence_name]
  250. _SequenceManager._submit(sequence.id)
  251. calls_ids = [t.id for t in _TaskManager._orchestrator().submit_calls]
  252. tasks_ids = [task_1.id, task_2.id, task_4.id, task_3.id]
  253. assert calls_ids == tasks_ids
  254. _SequenceManager._submit(sequence)
  255. calls_ids = [t.id for t in _TaskManager._orchestrator().submit_calls]
  256. tasks_ids = tasks_ids * 2
  257. assert set(calls_ids) == set(tasks_ids)
  258. def test_assign_sequence_as_parent_of_task():
  259. dn_config_1 = Config.configure_data_node("dn_1", "in_memory", scope=Scope.SCENARIO)
  260. dn_config_2 = Config.configure_data_node("dn_2", "in_memory", scope=Scope.SCENARIO)
  261. dn_config_3 = Config.configure_data_node("dn_3", "in_memory", scope=Scope.SCENARIO)
  262. task_config_1 = Config.configure_task("task_1", print, [dn_config_1], [dn_config_2])
  263. task_config_2 = Config.configure_task("task_2", print, [dn_config_2], [dn_config_3])
  264. task_config_3 = Config.configure_task("task_3", print, [dn_config_2], [dn_config_3])
  265. tasks = _TaskManager._bulk_get_or_create([task_config_1, task_config_2, task_config_3], "scenario_id")
  266. sequence_1 = _SequenceManager._create("sequence_1", [tasks[0], tasks[1]], scenario_id="scenario_id")
  267. sequence_2 = _SequenceManager._create("sequence_2", [tasks[0], tasks[2]], scenario_id="scenario_id")
  268. tasks_1 = list(sequence_1.tasks.values())
  269. tasks_2 = list(sequence_2.tasks.values())
  270. assert len(tasks_1) == 2
  271. assert len(tasks_2) == 2
  272. assert tasks_1[0].parent_ids == {sequence_1.id, sequence_2.id}
  273. assert tasks_2[0].parent_ids == {sequence_1.id, sequence_2.id}
  274. assert tasks_1[1].parent_ids == {sequence_1.id}
  275. assert tasks_2[1].parent_ids == {sequence_2.id}
  276. g = 0
  277. def mock_function_no_input_no_output():
  278. global g
  279. g += 1
  280. def mock_function_one_input_no_output(inp):
  281. global g
  282. g += inp
  283. def mock_function_no_input_one_output():
  284. global g
  285. return g
  286. def test_submit_sequence_from_tasks_with_one_or_no_input_output():
  287. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  288. _OrchestratorFactory._build_dispatcher()
  289. # test no input and no output Task
  290. task_no_input_no_output = Task("task_no_input_no_output", {}, mock_function_no_input_no_output)
  291. scenario_1 = Scenario("scenario_1", {task_no_input_no_output}, {})
  292. _TaskManager._set(task_no_input_no_output)
  293. _ScenarioManager._set(scenario_1)
  294. scenario_1.add_sequences({"my_sequence_1": [task_no_input_no_output]})
  295. sequence_1 = scenario_1.sequences["my_sequence_1"]
  296. assert len(sequence_1._get_sorted_tasks()) == 1
  297. _SequenceManager._submit(sequence_1)
  298. assert g == 1
  299. # test one input and no output Task
  300. data_node_input = InMemoryDataNode("input_dn", Scope.SCENARIO, properties={"default_data": 2})
  301. task_one_input_no_output = Task(
  302. "task_one_input_no_output", {}, mock_function_one_input_no_output, input=[data_node_input]
  303. )
  304. scenario_2 = Scenario("scenario_2", {task_one_input_no_output}, {})
  305. _DataManager._set(data_node_input)
  306. data_node_input.unlock_edit()
  307. _TaskManager._set(task_one_input_no_output)
  308. _ScenarioManager._set(scenario_2)
  309. scenario_2.add_sequences({"my_sequence_2": [task_one_input_no_output]})
  310. sequence_2 = scenario_2.sequences["my_sequence_2"]
  311. assert len(sequence_2._get_sorted_tasks()) == 1
  312. _SequenceManager._submit(sequence_2)
  313. assert g == 3
  314. # test no input and one output Task
  315. data_node_output = InMemoryDataNode("output_dn", Scope.SCENARIO, properties={"default_data": None})
  316. task_no_input_one_output = Task(
  317. "task_no_input_one_output", {}, mock_function_no_input_one_output, output=[data_node_output]
  318. )
  319. scenario_3 = Scenario("scenario_3", {task_no_input_one_output}, {})
  320. _DataManager._set(data_node_output)
  321. assert data_node_output.read() is None
  322. _TaskManager._set(task_no_input_one_output)
  323. _ScenarioManager._set(scenario_3)
  324. scenario_3.add_sequences({"my_sequence_3": [task_no_input_one_output]})
  325. sequence_3 = scenario_3.sequences["my_sequence_3"]
  326. assert len(sequence_2._get_sorted_tasks()) == 1
  327. _SequenceManager._submit(sequence_3)
  328. assert data_node_output.read() == 3
  329. def mult_by_two(nb: int):
  330. return nb * 2
  331. def mult_by_3(nb: int):
  332. return nb * 3
  333. def test_get_or_create_data():
  334. # only create intermediate data node once
  335. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  336. dn_config_1 = Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)
  337. dn_config_2 = Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0)
  338. dn_config_6 = Config.configure_data_node("baz", "in_memory", Scope.SCENARIO, default_data=0)
  339. task_config_mult_by_two = Config.configure_task("mult_by_two", mult_by_two, [dn_config_1], dn_config_2)
  340. task_config_mult_by_3 = Config.configure_task("mult_by_3", mult_by_3, [dn_config_2], dn_config_6)
  341. # dn_1 ---> mult_by_two ---> dn_2 ---> mult_by_3 ---> dn_6
  342. scenario_config = Config.configure_scenario("scenario", [task_config_mult_by_two, task_config_mult_by_3])
  343. _OrchestratorFactory._build_dispatcher()
  344. assert len(_DataManager._get_all()) == 0
  345. assert len(_TaskManager._get_all()) == 0
  346. scenario = _ScenarioManager._create(scenario_config)
  347. scenario.add_sequences({"by_6": list(scenario.tasks.values())})
  348. sequence = scenario.sequences["by_6"]
  349. assert sequence.name == "by_6"
  350. assert len(_DataManager._get_all()) == 3
  351. assert len(_TaskManager._get_all()) == 2
  352. assert len(sequence._get_sorted_tasks()) == 2
  353. assert sequence.foo.read() == 1
  354. assert sequence.bar.read() == 0
  355. assert sequence.baz.read() == 0
  356. assert sequence._get_sorted_tasks()[0][0].config_id == task_config_mult_by_two.id
  357. assert sequence._get_sorted_tasks()[1][0].config_id == task_config_mult_by_3.id
  358. _SequenceManager._submit(sequence.id)
  359. assert sequence.foo.read() == 1
  360. assert sequence.bar.read() == 2
  361. assert sequence.baz.read() == 6
  362. sequence.foo.write("new data value")
  363. assert sequence.foo.read() == "new data value"
  364. assert sequence.bar.read() == 2
  365. assert sequence.baz.read() == 6
  366. sequence.bar.write(7)
  367. assert sequence.foo.read() == "new data value"
  368. assert sequence.bar.read() == 7
  369. assert sequence.baz.read() == 6
  370. with pytest.raises(AttributeError):
  371. sequence.WRONG.write(7)
  372. def notify1(*args, **kwargs):
  373. ...
  374. def notify2(*args, **kwargs):
  375. ...
  376. def notify_multi_param(*args, **kwargs):
  377. ...
  378. def test_sequence_notification_subscribe(mocker):
  379. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  380. mocker.patch("taipy.core._entity._reload._Reloader._reload", side_effect=lambda m, o: o)
  381. task_configs = [
  382. Config.configure_task(
  383. "mult_by_two",
  384. mult_by_two,
  385. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  386. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  387. )
  388. ]
  389. _OrchestratorFactory._build_dispatcher()
  390. tasks = _TaskManager._bulk_get_or_create(task_configs=task_configs)
  391. scenario = Scenario("scenario", set(tasks), {}, sequences={"by_1": {"tasks": tasks}})
  392. _ScenarioManager._set(scenario)
  393. sequence = scenario.sequences["by_1"]
  394. notify_1 = NotifyMock(sequence)
  395. notify_1.__name__ = "notify_1"
  396. notify_1.__module__ = "notify_1"
  397. notify_2 = NotifyMock(sequence)
  398. notify_2.__name__ = "notify_2"
  399. notify_2.__module__ = "notify_2"
  400. # Mocking this because NotifyMock is a class that does not loads correctly when getting the sequence
  401. # from the storage.
  402. mocker.patch.object(_utils, "_load_fct", side_effect=[notify_1, notify_1, notify_2, notify_2, notify_2, notify_2])
  403. # test subscription
  404. callback = mock.MagicMock()
  405. _SequenceManager._submit(sequence.id, [callback])
  406. callback.assert_called()
  407. # test sequence subscribe notification
  408. _SequenceManager._subscribe(callback=notify_1, sequence=sequence)
  409. _SequenceManager._submit(sequence.id)
  410. notify_1.assert_called_3_times()
  411. notify_1.reset()
  412. # test sequence unsubscribe notification
  413. # test subscribe notification only on new job
  414. _SequenceManager._unsubscribe(callback=notify_1, sequence=sequence)
  415. _SequenceManager._subscribe(callback=notify_2, sequence=sequence)
  416. _SequenceManager._submit(sequence)
  417. notify_1.assert_not_called()
  418. notify_2.assert_called_3_times()
  419. def test_sequence_notification_subscribe_multi_param(mocker):
  420. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  421. mocker.patch("taipy.core._entity._reload._Reloader._reload", side_effect=lambda m, o: o)
  422. task_configs = [
  423. Config.configure_task(
  424. "mult_by_two",
  425. mult_by_two,
  426. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  427. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  428. )
  429. ]
  430. _OrchestratorFactory._build_dispatcher()
  431. tasks = _TaskManager._bulk_get_or_create(task_configs)
  432. scenario = Scenario("scenario", set(tasks), {}, sequences={"by_6": {"tasks": tasks}})
  433. _ScenarioManager._set(scenario)
  434. sequence = scenario.sequences["by_6"]
  435. notify = mocker.Mock()
  436. # test sequence subscribe notification
  437. _SequenceManager._subscribe(callback=notify, params=["foobar", 123, 1.2], sequence=sequence)
  438. mocker.patch.object(_SequenceManager, "_get", return_value=sequence)
  439. _SequenceManager._submit(sequence.id)
  440. # as the callback is called with Sequence/Scenario and Job objects
  441. # we can assert that is called with params plus a sequence object that we know
  442. # of and a job object that is represented by ANY in this case
  443. notify.assert_called_with("foobar", 123, 1.2, sequence, ANY)
  444. def test_sequence_notification_unsubscribe(mocker):
  445. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  446. mocker.patch("taipy.core._entity._reload._Reloader._reload", side_effect=lambda m, o: o)
  447. task_configs = [
  448. Config.configure_task(
  449. "mult_by_two",
  450. mult_by_two,
  451. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  452. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  453. )
  454. ]
  455. _OrchestratorFactory._build_dispatcher()
  456. tasks = _TaskManager._bulk_get_or_create(task_configs)
  457. scenario = Scenario("scenario", set(tasks), {}, sequences={"by_6": {"tasks": tasks}})
  458. _ScenarioManager._set(scenario)
  459. sequence = scenario.sequences["by_6"]
  460. notify_1 = notify1
  461. notify_2 = notify2
  462. _SequenceManager._subscribe(callback=notify_1, sequence=sequence)
  463. _SequenceManager._unsubscribe(callback=notify_1, sequence=sequence)
  464. _SequenceManager._subscribe(callback=notify_2, sequence=sequence)
  465. _SequenceManager._submit(sequence.id)
  466. with pytest.raises(ValueError):
  467. _SequenceManager._unsubscribe(callback=notify_1, sequence=sequence)
  468. _SequenceManager._unsubscribe(callback=notify_2, sequence=sequence)
  469. def test_sequence_notification_unsubscribe_multi_param():
  470. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  471. task_configs = [
  472. Config.configure_task(
  473. "mult_by_two",
  474. mult_by_two,
  475. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  476. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  477. )
  478. ]
  479. _OrchestratorFactory._build_dispatcher()
  480. tasks = _TaskManager._bulk_get_or_create(task_configs)
  481. scenario = Scenario("scenario", tasks, {}, sequences={"by_6": {"tasks": tasks}})
  482. _ScenarioManager._set(scenario)
  483. sequence = scenario.sequences["by_6"]
  484. _SequenceManager._subscribe(callback=notify_multi_param, params=["foobar", 123, 0], sequence=sequence)
  485. _SequenceManager._subscribe(callback=notify_multi_param, params=["foobar", 123, 1], sequence=sequence)
  486. _SequenceManager._subscribe(callback=notify_multi_param, params=["foobar", 123, 2], sequence=sequence)
  487. assert len(sequence.subscribers) == 3
  488. sequence.unsubscribe(notify_multi_param)
  489. assert len(sequence.subscribers) == 2
  490. assert _Subscriber(notify_multi_param, ["foobar", 123, 0]) not in sequence.subscribers
  491. sequence.unsubscribe(notify_multi_param, ["foobar", 123, 2])
  492. assert len(sequence.subscribers) == 1
  493. assert _Subscriber(notify_multi_param, ["foobar", 123, 2]) not in sequence.subscribers
  494. with pytest.raises(ValueError):
  495. sequence.unsubscribe(notify_multi_param, ["foobar", 123, 10000])
  496. def test_sequence_notification_subscribe_all():
  497. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  498. task_configs = [
  499. Config.configure_task(
  500. "mult_by_two",
  501. mult_by_two,
  502. [Config.configure_data_node("foo", "in_memory", Scope.SCENARIO, default_data=1)],
  503. Config.configure_data_node("bar", "in_memory", Scope.SCENARIO, default_data=0),
  504. )
  505. ]
  506. _OrchestratorFactory._build_dispatcher()
  507. tasks = _TaskManager._bulk_get_or_create(task_configs)
  508. scenario = Scenario("scenario", tasks, {}, sequences={"by_6": {"tasks": tasks}, "other_sequence": {"tasks": tasks}})
  509. _ScenarioManager._set(scenario)
  510. sequence = scenario.sequences["by_6"]
  511. other_sequence = scenario.sequences["other_sequence"]
  512. notify_1 = NotifyMock(sequence)
  513. _SequenceManager._subscribe(notify_1)
  514. assert len(_SequenceManager._get(sequence.id).subscribers) == 1
  515. assert len(_SequenceManager._get(other_sequence.id).subscribers) == 1
  516. def test_delete():
  517. sequence_id = "SEQUENCE_sequence_SCENARIO_scenario_id_1"
  518. with pytest.raises(ModelNotFound):
  519. _SequenceManager._delete(sequence_id)
  520. scenario_1 = Scenario("scenario_1", [], {}, scenario_id="SCENARIO_scenario_id_1")
  521. scenario_2 = Scenario("scenario_2", [], {}, scenario_id="SCENARIO_scenario_id_2")
  522. _ScenarioManager._set(scenario_1)
  523. _ScenarioManager._set(scenario_2)
  524. with pytest.raises(ModelNotFound):
  525. _SequenceManager._delete(sequence_id)
  526. scenario_1.add_sequences({"sequence": {}})
  527. assert len(_SequenceManager._get_all()) == 1
  528. _SequenceManager._delete(sequence_id)
  529. assert len(_SequenceManager._get_all()) == 0
  530. scenario_1.add_sequences({"sequence": {}, "sequence_1": {}})
  531. assert len(_SequenceManager._get_all()) == 2
  532. _SequenceManager._delete(sequence_id)
  533. assert len(_SequenceManager._get_all()) == 1
  534. scenario_1.add_sequences({"sequence_1": {}, "sequence_2": {}, "sequence_3": {}})
  535. scenario_2.add_sequences({"sequence_1_2": {}, "sequence_2_2": {}})
  536. assert len(_SequenceManager._get_all()) == 5
  537. _SequenceManager._delete_all()
  538. assert len(_SequenceManager._get_all()) == 0
  539. scenario_1.add_sequences({"sequence_1": {}, "sequence_2": {}, "sequence_3": {}, "sequence_4": {}})
  540. scenario_2.add_sequences({"sequence_1_2": {}, "sequence_2_2": {}})
  541. assert len(_SequenceManager._get_all()) == 6
  542. _SequenceManager._delete_many(
  543. [
  544. "SEQUENCE_sequence_1_SCENARIO_scenario_id_1",
  545. "SEQUENCE_sequence_2_SCENARIO_scenario_id_1",
  546. "SEQUENCE_sequence_1_2_SCENARIO_scenario_id_2",
  547. ]
  548. )
  549. assert len(_SequenceManager._get_all()) == 3
  550. with pytest.raises(ModelNotFound):
  551. _SequenceManager._delete_many(
  552. ["SEQUENCE_sequence_1_SCENARIO_scenario_id_1", "SEQUENCE_sequence_2_SCENARIO_scenario_id_1"]
  553. )
  554. def test_delete_version():
  555. scenario_1_0 = Scenario(
  556. "scenario_config",
  557. [],
  558. {},
  559. scenario_id="SCENARIO_id_1_v1_0",
  560. version="1.0",
  561. sequences={"sequence_1": {}, "sequence_2": {}},
  562. )
  563. scenario_1_1 = Scenario(
  564. "scenario_config",
  565. [],
  566. {},
  567. scenario_id="SCENARIO_id_1_v1_1",
  568. version="1.1",
  569. sequences={"sequence_1": {}, "sequence_2": {}},
  570. )
  571. _ScenarioManager._set(scenario_1_0)
  572. _ScenarioManager._set(scenario_1_1)
  573. _VersionManager._set_experiment_version("1.1")
  574. assert len(_ScenarioManager._get_all()) == 1
  575. assert len(_SequenceManager._get_all()) == 2
  576. _VersionManager._set_experiment_version("1.0")
  577. assert len(_ScenarioManager._get_all()) == 1
  578. assert len(_SequenceManager._get_all()) == 2
  579. _SequenceManager._delete_by_version("1.0")
  580. assert len(_ScenarioManager._get_all()) == 1
  581. assert len(_SequenceManager._get_all()) == 0
  582. assert len(scenario_1_0.sequences) == 0
  583. assert len(scenario_1_1.sequences) == 2
  584. _VersionManager._set_experiment_version("1.1")
  585. assert len(_ScenarioManager._get_all()) == 1
  586. assert len(_SequenceManager._get_all()) == 2
  587. assert len(scenario_1_0.sequences) == 0
  588. assert len(scenario_1_1.sequences) == 2
  589. _SequenceManager._delete_by_version("1.1")
  590. assert len(_ScenarioManager._get_all()) == 1
  591. assert len(_SequenceManager._get_all()) == 0
  592. def test_exists():
  593. scenario = Scenario("scenario", [], {}, scenario_id="SCENARIO_scenario", sequences={"sequence": {}})
  594. _ScenarioManager._set(scenario)
  595. assert len(_ScenarioManager._get_all()) == 1
  596. assert len(_SequenceManager._get_all()) == 1
  597. assert not _SequenceManager._exists("SEQUENCE_sequence_not_exist_SCENARIO_scenario")
  598. assert not _SequenceManager._exists("SEQUENCE_sequence_SCENARIO_scenario_id")
  599. assert _SequenceManager._exists("SEQUENCE_sequence_SCENARIO_scenario")
  600. assert _SequenceManager._exists(scenario.sequences["sequence"])
  601. def test_export(tmpdir_factory):
  602. path = tmpdir_factory.mktemp("data")
  603. task = Task("task", {}, print, id=TaskId("task_id"))
  604. scenario = Scenario(
  605. "scenario",
  606. set([task]),
  607. {},
  608. set(),
  609. version="1.0",
  610. sequences={"sequence_1": {}, "sequence_2": {"tasks": [task], "properties": {"xyz": "acb"}}},
  611. )
  612. _TaskManager._set(task)
  613. _ScenarioManager._set(scenario)
  614. sequence_1 = scenario.sequences["sequence_1"]
  615. sequence_2 = scenario.sequences["sequence_2"]
  616. _SequenceManager._export(sequence_1.id, Path(path))
  617. export_sequence_json_file_path = f"{path}/sequences/{sequence_1.id}.json"
  618. with open(export_sequence_json_file_path, "rb") as f:
  619. sequence_json_file = json.load(f)
  620. expected_json = {
  621. "id": sequence_1.id,
  622. "owner_id": scenario.id,
  623. "parent_ids": [scenario.id],
  624. "name": "sequence_1",
  625. "tasks": [],
  626. "properties": {},
  627. "subscribers": [],
  628. }
  629. assert expected_json == sequence_json_file
  630. _SequenceManager._export(sequence_2.id, Path(path))
  631. export_sequence_json_file_path = f"{path}/sequences/{sequence_2.id}.json"
  632. with open(export_sequence_json_file_path, "rb") as f:
  633. sequence_json_file = json.load(f)
  634. expected_json = {
  635. "id": sequence_2.id,
  636. "owner_id": scenario.id,
  637. "parent_ids": [scenario.id],
  638. "name": "sequence_2",
  639. "tasks": [task.id],
  640. "properties": {"xyz": "acb"},
  641. "subscribers": [],
  642. }
  643. assert expected_json == sequence_json_file
  644. def test_hard_delete_one_single_sequence_with_scenario_data_nodes():
  645. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  646. dn_input_config = Config.configure_data_node("my_input", "in_memory", scope=Scope.SCENARIO, default_data="testing")
  647. dn_output_config = Config.configure_data_node("my_output", "in_memory", scope=Scope.SCENARIO)
  648. task_config = Config.configure_task("task_config", print, dn_input_config, dn_output_config)
  649. _OrchestratorFactory._build_dispatcher()
  650. tasks = _TaskManager._bulk_get_or_create([task_config])
  651. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  652. _ScenarioManager._set(scenario)
  653. sequence = scenario.sequences["sequence"]
  654. sequence.submit()
  655. assert len(_ScenarioManager._get_all()) == 1
  656. assert len(_SequenceManager._get_all()) == 1
  657. assert len(_TaskManager._get_all()) == 1
  658. assert len(_DataManager._get_all()) == 2
  659. assert len(_JobManager._get_all()) == 1
  660. _SequenceManager._hard_delete(sequence.id)
  661. assert len(_ScenarioManager._get_all()) == 1
  662. assert len(_SequenceManager._get_all()) == 0
  663. assert len(_TaskManager._get_all()) == 1
  664. assert len(_DataManager._get_all()) == 2
  665. assert len(_JobManager._get_all()) == 1
  666. def test_hard_delete_one_single_sequence_with_cycle_data_nodes():
  667. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  668. dn_input_config = Config.configure_data_node("my_input", "in_memory", scope=Scope.CYCLE, default_data="testing")
  669. dn_output_config = Config.configure_data_node("my_output", "in_memory", scope=Scope.CYCLE)
  670. task_config = Config.configure_task("task_config", print, dn_input_config, dn_output_config)
  671. _OrchestratorFactory._build_dispatcher()
  672. tasks = _TaskManager._bulk_get_or_create([task_config])
  673. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  674. _ScenarioManager._set(scenario)
  675. sequence = scenario.sequences["sequence"]
  676. sequence.submit()
  677. assert len(_ScenarioManager._get_all()) == 1
  678. assert len(_SequenceManager._get_all()) == 1
  679. assert len(_TaskManager._get_all()) == 1
  680. assert len(_DataManager._get_all()) == 2
  681. assert len(_JobManager._get_all()) == 1
  682. _SequenceManager._hard_delete(sequence.id)
  683. assert len(_ScenarioManager._get_all()) == 1
  684. assert len(_SequenceManager._get_all()) == 0
  685. assert len(_TaskManager._get_all()) == 1
  686. assert len(_DataManager._get_all()) == 2
  687. assert len(_JobManager._get_all()) == 1
  688. def test_hard_delete_shared_entities():
  689. Config.configure_job_executions(mode=JobConfig._DEVELOPMENT_MODE)
  690. input_dn = Config.configure_data_node("my_input", "in_memory", scope=Scope.SCENARIO, default_data="testing")
  691. intermediate_dn = Config.configure_data_node("my_inter", "in_memory", scope=Scope.GLOBAL, default_data="testing")
  692. output_dn = Config.configure_data_node("my_output", "in_memory", scope=Scope.GLOBAL, default_data="testing")
  693. task_1 = Config.configure_task("task_1", print, input_dn, intermediate_dn)
  694. task_2 = Config.configure_task("task_2", print, intermediate_dn, output_dn)
  695. _OrchestratorFactory._build_dispatcher()
  696. tasks_scenario_1 = _TaskManager._bulk_get_or_create([task_1, task_2], scenario_id="scenario_id_1")
  697. tasks_scenario_2 = _TaskManager._bulk_get_or_create([task_1, task_2], scenario_id="scenario_id_2")
  698. scenario_1 = Scenario("scenario_1", tasks_scenario_1, {}, sequences={"sequence": {"tasks": tasks_scenario_1}})
  699. scenario_2 = Scenario("scenario_2", tasks_scenario_2, {}, sequences={"sequence": {"tasks": tasks_scenario_2}})
  700. _ScenarioManager._set(scenario_1)
  701. _ScenarioManager._set(scenario_2)
  702. sequence_1 = scenario_1.sequences["sequence"]
  703. sequence_2 = scenario_2.sequences["sequence"]
  704. _SequenceManager._submit(sequence_1.id)
  705. _SequenceManager._submit(sequence_2.id)
  706. assert len(_ScenarioManager._get_all()) == 2
  707. assert len(_SequenceManager._get_all()) == 2
  708. assert len(_TaskManager._get_all()) == 3
  709. assert len(_DataManager._get_all()) == 4
  710. assert len(_JobManager._get_all()) == 4
  711. _SequenceManager._hard_delete(sequence_1.id)
  712. assert len(_ScenarioManager._get_all()) == 2
  713. assert len(_SequenceManager._get_all()) == 1
  714. assert len(_TaskManager._get_all()) == 3
  715. assert len(_DataManager._get_all()) == 4
  716. assert len(_JobManager._get_all()) == 4
  717. def my_print(a, b):
  718. print(a + b)
  719. def test_submit_task_with_input_dn_wrong_file_path(caplog):
  720. csv_dn_cfg = Config.configure_csv_data_node("wrong_csv_file_path", default_path="wrong_path.csv")
  721. pickle_dn_cfg = Config.configure_pickle_data_node("wrong_pickle_file_path", default_path="wrong_path.pickle")
  722. parquet_dn_cfg = Config.configure_parquet_data_node("wrong_parquet_file_path", default_path="wrong_path.parquet")
  723. json_dn_cfg = Config.configure_parquet_data_node("wrong_json_file_path", default_path="wrong_path.json")
  724. task_cfg = Config.configure_task("task", my_print, [csv_dn_cfg, pickle_dn_cfg], parquet_dn_cfg)
  725. task_2_cfg = Config.configure_task("task2", my_print, [csv_dn_cfg, parquet_dn_cfg], json_dn_cfg)
  726. tasks = _TaskManager._bulk_get_or_create([task_cfg, task_2_cfg])
  727. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  728. _ScenarioManager._set(scenario)
  729. sequence = scenario.sequences["sequence"]
  730. pip_manager = _SequenceManagerFactory._build_manager()
  731. pip_manager._submit(sequence)
  732. stdout = caplog.text
  733. expected_outputs = [
  734. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  735. f"path : {input_dn.path} "
  736. for input_dn in sequence.get_inputs()
  737. ]
  738. not_expected_outputs = [
  739. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  740. f"path : {input_dn.path} "
  741. for input_dn in sequence.data_nodes.values()
  742. if input_dn not in sequence.get_inputs()
  743. ]
  744. assert all(expected_output in stdout for expected_output in expected_outputs)
  745. assert all(expected_output not in stdout for expected_output in not_expected_outputs)
  746. def test_submit_task_with_one_input_dn_wrong_file_path(caplog):
  747. csv_dn_cfg = Config.configure_csv_data_node("wrong_csv_file_path", default_path="wrong_path.csv")
  748. pickle_dn_cfg = Config.configure_pickle_data_node("wrong_pickle_file_path", default_data="value")
  749. parquet_dn_cfg = Config.configure_parquet_data_node("wrong_parquet_file_path", default_path="wrong_path.parquet")
  750. json_dn_cfg = Config.configure_parquet_data_node("wrong_json_file_path", default_path="wrong_path.json")
  751. task_cfg = Config.configure_task("task", my_print, [csv_dn_cfg, pickle_dn_cfg], parquet_dn_cfg)
  752. task_2_cfg = Config.configure_task("task2", my_print, [csv_dn_cfg, parquet_dn_cfg], json_dn_cfg)
  753. tasks = _TaskManager._bulk_get_or_create([task_cfg, task_2_cfg])
  754. scenario = Scenario("scenario", tasks, {}, sequences={"sequence": {"tasks": tasks}})
  755. _ScenarioManager._set(scenario)
  756. sequence = scenario.sequences["sequence"]
  757. pip_manager = _SequenceManagerFactory._build_manager()
  758. pip_manager._submit(sequence)
  759. stdout = caplog.text
  760. expected_outputs = [
  761. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  762. f"path : {input_dn.path} "
  763. for input_dn in sequence.get_inputs()
  764. if input_dn.config_id == "wrong_csv_file_path"
  765. ]
  766. not_expected_outputs = [
  767. f"{input_dn.id} cannot be read because it has never been written. Hint: The data node may refer to a wrong "
  768. f"path : {input_dn.path} "
  769. for input_dn in sequence.data_nodes.values()
  770. if input_dn.config_id != "wrong_csv_file_path"
  771. ]
  772. assert all(expected_output in stdout for expected_output in expected_outputs)
  773. assert all(expected_output not in stdout for expected_output in not_expected_outputs)