From 11ff829a1b4544a9d6dc405c63c8b347f411d827 Mon Sep 17 00:00:00 2001
From: Serah Nderi
Date: Wed, 6 Mar 2024 10:38:31 +0300
Subject: [PATCH 1/6] Fix Dict memoization: sorting before normalizing keys is
 unsafe

---
 parsl/dataflow/dflow.py                        |   3 +-
 parsl/dataflow/memoization.py                  |  15 +++++---
 .../tests/test_python_apps/test_memoize_3.py   |  32 ++++++++++++++++++
 runinfo/000/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/000/checkpoint/tasks.pkl               | Bin 0 -> 328 bytes
 runinfo/001/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/001/checkpoint/tasks.pkl               |   0
 runinfo/002/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/002/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/003/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/003/checkpoint/tasks.pkl               |   0
 runinfo/004/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/004/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/005/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/005/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/006/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/006/checkpoint/tasks.pkl               | Bin 0 -> 164 bytes
 runinfo/007/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/007/checkpoint/tasks.pkl               | Bin 0 -> 328 bytes
 runinfo/008/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/008/checkpoint/tasks.pkl               |   0
 runinfo/009/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/009/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/010/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/010/checkpoint/tasks.pkl               |   0
 runinfo/011/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/011/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/012/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/012/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/013/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/013/checkpoint/tasks.pkl               | Bin 0 -> 164 bytes
 runinfo/014/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/014/checkpoint/tasks.pkl               | Bin 0 -> 328 bytes
 runinfo/015/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/015/checkpoint/tasks.pkl               |   0
 runinfo/016/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/016/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/017/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/017/checkpoint/tasks.pkl               |   0
 runinfo/018/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/018/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/019/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/019/checkpoint/tasks.pkl               | Bin 0 -> 415 bytes
 runinfo/020/checkpoint/dfk.pkl                 | Bin 0 -> 78 bytes
 runinfo/020/checkpoint/tasks.pkl               | Bin 0 -> 164 bytes
 45 files changed, 45 insertions(+), 5 deletions(-)
 create mode 100644 parsl/tests/test_python_apps/test_memoize_3.py
 create mode 100644 runinfo/000/checkpoint/dfk.pkl
 create mode 100644 runinfo/000/checkpoint/tasks.pkl
 create mode 100644 runinfo/001/checkpoint/dfk.pkl
 create mode 100644 runinfo/001/checkpoint/tasks.pkl
 create mode 100644 runinfo/002/checkpoint/dfk.pkl
 create mode 100644 runinfo/002/checkpoint/tasks.pkl
 create mode 100644 runinfo/003/checkpoint/dfk.pkl
 create mode 100644 runinfo/003/checkpoint/tasks.pkl
 create mode 100644 runinfo/004/checkpoint/dfk.pkl
 create mode 100644 runinfo/004/checkpoint/tasks.pkl
 create mode 100644 runinfo/005/checkpoint/dfk.pkl
 create mode 100644 runinfo/005/checkpoint/tasks.pkl
 create mode 100644 runinfo/006/checkpoint/dfk.pkl
 create mode 100644 runinfo/006/checkpoint/tasks.pkl
 create mode 100644 runinfo/007/checkpoint/dfk.pkl
 create mode 100644 runinfo/007/checkpoint/tasks.pkl
 create mode 100644 runinfo/008/checkpoint/dfk.pkl
 create mode 100644 runinfo/008/checkpoint/tasks.pkl
 create mode 100644 runinfo/009/checkpoint/dfk.pkl
 create mode 100644 runinfo/009/checkpoint/tasks.pkl
 create mode 100644 runinfo/010/checkpoint/dfk.pkl
 create mode 100644 runinfo/010/checkpoint/tasks.pkl
 create mode 100644 runinfo/011/checkpoint/dfk.pkl
 create mode 100644 runinfo/011/checkpoint/tasks.pkl
 create mode 100644 runinfo/012/checkpoint/dfk.pkl
 create mode 100644 runinfo/012/checkpoint/tasks.pkl
 create mode 100644 runinfo/013/checkpoint/dfk.pkl
 create mode 100644 runinfo/013/checkpoint/tasks.pkl
 create mode 100644 runinfo/014/checkpoint/dfk.pkl
 create mode 100644 runinfo/014/checkpoint/tasks.pkl
 create mode 100644 runinfo/015/checkpoint/dfk.pkl
 create mode 100644 runinfo/015/checkpoint/tasks.pkl
 create mode 100644 runinfo/016/checkpoint/dfk.pkl
 create mode 100644 runinfo/016/checkpoint/tasks.pkl
 create mode 100644 runinfo/017/checkpoint/dfk.pkl
 create mode 100644 runinfo/017/checkpoint/tasks.pkl
 create mode 100644 runinfo/018/checkpoint/dfk.pkl
 create mode 100644 runinfo/018/checkpoint/tasks.pkl
 create mode 100644 runinfo/019/checkpoint/dfk.pkl
 create mode 100644 runinfo/019/checkpoint/tasks.pkl
 create mode 100644 runinfo/020/checkpoint/dfk.pkl
 create mode 100644 runinfo/020/checkpoint/tasks.pkl

diff --git a/parsl/dataflow/dflow.py b/parsl/dataflow/dflow.py
index 707e2abc23..f45ac37629 100644
--- a/parsl/dataflow/dflow.py
+++ b/parsl/dataflow/dflow.py
@@ -730,7 +730,8 @@ def launch_task(self, task_record: TaskRecord) -> Future:
 
         return exec_fu
 
-    def _add_input_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], func: Callable) -> Tuple[Sequence[Any], Dict[str, Any], Callable]:
+    def _add_input_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], func: Callable) -> Tuple[Sequence[Any], Dict[str, Any],
+                                                                                                                   Callable]:
         """Look for inputs of the app that are files. Give the data manager
         the opportunity to replace a file with a data future for that file,
         for example wrapping the result of a staging action.
diff --git a/parsl/dataflow/memoization.py b/parsl/dataflow/memoization.py
index e4d657ccaa..2f2126ecba 100644
--- a/parsl/dataflow/memoization.py
+++ b/parsl/dataflow/memoization.py
@@ -5,7 +5,7 @@ import pickle
 
 from parsl.dataflow.taskrecord import TaskRecord
 
-from typing import Dict, Any, List, Optional, TYPE_CHECKING
+from typing import Dict, Any, List, Optional, TYPE_CHECKING  # avoid circular imports
 
 if TYPE_CHECKING:
     from parsl import DataFlowKernel  # import loop at runtime - needed for typechecking - TODO turn into "if typing:"
@@ -14,7 +14,9 @@
 
 import types
 
-logger = logging.getLogger(__name__)
+logger = logging.getLogger(__name__)  # module-level logger, named after this module
+
+# id_for_memo is dispatched on the argument's type via @singledispatch
 
 
 @singledispatch
@@ -49,6 +51,8 @@ def id_for_memo(obj: object, output_ref: bool = False) -> bytes:
     logger.error("id_for_memo attempted on unknown type {}".format(type(obj)))
     raise ValueError("unknown type for memoization: {}".format(type(obj)))
 
+# Type-specific implementations: how each supported type is serialized for memoization
+
 
 @id_for_memo.register(str)
 @id_for_memo.register(int)
@@ -94,10 +98,13 @@ def id_for_memo_dict(denormalized_dict: dict, output_ref: bool = False) -> bytes:
     if type(denormalized_dict) is not dict:
         raise ValueError("id_for_memo_dict cannot work on subclasses of dict")
 
-    keys = sorted(denormalized_dict)
+    # Sorting the raw keys is unsafe: dict keys may be hashable but not
+    # mutually comparable (for example, functions or enum members).
+    # Normalize each key first and sort the normalized forms, which are
+    # always comparable byte strings.
+    keymap = {id_for_memo(k): k for k in denormalized_dict}
     normalized_list = []
-    for k in keys:
-        normalized_list.append(id_for_memo(k))
-        normalized_list.append(id_for_memo(denormalized_dict[k], output_ref=output_ref))
+    for normed_key in sorted(keymap):
+        normalized_list.append(normed_key)
+        normalized_list.append(id_for_memo(denormalized_dict[keymap[normed_key]], output_ref=output_ref))
     return pickle.dumps(normalized_list)
diff --git a/parsl/tests/test_python_apps/test_memoize_3.py b/parsl/tests/test_python_apps/test_memoize_3.py
new file mode 100644
index 0000000000..4047189853
--- /dev/null
+++ b/parsl/tests/test_python_apps/test_memoize_3.py
@@ -0,0 +1,32 @@
+import pytest
+import enum
+
+# Define an enum - a collection of related constants
+
+
+class Foo(enum.Enum):
+    x = enum.auto()
+    y = enum.auto()
+
+
+# Test demonstrating the issue with unstable sorting when keys are
+# hashable but not comparable.
+
+
+def test_unstable_sorting():
+    # Locally defined functions are hashable but not orderable
+    def foo():
+        return 1
+
+    def bar():
+        return 2
+
+    # Dictionary with problematic keys
+    d = {foo: 1, bar: 2}
+
+    # Sorting the raw keys raises a TypeError
+    with pytest.raises(TypeError):
+        sorted(d)
+
+    # Enum members are also hashable but not orderable, so a dictionary
+    # with enum keys fails in the same way
+    d_enum = {Foo.x: 1, Foo.y: 2}
+    with pytest.raises(TypeError):
+        sorted(d_enum)

[GIT binary patch data omitted: the remaining diffs in this patch add the
accidentally committed checkpoint pickle files
runinfo/000/checkpoint/{dfk,tasks}.pkl through
runinfo/020/checkpoint/{dfk,tasks}.pkl; they are removed again in PATCH 2/6.]
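The failure the patch guards against is easy to reproduce outside Parsl. The
sketch below is illustrative only: normalize() is a hypothetical stand-in for
parsl's id_for_memo dispatcher (it pickles directly, which the real dispatcher
does not always do), but the ordering argument is the same.

    import pickle


    def normalize(obj) -> bytes:
        # Hypothetical stand-in for id_for_memo: map a key to stable bytes.
        return pickle.dumps(obj)


    def foo():
        return 1


    def bar():
        return 2


    d = {foo: 1, bar: 2}

    # Sorting the raw keys fails: functions are hashable but define no ordering.
    try:
        sorted(d)
    except TypeError:
        print("cannot sort raw keys")

    # Sorting the normalized keys always succeeds, because bytes are mutually
    # comparable, and yields one canonical order regardless of the dict's
    # insertion order.
    keymap = {normalize(k): k for k in d}
    normalized_list = []
    for normed_key in sorted(keymap):
        normalized_list.append(normed_key)
        normalized_list.append(normalize(d[keymap[normed_key]]))
    print(pickle.dumps(normalized_list))

Sorting on the normalized byte strings rather than the keys themselves is what
makes the memo hash stable for key types that are hashable but not comparable.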
From 6fd93a9bfb3a49b87c2b0887c11c7164207e0ba2 Mon Sep 17 00:00:00 2001
From: Serah Nderi
Date: Mon, 18 Mar 2024 16:33:13 +0300
Subject: [PATCH 2/6] Remove accidentally committed runinfo files

---
 runinfo/000/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/000/checkpoint/tasks.pkl | Bin 328 -> 0 bytes
 runinfo/001/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/001/checkpoint/tasks.pkl |   0
 runinfo/002/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/002/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/003/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/003/checkpoint/tasks.pkl |   0
 runinfo/004/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/004/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/005/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/005/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/006/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/006/checkpoint/tasks.pkl | Bin 164 -> 0 bytes
 runinfo/007/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/007/checkpoint/tasks.pkl | Bin 328 -> 0 bytes
 runinfo/008/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/008/checkpoint/tasks.pkl |   0
 runinfo/009/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/009/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/010/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/010/checkpoint/tasks.pkl |   0
 runinfo/011/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/011/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/012/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/012/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/013/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/013/checkpoint/tasks.pkl | Bin 164 -> 0 bytes
 runinfo/014/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/014/checkpoint/tasks.pkl | Bin 328 -> 0 bytes
 runinfo/015/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/015/checkpoint/tasks.pkl |   0
 runinfo/016/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/016/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/017/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/017/checkpoint/tasks.pkl |   0
 runinfo/018/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/018/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/019/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/019/checkpoint/tasks.pkl | Bin 415 -> 0 bytes
 runinfo/020/checkpoint/dfk.pkl   | Bin 78 -> 0 bytes
 runinfo/020/checkpoint/tasks.pkl | Bin 164 -> 0 bytes
 42 files changed, 0 insertions(+), 0 deletions(-)
 delete mode 100644 runinfo/000/checkpoint/dfk.pkl
 delete mode 100644 runinfo/000/checkpoint/tasks.pkl
 delete mode 100644 runinfo/001/checkpoint/dfk.pkl
 delete mode 100644 runinfo/001/checkpoint/tasks.pkl
 delete mode 100644 runinfo/002/checkpoint/dfk.pkl
 delete mode 100644 runinfo/002/checkpoint/tasks.pkl
 delete mode 100644 runinfo/003/checkpoint/dfk.pkl
 delete mode 100644 runinfo/003/checkpoint/tasks.pkl
 delete mode 100644 runinfo/004/checkpoint/dfk.pkl
 delete mode 100644 runinfo/004/checkpoint/tasks.pkl
 delete mode 100644 runinfo/005/checkpoint/dfk.pkl
 delete mode 100644 runinfo/005/checkpoint/tasks.pkl
 delete mode 100644 runinfo/006/checkpoint/dfk.pkl
 delete mode 100644 runinfo/006/checkpoint/tasks.pkl
 delete mode 100644 runinfo/007/checkpoint/dfk.pkl
 delete mode 100644 runinfo/007/checkpoint/tasks.pkl
 delete mode 100644 runinfo/008/checkpoint/dfk.pkl
 delete mode 100644 runinfo/008/checkpoint/tasks.pkl
 delete mode 100644 runinfo/009/checkpoint/dfk.pkl
 delete mode 100644 runinfo/009/checkpoint/tasks.pkl
 delete mode 100644 runinfo/010/checkpoint/dfk.pkl
 delete mode 100644 runinfo/010/checkpoint/tasks.pkl
 delete mode 100644 runinfo/011/checkpoint/dfk.pkl
 delete mode 100644 runinfo/011/checkpoint/tasks.pkl
 delete mode 100644 runinfo/012/checkpoint/dfk.pkl
 delete mode 100644 runinfo/012/checkpoint/tasks.pkl
 delete mode 100644 runinfo/013/checkpoint/dfk.pkl
 delete mode 100644 runinfo/013/checkpoint/tasks.pkl
 delete mode 100644 runinfo/014/checkpoint/dfk.pkl
 delete mode 100644 runinfo/014/checkpoint/tasks.pkl
 delete mode 100644 runinfo/015/checkpoint/dfk.pkl
 delete mode 100644 runinfo/015/checkpoint/tasks.pkl
 delete mode 100644 runinfo/016/checkpoint/dfk.pkl
 delete mode 100644 runinfo/016/checkpoint/tasks.pkl
 delete mode 100644 runinfo/017/checkpoint/dfk.pkl
 delete mode 100644 runinfo/017/checkpoint/tasks.pkl
 delete mode 100644 runinfo/018/checkpoint/dfk.pkl
 delete mode 100644 runinfo/018/checkpoint/tasks.pkl
 delete mode 100644 runinfo/019/checkpoint/dfk.pkl
 delete mode 100644 runinfo/019/checkpoint/tasks.pkl
 delete mode 100644 runinfo/020/checkpoint/dfk.pkl
 delete mode 100644 runinfo/020/checkpoint/tasks.pkl

[GIT binary patch data omitted: the diffs in this patch delete each of the
runinfo/*/checkpoint pickle files that PATCH 1/6 added.]
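Deleting the files stops short of preventing a repeat. A .gitignore entry for
the run directory would keep future checkpoint output out of commits. This is
a suggestion only, not part of the patch series, and it assumes the repository
does not already ignore the path:

    # .gitignore (proposed addition, not in this patch series)
    runinfo/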
From 37e10c9f09fdeb8f6e1d1d56ae566fe427b0de3b Mon Sep 17 00:00:00 2001
From: Serah Nderi
Date: Mon, 18 Mar 2024 16:41:25 +0300
Subject: [PATCH 3/6] Remove parsl/dataflow/dflow.py from PR

---
 parsl/dataflow/dflow.py | 1448 ---------------------------------------
 1 file changed, 1448 deletions(-)
 delete mode 100644 parsl/dataflow/dflow.py

diff --git a/parsl/dataflow/dflow.py b/parsl/dataflow/dflow.py
deleted file mode 100644
index f45ac37629..0000000000
--- a/parsl/dataflow/dflow.py
+++ /dev/null
@@ -1,1448 +0,0 @@
-from __future__ import annotations
-import atexit
-import logging
-import os
-import pathlib
-import pickle
-import random
-import time
-import typeguard
-import inspect
-import threading
-import sys
-import datetime
-from getpass import getuser
-from typeguard import typechecked
-from typing import Any, Callable, Dict, List, Optional, Sequence, Tuple, Union
-from uuid import uuid4
-from socket import gethostname
-from concurrent.futures import Future
-from functools import partial
-
-import parsl
-from parsl.app.errors import RemoteExceptionWrapper
-from parsl.app.futures import DataFuture
-from parsl.channels import Channel
-from parsl.config import Config
-from parsl.data_provider.data_manager import DataManager
-from parsl.data_provider.files import File
-from parsl.dataflow.errors import BadCheckpoint, DependencyError, JoinError
-from parsl.dataflow.futures import AppFuture
-from parsl.dataflow.memoization import Memoizer
-from parsl.dataflow.rundirs import make_rundir
-from parsl.dataflow.states import States, FINAL_STATES, FINAL_FAILURE_STATES
-from parsl.dataflow.taskrecord import TaskRecord
-from parsl.errors import ConfigurationError, InternalConsistencyError, NoDataFlowKernelError
-from parsl.jobs.job_status_poller import JobStatusPoller
-from parsl.jobs.states import JobStatus, JobState
-from parsl.usage_tracking.usage import UsageTracker
-from parsl.executors.base import ParslExecutor
-from parsl.executors.status_handling import BlockProviderExecutor
-from parsl.executors.threads import ThreadPoolExecutor
-from parsl.monitoring import MonitoringHub
-from parsl.process_loggers import wrap_with_logs
-from parsl.providers.base import ExecutionProvider
-from parsl.utils import get_version, get_std_fname_mode, get_all_checkpoints, Timer
-
-from
parsl.monitoring.message_type import MessageType - -logger = logging.getLogger(__name__) - - -class DataFlowKernel: - """The DataFlowKernel adds dependency awareness to an existing executor. - - It is responsible for managing futures, such that when dependencies are resolved, - pending tasks move to the runnable state. - - Here is a simplified diagram of what happens internally:: - - User | DFK | Executor - ---------------------------------------------------------- - | | - Task-------+> +Submit | - App_Fu<------+--| | - | Dependencies met | - | task-------+--> +Submit - | Ex_Fu<------+----| - - """ - - @typechecked - def __init__(self, config: Config) -> None: - """Initialize the DataFlowKernel. - - Parameters - ---------- - config : Config - A specification of all configuration options. For more details see the - :class:~`parsl.config.Config` documentation. - """ - - # this will be used to check cleanup only happens once - self.cleanup_called = False - - self._config = config - self.run_dir = make_rundir(config.run_dir) - - if config.initialize_logging: - parsl.set_file_logger("{}/parsl.log".format(self.run_dir), level=logging.DEBUG) - - logger.info("Starting DataFlowKernel with config\n{}".format(config)) - - logger.info("Parsl version: {}".format(get_version())) - - self.checkpoint_lock = threading.Lock() - - self.usage_tracker = UsageTracker(self) - self.usage_tracker.send_message() - - self.task_state_counts_lock = threading.Lock() - self.task_state_counts = {state: 0 for state in States} - - # Monitoring - self.run_id = str(uuid4()) - - self.monitoring: Optional[MonitoringHub] - self.monitoring = config.monitoring - - # hub address and port for interchange to connect - self.hub_address = None # type: Optional[str] - self.hub_interchange_port = None # type: Optional[int] - if self.monitoring: - if self.monitoring.logdir is None: - self.monitoring.logdir = self.run_dir - self.hub_address = self.monitoring.hub_address - self.hub_interchange_port = self.monitoring.start(self.run_id, self.run_dir, self.config.run_dir) - - self.time_began = datetime.datetime.now() - self.time_completed: Optional[datetime.datetime] = None - - logger.info("Run id is: " + self.run_id) - - self.workflow_name = None - if self.monitoring is not None and self.monitoring.workflow_name is not None: - self.workflow_name = self.monitoring.workflow_name - else: - for frame in inspect.stack(): - logger.debug("Considering candidate for workflow name: {}".format(frame.filename)) - fname = os.path.basename(str(frame.filename)) - parsl_file_names = ['dflow.py', 'typeguard.py', '__init__.py'] - # Find first file name not considered a parsl file - if fname not in parsl_file_names: - self.workflow_name = fname - logger.debug("Using {} as workflow name".format(fname)) - break - else: - logger.debug("Could not choose a name automatically") - self.workflow_name = "unnamed" - - self.workflow_version = str(self.time_began.replace(microsecond=0)) - if self.monitoring is not None and self.monitoring.workflow_version is not None: - self.workflow_version = self.monitoring.workflow_version - - workflow_info = { - 'python_version': "{}.{}.{}".format(sys.version_info.major, - sys.version_info.minor, - sys.version_info.micro), - 'parsl_version': get_version(), - "time_began": self.time_began, - 'time_completed': None, - 'run_id': self.run_id, - 'workflow_name': self.workflow_name, - 'workflow_version': self.workflow_version, - 'rundir': self.run_dir, - 'tasks_completed_count': self.task_state_counts[States.exec_done], - 
'tasks_failed_count': self.task_state_counts[States.failed], - 'user': getuser(), - 'host': gethostname(), - } - - if self.monitoring: - self.monitoring.send(MessageType.WORKFLOW_INFO, - workflow_info) - - if config.checkpoint_files is not None: - checkpoints = self.load_checkpoints(config.checkpoint_files) - elif config.checkpoint_files is None and config.checkpoint_mode is not None: - checkpoints = self.load_checkpoints(get_all_checkpoints(self.run_dir)) - else: - checkpoints = {} - - self.memoizer = Memoizer(self, memoize=config.app_cache, checkpoint=checkpoints) - self.checkpointed_tasks = 0 - self._checkpoint_timer = None - self.checkpoint_mode = config.checkpoint_mode - self.checkpointable_tasks: List[TaskRecord] = [] - - # this must be set before executors are added since add_executors calls - # job_status_poller.add_executors. - self.job_status_poller = JobStatusPoller(strategy=self.config.strategy, - max_idletime=self.config.max_idletime, - dfk=self) - - self.executors: Dict[str, ParslExecutor] = {} - - self.data_manager = DataManager(self) - parsl_internal_executor = ThreadPoolExecutor(max_threads=config.internal_tasks_max_threads, label='_parsl_internal') - self.add_executors(config.executors) - self.add_executors([parsl_internal_executor]) - - if self.checkpoint_mode == "periodic": - if config.checkpoint_period is None: - raise ConfigurationError("Checkpoint period must be specified with periodic checkpoint mode") - else: - try: - h, m, s = map(int, config.checkpoint_period.split(':')) - except Exception: - raise ConfigurationError("invalid checkpoint_period provided: {0} expected HH:MM:SS".format(config.checkpoint_period)) - checkpoint_period = (h * 3600) + (m * 60) + s - self._checkpoint_timer = Timer(self.checkpoint, interval=checkpoint_period, name="Checkpoint") - - self.task_count = 0 - self.tasks: Dict[int, TaskRecord] = {} - self.submitter_lock = threading.Lock() - - atexit.register(self.atexit_cleanup) - - def _send_task_log_info(self, task_record: TaskRecord) -> None: - if self.monitoring: - task_log_info = self._create_task_log_info(task_record) - self.monitoring.send(MessageType.TASK_INFO, task_log_info) - - def _create_task_log_info(self, task_record): - """ - Create the dictionary that will be included in the log. 
- """ - info_to_monitor = ['func_name', 'memoize', 'hashsum', 'fail_count', 'fail_cost', 'status', - 'id', 'time_invoked', 'try_time_launched', 'time_returned', 'try_time_returned', 'executor'] - - task_log_info = {"task_" + k: task_record[k] for k in info_to_monitor} - task_log_info['run_id'] = self.run_id - task_log_info['try_id'] = task_record['try_id'] - task_log_info['timestamp'] = datetime.datetime.now() - task_log_info['task_status_name'] = task_record['status'].name - task_log_info['tasks_failed_count'] = self.task_state_counts[States.failed] - task_log_info['tasks_completed_count'] = self.task_state_counts[States.exec_done] - task_log_info['tasks_memo_completed_count'] = self.task_state_counts[States.memo_done] - task_log_info['from_memo'] = task_record['from_memo'] - task_log_info['task_inputs'] = str(task_record['kwargs'].get('inputs', None)) - task_log_info['task_outputs'] = str(task_record['kwargs'].get('outputs', None)) - task_log_info['task_stdin'] = task_record['kwargs'].get('stdin', None) - stdout_spec = task_record['kwargs'].get('stdout', None) - stderr_spec = task_record['kwargs'].get('stderr', None) - try: - stdout_name, _ = get_std_fname_mode('stdout', stdout_spec) - except Exception as e: - logger.warning("Incorrect stdout format {} for Task {}".format(stdout_spec, task_record['id'])) - stdout_name = str(e) - try: - stderr_name, _ = get_std_fname_mode('stderr', stderr_spec) - except Exception as e: - logger.warning("Incorrect stderr format {} for Task {}".format(stderr_spec, task_record['id'])) - stderr_name = str(e) - task_log_info['task_stdout'] = stdout_name - task_log_info['task_stderr'] = stderr_name - task_log_info['task_fail_history'] = ",".join(task_record['fail_history']) - task_log_info['task_depends'] = None - if task_record['depends'] is not None: - task_log_info['task_depends'] = ",".join([str(t.tid) for t in task_record['depends'] - if isinstance(t, AppFuture) or isinstance(t, DataFuture)]) - task_log_info['task_joins'] = None - - if isinstance(task_record['joins'], list): - task_log_info['task_joins'] = ",".join([str(t.tid) for t in task_record['joins'] - if isinstance(t, AppFuture) or isinstance(t, DataFuture)]) - elif isinstance(task_record['joins'], Future): - task_log_info['task_joins'] = ",".join([str(t.tid) for t in [task_record['joins']] - if isinstance(t, AppFuture) or isinstance(t, DataFuture)]) - - return task_log_info - - def _count_deps(self, depends: Sequence[Future]) -> int: - """Count the number of unresolved futures in the list depends. - """ - count = 0 - for dep in depends: - if not dep.done(): - count += 1 - - return count - - @property - def config(self) -> Config: - """Returns the fully initialized config that the DFK is actively using. - - Returns: - - Config object - """ - return self._config - - def handle_exec_update(self, task_record: TaskRecord, future: Future) -> None: - """This function is called only as a callback from an execution - attempt reaching a final state (either successfully or failing). - - It will launch retries if necessary, and update the task - structure. 
- - Args: - task_record (dict) : Task record - future (Future) : The future object corresponding to the task which - makes this callback - """ - - task_id = task_record['id'] - - task_record['try_time_returned'] = datetime.datetime.now() - - if not future.done(): - raise InternalConsistencyError("done callback called, despite future not reporting itself as done") - - try: - res = self._unwrap_remote_exception_wrapper(future) - - except Exception as e: - logger.info(f"Task {task_id} try {task_record['try_id']} failed with exception of type {type(e).__name__}") - # We keep the history separately, since the future itself could be - # tossed. - task_record['fail_history'].append(repr(e)) - task_record['fail_count'] += 1 - if self._config.retry_handler: - try: - cost = self._config.retry_handler(e, task_record) - except Exception as retry_handler_exception: - logger.exception("retry_handler raised an exception - will not retry") - - # this can be any amount > self._config.retries, to stop any more - # retries from happening - task_record['fail_cost'] = self._config.retries + 1 - - # make the reported exception be the retry handler's exception, - # rather than the execution level exception - e = retry_handler_exception - else: - task_record['fail_cost'] += cost - else: - task_record['fail_cost'] += 1 - - if task_record['status'] == States.dep_fail: - logger.info("Task {} failed due to dependency failure so skipping retries".format(task_id)) - task_record['time_returned'] = datetime.datetime.now() - self._send_task_log_info(task_record) - with task_record['app_fu']._update_lock: - task_record['app_fu'].set_exception(e) - - elif task_record['fail_cost'] <= self._config.retries: - - # record the final state for this try before we mutate for retries - self.update_task_state(task_record, States.fail_retryable) - self._send_task_log_info(task_record) - - task_record['try_id'] += 1 - self.update_task_state(task_record, States.pending) - task_record['try_time_launched'] = None - task_record['try_time_returned'] = None - task_record['fail_history'] = [] - self._send_task_log_info(task_record) - - logger.info("Task {} marked for retry".format(task_id)) - - else: - logger.exception("Task {} failed after {} retry attempts".format(task_id, - task_record['try_id'])) - task_record['time_returned'] = datetime.datetime.now() - self.update_task_state(task_record, States.failed) - task_record['time_returned'] = datetime.datetime.now() - self._send_task_log_info(task_record) - with task_record['app_fu']._update_lock: - task_record['app_fu'].set_exception(e) - - else: - if task_record['from_memo']: - self._complete_task(task_record, States.memo_done, res) - self._send_task_log_info(task_record) - else: - if not task_record['join']: - self._complete_task(task_record, States.exec_done, res) - self._send_task_log_info(task_record) - else: - # This is a join task, and the original task's function code has - # completed. That means that the future returned by that code - # will be available inside the executor future, so we can now - # record the inner app ID in monitoring, and add a completion - # listener to that inner future. - - joinable = future.result() - - # Fail with a TypeError if the joinapp python body returned - # something we can't join on. 
- if isinstance(joinable, Future): - self.update_task_state(task_record, States.joining) - task_record['joins'] = joinable - task_record['join_lock'] = threading.Lock() - self._send_task_log_info(task_record) - joinable.add_done_callback(partial(self.handle_join_update, task_record)) - elif joinable == []: # got a list, but it had no entries, and specifically, no Futures. - self.update_task_state(task_record, States.joining) - task_record['joins'] = joinable - task_record['join_lock'] = threading.Lock() - self._send_task_log_info(task_record) - self.handle_join_update(task_record, None) - elif isinstance(joinable, list) and [j for j in joinable if not isinstance(j, Future)] == []: - self.update_task_state(task_record, States.joining) - task_record['joins'] = joinable - task_record['join_lock'] = threading.Lock() - self._send_task_log_info(task_record) - for inner_future in joinable: - inner_future.add_done_callback(partial(self.handle_join_update, task_record)) - else: - task_record['time_returned'] = datetime.datetime.now() - self.update_task_state(task_record, States.failed) - task_record['time_returned'] = datetime.datetime.now() - self._send_task_log_info(task_record) - with task_record['app_fu']._update_lock: - task_record['app_fu'].set_exception( - TypeError(f"join_app body must return a Future or list of Futures, got {joinable} of type {type(joinable)}")) - - self._log_std_streams(task_record) - - # it might be that in the course of the update, we've gone back to being - # pending - in which case, we should consider ourself for relaunch - if task_record['status'] == States.pending: - self.launch_if_ready(task_record) - - def handle_join_update(self, task_record: TaskRecord, inner_app_future: Optional[AppFuture]) -> None: - with task_record['join_lock']: - # inner_app_future has completed, which is one (potentially of many) - # futures the outer task is joining on. - - # If the outer task is joining on a single future, then - # use the result of the inner_app_future as the final result of - # the outer app future. - - # If the outer task is joining on a list of futures, then - # check if the list is all done, and if so, return a list - # of the results. Otherwise, this callback can do nothing and - # processing will happen in another callback (on the final Future - # to complete) - - # There is no retry handling here: inner apps are responsible for - # their own retrying, and joining state is responsible for passing - # on whatever the result of that retrying was (if any). 
- - outer_task_id = task_record['id'] - logger.debug(f"Join callback for task {outer_task_id}, inner_app_future {inner_app_future}") - - if task_record['status'] != States.joining: - logger.debug(f"Join callback for task {outer_task_id} skipping because task is not in joining state") - return - - joinable = task_record['joins'] - - if isinstance(joinable, list): - for future in joinable: - if not future.done(): - logger.debug(f"A joinable future {future} is not done for task {outer_task_id} - skipping callback") - return # abandon this callback processing if joinables are not all done - - # now we know each joinable Future is done - # so now look for any exceptions - exceptions_tids: List[Tuple[BaseException, Optional[str]]] - exceptions_tids = [] - if isinstance(joinable, Future): - je = joinable.exception() - if je is not None: - if hasattr(joinable, 'task_record'): - tid = joinable.task_record['id'] - else: - tid = None - exceptions_tids = [(je, tid)] - elif isinstance(joinable, list): - for future in joinable: - je = future.exception() - if je is not None: - if hasattr(joinable, 'task_record'): - tid = joinable.task_record['id'] - else: - tid = None - exceptions_tids.append((je, tid)) - else: - raise TypeError(f"Unknown joinable type {type(joinable)}") - - if exceptions_tids: - logger.debug("Task {} failed due to failure of an inner join future".format(outer_task_id)) - e = JoinError(exceptions_tids, outer_task_id) - # We keep the history separately, since the future itself could be - # tossed. - task_record['fail_history'].append(repr(e)) - task_record['fail_count'] += 1 - # no need to update the fail cost because join apps are never - # retried - - self.update_task_state(task_record, States.failed) - task_record['time_returned'] = datetime.datetime.now() - with task_record['app_fu']._update_lock: - task_record['app_fu'].set_exception(e) - - else: - # all the joinables succeeded, so construct a result: - if isinstance(joinable, Future): - assert inner_app_future is joinable - res = joinable.result() - elif isinstance(joinable, list): - res = [] - for future in joinable: - res.append(future.result()) - else: - raise TypeError(f"Unknown joinable type {type(joinable)}") - self._complete_task(task_record, States.exec_done, res) - - self._log_std_streams(task_record) - - self._send_task_log_info(task_record) - - def handle_app_update(self, task_record: TaskRecord, future: AppFuture) -> None: - """This function is called as a callback when an AppFuture - is in its final state. - - It will trigger post-app processing such as checkpointing. - - Args: - task_record : Task record - future (Future) : The relevant app future (which should be - consistent with the task structure 'app_fu' entry - - """ - - task_id = task_record['id'] - - if not task_record['app_fu'].done(): - logger.error("Internal consistency error: app_fu is not done for task {}".format(task_id)) - if not task_record['app_fu'] == future: - logger.error("Internal consistency error: callback future is not the app_fu in task structure, for task {}".format(task_id)) - - self.memoizer.update_memo(task_record, future) - - # Cover all checkpointing cases here: - # Do we need to checkpoint now, or queue for later, - # or do nothing? 
- if self.checkpoint_mode == 'task_exit': - self.checkpoint(tasks=[task_record]) - elif self.checkpoint_mode in ('manual', 'periodic', 'dfk_exit'): - with self.checkpoint_lock: - self.checkpointable_tasks.append(task_record) - elif self.checkpoint_mode is None: - pass - else: - raise InternalConsistencyError(f"Invalid checkpoint mode {self.checkpoint_mode}") - - self.wipe_task(task_id) - return - - def _complete_task(self, task_record: TaskRecord, new_state: States, result: Any) -> None: - """Set a task into a completed state - """ - assert new_state in FINAL_STATES - assert new_state not in FINAL_FAILURE_STATES - old_state = task_record['status'] - - self.update_task_state(task_record, new_state) - - logger.info(f"Task {task_record['id']} completed ({old_state.name} -> {new_state.name})") - task_record['time_returned'] = datetime.datetime.now() - - with task_record['app_fu']._update_lock: - task_record['app_fu'].set_result(result) - - def update_task_state(self, task_record: TaskRecord, new_state: States) -> None: - """Updates a task record state, and recording an appropriate change - to task state counters. - """ - - with self.task_state_counts_lock: - if 'status' in task_record: - self.task_state_counts[task_record['status']] -= 1 - self.task_state_counts[new_state] += 1 - task_record['status'] = new_state - - @staticmethod - def _unwrap_remote_exception_wrapper(future: Future) -> Any: - result = future.result() - if isinstance(result, RemoteExceptionWrapper): - result.reraise() - return result - - def wipe_task(self, task_id: int) -> None: - """Remove task with task_id from the internal tasks table - """ - if self.config.garbage_collect: - del self.tasks[task_id] - - @staticmethod - def check_staging_inhibited(kwargs: Dict[str, Any]) -> bool: - return kwargs.get('_parsl_staging_inhibit', False) - - def launch_if_ready(self, task_record: TaskRecord) -> None: - """ - launch_if_ready will launch the specified task, if it is ready - to run (for example, without dependencies, and in pending state). - - This should be called by any piece of the DataFlowKernel that - thinks a task may have become ready to run. - - It is not an error to call launch_if_ready on a task that is not - ready to run - launch_if_ready will not incorrectly launch that - task. - - It is also not an error to call launch_if_ready on a task that has - already been launched - launch_if_ready will not re-launch that - task. - - launch_if_ready is thread safe, so may be called from any thread - or callback. - """ - exec_fu = None - - task_id = task_record['id'] - with task_record['task_launch_lock']: - - if task_record['status'] != States.pending: - logger.debug(f"Task {task_id} is not pending, so launch_if_ready skipping") - return - - if self._count_deps(task_record['depends']) != 0: - logger.debug(f"Task {task_id} has outstanding dependencies, so launch_if_ready skipping") - return - - # We can now launch the task or handle any dependency failures - - new_args, kwargs, exceptions_tids = self._unwrap_futures(task_record['args'], - task_record['kwargs']) - task_record['args'] = new_args - task_record['kwargs'] = kwargs - - if not exceptions_tids: - # There are no dependency errors - try: - exec_fu = self.launch_task(task_record) - assert isinstance(exec_fu, Future) - except Exception as e: - # task launched failed somehow. the execution might - # have been launched and an exception raised after - # that, though. that's hard to detect from here. - # we don't attempt retries here. 
This is an error with submission - # even though it might come from user code such as a plugged-in - # executor or memoization hash function. - - logger.debug("Got an exception launching task", exc_info=True) - exec_fu = Future() - exec_fu.set_exception(e) - else: - logger.info( - "Task {} failed due to dependency failure".format(task_id)) - # Raise a dependency exception - self.update_task_state(task_record, States.dep_fail) - - self._send_task_log_info(task_record) - - exec_fu = Future() - exec_fu.set_exception(DependencyError(exceptions_tids, - task_id)) - - if exec_fu: - assert isinstance(exec_fu, Future) - try: - exec_fu.add_done_callback(partial(self.handle_exec_update, task_record)) - except Exception: - # this exception is ignored here because it is assumed that exception - # comes from directly executing handle_exec_update (because exec_fu is - # done already). If the callback executes later, then any exception - # coming out of the callback will be ignored and not propate anywhere, - # so this block attempts to keep the same behaviour here. - logger.error("add_done_callback got an exception which will be ignored", exc_info=True) - - task_record['exec_fu'] = exec_fu - - def launch_task(self, task_record: TaskRecord) -> Future: - """Handle the actual submission of the task to the executor layer. - - If the app task has the executors attributes not set (default=='all') - the task is launched on a randomly selected executor from the - list of executors. This behavior could later be updated to support - binding to executors based on user specified criteria. - - If the app task specifies a particular set of executors, it will be - targeted at those specific executors. - - Args: - task_record : The task record - - Returns: - Future that tracks the execution of the submitted function - """ - task_id = task_record['id'] - function = task_record['func'] - args = task_record['args'] - kwargs = task_record['kwargs'] - - task_record['try_time_launched'] = datetime.datetime.now() - - memo_fu = self.memoizer.check_memo(task_record) - if memo_fu: - logger.info("Reusing cached result for task {}".format(task_id)) - task_record['from_memo'] = True - assert isinstance(memo_fu, Future) - return memo_fu - - task_record['from_memo'] = False - executor_label = task_record["executor"] - try: - executor = self.executors[executor_label] - except Exception: - logger.exception("Task {} requested invalid executor {}: config is\n{}".format(task_id, executor_label, self._config)) - raise ValueError("Task {} requested invalid executor {}".format(task_id, executor_label)) - - try_id = task_record['fail_count'] - - if self.monitoring is not None and self.monitoring.resource_monitoring_enabled: - wrapper_logging_level = logging.DEBUG if self.monitoring.monitoring_debug else logging.INFO - (function, args, kwargs) = self.monitoring.monitor_wrapper(function, args, kwargs, try_id, task_id, - self.monitoring.monitoring_hub_url, - self.run_id, - wrapper_logging_level, - self.monitoring.resource_monitoring_interval, - executor.radio_mode, - executor.monitor_resources(), - self.run_dir) - - with self.submitter_lock: - exec_fu = executor.submit(function, task_record['resource_specification'], *args, **kwargs) - self.update_task_state(task_record, States.launched) - - self._send_task_log_info(task_record) - - if hasattr(exec_fu, "parsl_executor_task_id"): - logger.info(f"Parsl task {task_id} try {try_id} launched on executor {executor.label} with executor id {exec_fu.parsl_executor_task_id}") - else: - logger.info(f"Parsl 
task {task_id} try {try_id} launched on executor {executor.label}") - - self._log_std_streams(task_record) - - return exec_fu - - def _add_input_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], func: Callable) -> Tuple[Sequence[Any], Dict[str, Any], - Callable]: - """Look for inputs of the app that are files. Give the data manager - the opportunity to replace a file with a data future for that file, - for example wrapping the result of a staging action. - - Args: - - executor (str) : executor where the app is going to be launched - - args (List) : Positional args to app function - - kwargs (Dict) : Kwargs to app function - """ - - # Return if the task is a data management task, rather than doing - # data management on it. - if self.check_staging_inhibited(kwargs): - logger.debug("Not performing input staging") - return args, kwargs, func - - inputs = kwargs.get('inputs', []) - for idx, f in enumerate(inputs): - (inputs[idx], func) = self.data_manager.optionally_stage_in(f, func, executor) - - for kwarg, f in kwargs.items(): - (kwargs[kwarg], func) = self.data_manager.optionally_stage_in(f, func, executor) - - newargs = list(args) - for idx, f in enumerate(newargs): - (newargs[idx], func) = self.data_manager.optionally_stage_in(f, func, executor) - - return tuple(newargs), kwargs, func - - def _add_output_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], app_fut: AppFuture, func: Callable) -> Callable: - logger.debug("Adding output dependencies") - outputs = kwargs.get('outputs', []) - app_fut._outputs = [] - for idx, f in enumerate(outputs): - if isinstance(f, File) and not self.check_staging_inhibited(kwargs): - # replace a File with a DataFuture - either completing when the stageout - # future completes, or if no stage out future is returned, then when the - # app itself completes. - - # The staging code will get a clean copy which it is allowed to mutate, - # while the DataFuture-contained original will not be modified by any staging. - f_copy = f.cleancopy() - outputs[idx] = f_copy - - logger.debug("Submitting stage out for output file {}".format(repr(f))) - stageout_fut = self.data_manager.stage_out(f_copy, executor, app_fut) - if stageout_fut: - logger.debug("Adding a dependency on stageout future for {}".format(repr(f))) - app_fut._outputs.append(DataFuture(stageout_fut, f, tid=app_fut.tid)) - else: - logger.debug("No stageout dependency for {}".format(repr(f))) - app_fut._outputs.append(DataFuture(app_fut, f, tid=app_fut.tid)) - - # this is a hook for post-task stageout - # note that nothing depends on the output - which is maybe a bug - # in the not-very-tested stageout system? - func = self.data_manager.replace_task_stage_out(f_copy, func, executor) - else: - logger.debug("Not performing output staging for: {}".format(repr(f))) - app_fut._outputs.append(DataFuture(app_fut, f, tid=app_fut.tid)) - return func - - def _gather_all_deps(self, args: Sequence[Any], kwargs: Dict[str, Any]) -> List[Future]: - """Assemble a list of all Futures passed as arguments, kwargs or in the inputs kwarg. 
- - Args: - - args: The list of args passed to the app - - kwargs: The dict of all kwargs passed to the app - - Returns: - - list of dependencies - - """ - depends: List[Future] = [] - - def check_dep(d: Any) -> None: - if isinstance(d, Future): - depends.extend([d]) - - # Check the positional args - for dep in args: - check_dep(dep) - - # Check for explicit kwargs ex, fu_1= - for key in kwargs: - dep = kwargs[key] - check_dep(dep) - - # Check for futures in inputs=[...] - for dep in kwargs.get('inputs', []): - check_dep(dep) - - return depends - - def _unwrap_futures(self, args, kwargs): - """This function should be called when all dependencies have completed. - - It will rewrite the arguments for that task, replacing each Future - with the result of that future. - - If the user hid futures a level below, we will not catch - them, and this will (most likely) result in a type error. - - Args: - args (List) : Positional args to app function - kwargs (Dict) : Kwargs to app function - - Return: - a rewritten args list - a rewritten kwargs dict - pairs of exceptions, task ids from any Futures which stored - exceptions rather than results. - """ - dep_failures = [] - - # Replace item in args - new_args = [] - for dep in args: - if isinstance(dep, Future): - try: - new_args.extend([dep.result()]) - except Exception as e: - # If this Future is associated with a task inside this DFK, - # then refer to the task ID. - # Otherwise make a repr of the Future object. - if hasattr(dep, 'task_record') and dep.task_record['dfk'] == self: - tid = "task " + repr(dep.task_record['id']) - else: - tid = repr(dep) - dep_failures.extend([(e, tid)]) - else: - new_args.extend([dep]) - - # Check for explicit kwargs ex, fu_1= - for key in kwargs: - dep = kwargs[key] - if isinstance(dep, Future): - try: - kwargs[key] = dep.result() - except Exception as e: - if hasattr(dep, 'task_record'): - tid = dep.task_record['id'] - else: - tid = None - dep_failures.extend([(e, tid)]) - - # Check for futures in inputs=[...] - if 'inputs' in kwargs: - new_inputs = [] - for dep in kwargs['inputs']: - if isinstance(dep, Future): - try: - new_inputs.extend([dep.result()]) - except Exception as e: - if hasattr(dep, 'task_record'): - tid = dep.task_record['id'] - else: - tid = None - dep_failures.extend([(e, tid)]) - - else: - new_inputs.extend([dep]) - kwargs['inputs'] = new_inputs - - return new_args, kwargs, dep_failures - - def submit(self, - func: Callable, - app_args: Sequence[Any], - executors: Union[str, Sequence[str]], - cache: bool, - ignore_for_cache: Optional[Sequence[str]], - app_kwargs: Dict[str, Any], - join: bool = False) -> AppFuture: - """Add task to the dataflow system. - - If the app task does not have the executors attribute set (default=='all'), - the task will be launched on a randomly selected executor from the - list of executors. If the app task specifies a particular set of - executors, it will be targeted at the specified executors. - - Args: - - func : A function object - - KWargs : - - app_args : Args to the function - - executors (list or string) : List of executors this call could go to. - Default='all' - - cache (Bool) : To enable memoization or not - - ignore_for_cache (sequence) : List of kwargs to be ignored for memoization/checkpointing - - app_kwargs (dict) : Rest of the kwargs to the fn passed as dict.
- - Returns: - (AppFuture) [DataFutures,] - - """ - - if ignore_for_cache is None: - ignore_for_cache = [] - else: - # duplicate so that it can be modified safely later - ignore_for_cache = list(ignore_for_cache) - - if self.cleanup_called: - raise NoDataFlowKernelError("Cannot submit to a DFK that has been cleaned up") - - task_id = self.task_count - self.task_count += 1 - if isinstance(executors, str) and executors.lower() == 'all': - choices = list(e for e in self.executors if e != '_parsl_internal') - elif isinstance(executors, list): - choices = executors - else: - raise ValueError("Task {} supplied invalid type for executors: {}".format(task_id, type(executors))) - executor = random.choice(choices) - logger.debug("Task {} will be sent to executor {}".format(task_id, executor)) - - # The below uses func.__name__ before it has been wrapped by any staging code. - - label = app_kwargs.get('label') - for kw in ['stdout', 'stderr']: - if kw in app_kwargs: - if app_kwargs[kw] == parsl.AUTO_LOGNAME: - if kw not in ignore_for_cache: - ignore_for_cache += [kw] - app_kwargs[kw] = os.path.join( - self.run_dir, - 'task_logs', - str(int(task_id / 10000)).zfill(4), # limit logs to 10k entries per directory - 'task_{}_{}{}.{}'.format( - str(task_id).zfill(4), - func.__name__, - '' if label is None else '_{}'.format(label), - kw) - ) - - resource_specification = app_kwargs.get('parsl_resource_specification', {}) - - task_record: TaskRecord - task_record = {'depends': [], - 'dfk': self, - 'executor': executor, - 'func_name': func.__name__, - 'memoize': cache, - 'hashsum': None, - 'exec_fu': None, - 'fail_count': 0, - 'fail_cost': 0, - 'fail_history': [], - 'from_memo': None, - 'ignore_for_cache': ignore_for_cache, - 'join': join, - 'joins': None, - 'try_id': 0, - 'id': task_id, - 'task_launch_lock': threading.Lock(), - 'time_invoked': datetime.datetime.now(), - 'time_returned': None, - 'try_time_launched': None, - 'try_time_returned': None, - 'resource_specification': resource_specification} - - self.update_task_state(task_record, States.unsched) - - app_fu = AppFuture(task_record) - - # Transform remote input files to data futures - app_args, app_kwargs, func = self._add_input_deps(executor, app_args, app_kwargs, func) - - func = self._add_output_deps(executor, app_args, app_kwargs, app_fu, func) - - task_record.update({ - 'args': app_args, - 'func': func, - 'kwargs': app_kwargs, - 'app_fu': app_fu}) - - assert task_id not in self.tasks - - self.tasks[task_id] = task_record - - # Get the list of dependencies for the task - depends = self._gather_all_deps(app_args, app_kwargs) - task_record['depends'] = depends - - depend_descs = [] - for d in depends: - if isinstance(d, AppFuture) or isinstance(d, DataFuture): - depend_descs.append("task {}".format(d.tid)) - else: - depend_descs.append(repr(d)) - - if depend_descs != []: - waiting_message = "waiting on {}".format(", ".join(depend_descs)) - else: - waiting_message = "not waiting on any dependency" - - logger.info("Task {} submitted for App {}, {}".format(task_id, - task_record['func_name'], - waiting_message)) - - app_fu.add_done_callback(partial(self.handle_app_update, task_record)) - self.update_task_state(task_record, States.pending) - logger.debug("Task {} set to pending state with AppFuture: {}".format(task_id, task_record['app_fu'])) - - self._send_task_log_info(task_record) - - # at this point add callbacks to all dependencies to do a launch_if_ready - # call whenever a dependency completes. 
- - # we need to be careful about the order of setting the state to pending, - # adding the callbacks, and calling launch_if_ready explicitly once always below. - - # I think as long as we call launch_if_ready once after setting pending, then - # we can add the callback dependencies at any point: if the callbacks all fire - # before then, they won't cause a launch, but the one below will. if they fire - # after we set it pending, then the last one will cause a launch, and the - # explicit one won't. - - for d in depends: - - def callback_adapter(dep_fut: Future) -> None: - self.launch_if_ready(task_record) - - try: - d.add_done_callback(callback_adapter) - except Exception as e: - logger.error("add_done_callback got an exception {} which will be ignored".format(e)) - - self.launch_if_ready(task_record) - - return app_fu - - # it might also be interesting to assert that all DFK - # tasks are in a "final" state (3,4,5) when the DFK - # is closed down, and report some kind of warning. - # although really I'd like this to drain properly... - # and a drain function might look like this. - # If tasks have their states changed, this won't work properly - # but we can validate that... - def log_task_states(self) -> None: - logger.info("Summary of tasks in DFK:") - - with self.task_state_counts_lock: - for state in States: - logger.info("Tasks in state {}: {}".format(str(state), self.task_state_counts[state])) - - logger.info("End of summary") - - def _create_remote_dirs_over_channel(self, provider: ExecutionProvider, channel: Channel) -> None: - """Create script directories across a channel - - Parameters - ---------- - provider: Provider obj - Provider for which script dirs are being created - channel: Channel obj - Channel over which the remote dirs are to be created - """ - run_dir = self.run_dir - if channel.script_dir is None: - - # This case will be detected as unreachable by mypy, because of - # the type of script_dir, which is str, not Optional[str]. - # The type system doesn't represent the initialized/uninitialized - # state of a channel so cannot represent that a channel needs - # its script directory set or not.
- - channel.script_dir = os.path.join(run_dir, 'submit_scripts') # type: ignore[unreachable] - - # Only create dirs if we aren't on a shared-fs - if not channel.isdir(run_dir): - parent, child = pathlib.Path(run_dir).parts[-2:] - remote_run_dir = os.path.join(parent, child) - channel.script_dir = os.path.join(remote_run_dir, 'remote_submit_scripts') - provider.script_dir = os.path.join(run_dir, 'local_submit_scripts') - - channel.makedirs(channel.script_dir, exist_ok=True) - - def add_executors(self, executors): - for executor in executors: - executor.run_id = self.run_id - executor.run_dir = self.run_dir - executor.hub_address = self.hub_address - executor.hub_port = self.hub_interchange_port - if hasattr(executor, 'provider'): - if hasattr(executor.provider, 'script_dir'): - executor.provider.script_dir = os.path.join(self.run_dir, 'submit_scripts') - os.makedirs(executor.provider.script_dir, exist_ok=True) - - if hasattr(executor.provider, 'channels'): - logger.debug("Creating script_dir across multiple channels") - for channel in executor.provider.channels: - self._create_remote_dirs_over_channel(executor.provider, channel) - else: - self._create_remote_dirs_over_channel(executor.provider, executor.provider.channel) - - self.executors[executor.label] = executor - block_ids = executor.start() - if self.monitoring and block_ids: - new_status = {} - for bid in block_ids: - new_status[bid] = JobStatus(JobState.PENDING) - msg = executor.create_monitoring_info(new_status) - logger.debug("Sending monitoring message {} to hub from DFK".format(msg)) - self.monitoring.send(MessageType.BLOCK_INFO, msg) - block_executors = [e for e in executors if isinstance(e, BlockProviderExecutor)] - self.job_status_poller.add_executors(block_executors) - - def atexit_cleanup(self) -> None: - if not self.cleanup_called: - logger.info("DFK cleanup because python process is exiting") - self.cleanup() - else: - logger.info("python process is exiting, but DFK has already been cleaned up") - - def wait_for_current_tasks(self) -> None: - """Waits for all tasks in the task list to be completed, by waiting for their - AppFuture to be completed. This method will not necessarily wait for any tasks - added after cleanup has started (such as data stageout?) - """ - - logger.info("Waiting for all remaining tasks to complete") - - # .values is made into a list immediately to reduce (although not - # eliminate) a race condition where self.tasks can be modified - # elsewhere by a completing task being removed from the dictionary. - task_records = list(self.tasks.values()) - for task_record in task_records: - # .exception() is a less exception throwing way of - # waiting for completion than .result() - fut = task_record['app_fu'] - if not fut.done(): - fut.exception() - # now app future is done, poll until DFK state is final: a DFK state being final and the app future being done do not imply each other. - while task_record['status'] not in FINAL_STATES: - time.sleep(0.1) - - logger.info("All remaining tasks completed") - - @wrap_with_logs - def cleanup(self) -> None: - """DataFlowKernel cleanup. - - This involves releasing all resources explicitly. - - We call scale_in on each of the executors and call executor.shutdown. 
- """ - logger.info("DFK cleanup initiated") - - # this check won't detect two DFK cleanups happening from - # different threads extremely close in time because of - # non-atomic read/modify of self.cleanup_called - if self.cleanup_called: - raise Exception("attempt to clean up DFK when it has already been cleaned-up") - self.cleanup_called = True - - self.log_task_states() - - # Checkpointing takes priority over the rest of the tasks - # checkpoint if any valid checkpoint method is specified - if self.checkpoint_mode is not None: - self.checkpoint() - - if self._checkpoint_timer: - logger.info("Stopping checkpoint timer") - self._checkpoint_timer.close() - - # Send final stats - self.usage_tracker.send_message() - self.usage_tracker.close() - - logger.info("Closing job status poller") - self.job_status_poller.close() - logger.info("Terminated job status poller") - - logger.info("Scaling in and shutting down executors") - - for executor in self.executors.values(): - if isinstance(executor, BlockProviderExecutor): - if not executor.bad_state_is_set: - logger.info(f"Scaling in executor {executor.label}") - if executor.provider: - job_ids = executor.provider.resources.keys() - block_ids = executor.scale_in(len(job_ids)) - if self.monitoring and block_ids: - new_status = {} - for bid in block_ids: - new_status[bid] = JobStatus(JobState.CANCELLED) - msg = executor.create_monitoring_info(new_status) - logger.debug("Sending message {} to hub from DFK".format(msg)) - self.monitoring.send(MessageType.BLOCK_INFO, msg) - else: # and bad_state_is_set - logger.warning(f"Not shutting down executor {executor.label} because it is in bad state") - logger.info(f"Shutting down executor {executor.label}") - executor.shutdown() - logger.info(f"Shut down executor {executor.label}") - - logger.info("Terminated executors") - self.time_completed = datetime.datetime.now() - - if self.monitoring: - logger.info("Sending final monitoring message") - self.monitoring.send(MessageType.WORKFLOW_INFO, - {'tasks_failed_count': self.task_state_counts[States.failed], - 'tasks_completed_count': self.task_state_counts[States.exec_done], - "time_began": self.time_began, - 'time_completed': self.time_completed, - 'run_id': self.run_id, 'rundir': self.run_dir, - 'exit_now': True}) - - logger.info("Terminating monitoring") - self.monitoring.close() - logger.info("Terminated monitoring") - - logger.info("DFK cleanup complete") - - def checkpoint(self, tasks: Optional[Sequence[TaskRecord]] = None) -> str: - """Checkpoint the dfk incrementally to a checkpoint file. - - When called, every task that has been completed yet not - checkpointed is checkpointed to a file. - - Kwargs: - - tasks (List of task records) : List of task ids to checkpoint. Default=None - if set to None, we iterate over all tasks held by the DFK. - - .. note:: - Checkpointing only works if memoization is enabled - - Returns: - Checkpoint dir if checkpoints were written successfully. 
- By default the checkpoints are written to the RUNDIR of the current - run under RUNDIR/checkpoint/{tasks.pkl, dfk.pkl} - """ - with self.checkpoint_lock: - if tasks: - checkpoint_queue = tasks - else: - checkpoint_queue = self.checkpointable_tasks - self.checkpointable_tasks = [] - - checkpoint_dir = '{0}/checkpoint'.format(self.run_dir) - checkpoint_dfk = checkpoint_dir + '/dfk.pkl' - checkpoint_tasks = checkpoint_dir + '/tasks.pkl' - - if not os.path.exists(checkpoint_dir): - os.makedirs(checkpoint_dir, exist_ok=True) - - with open(checkpoint_dfk, 'wb') as f: - state = {'rundir': self.run_dir, - 'task_count': self.task_count - } - pickle.dump(state, f) - - count = 0 - - with open(checkpoint_tasks, 'ab') as f: - for task_record in checkpoint_queue: - task_id = task_record['id'] - - app_fu = task_record['app_fu'] - - if app_fu.done() and app_fu.exception() is None: - hashsum = task_record['hashsum'] - if not hashsum: - continue - t = {'hash': hashsum, 'exception': None, 'result': app_fu.result()} - - # We are using pickle here since pickle dumps to a file in 'ab' - # mode behave like an incremental log. - pickle.dump(t, f) - count += 1 - logger.debug("Task {} checkpointed".format(task_id)) - - self.checkpointed_tasks += count - - if count == 0: - if self.checkpointed_tasks == 0: - logger.warning("No tasks checkpointed so far in this run. Please ensure caching is enabled") - else: - logger.debug("No tasks checkpointed in this pass.") - else: - logger.info("Done checkpointing {} tasks".format(count)) - - return checkpoint_dir - - def _load_checkpoints(self, checkpointDirs: Sequence[str]) -> Dict[str, Future[Any]]: - """Load a checkpoint file into a lookup table. - - The data being loaded from the pickle file mostly contains input - attributes of the task: func, args, kwargs, env... - To simplify the check of whether the exact task has been completed - in the checkpoint, we hash these input params and use it as the key - for the memoized lookup table. - - Args: - - checkpointDirs (list) : List of paths to checkpoint directories - Eg. ['runinfo/001', 'runinfo/002'] - - Returns: - - memoized_lookup_table (dict) - """ - memo_lookup_table = {} - - for checkpoint_dir in checkpointDirs: - logger.info("Loading checkpoints from {}".format(checkpoint_dir)) - checkpoint_file = os.path.join(checkpoint_dir, 'tasks.pkl') - try: - with open(checkpoint_file, 'rb') as f: - while True: - try: - data = pickle.load(f) - # Copy and hash only the input attributes - memo_fu: Future = Future() - assert data['exception'] is None - memo_fu.set_result(data['result']) - memo_lookup_table[data['hash']] = memo_fu - - except EOFError: - # Done with the checkpoint file - break - except FileNotFoundError: - reason = "Checkpoint file was not found: {}".format( - checkpoint_file) - logger.error(reason) - raise BadCheckpoint(reason) - except Exception: - reason = "Failed to load checkpoint: {}".format( - checkpoint_file) - logger.error(reason) - raise BadCheckpoint(reason) - - logger.info("Completed loading checkpoint: {0} with {1} tasks".format(checkpoint_file, - len(memo_lookup_table.keys()))) - return memo_lookup_table - - @typeguard.typechecked - def load_checkpoints(self, checkpointDirs: Optional[Sequence[str]]) -> Dict[str, Future]: - """Load checkpoints from the checkpoint files into a dictionary. - - The results are used to pre-populate the memoizer's lookup_table - - Kwargs: - - checkpointDirs (list) : List of run folders to use as checkpoints - Eg.
['runinfo/001', 'runinfo/002'] - - Returns: - - dict containing, hashed -> future mappings - """ - self.memo_lookup_table = None - - if checkpointDirs: - return self._load_checkpoints(checkpointDirs) - else: - return {} - - @staticmethod - def _log_std_streams(task_record: TaskRecord) -> None: - if task_record['app_fu'].stdout is not None: - logger.info("Standard output for task {} available at {}".format(task_record['id'], task_record['app_fu'].stdout)) - if task_record['app_fu'].stderr is not None: - logger.info("Standard error for task {} available at {}".format(task_record['id'], task_record['app_fu'].stderr)) - - -class DataFlowKernelLoader: - """Manage which DataFlowKernel is active. - - This is a singleton class containing only class methods. You should not - need to instantiate this class. - """ - - _dfk: Optional[DataFlowKernel] = None - - @classmethod - def clear(cls) -> None: - """Clear the active DataFlowKernel so that a new one can be loaded.""" - cls._dfk = None - - @classmethod - @typeguard.typechecked - def load(cls, config: Optional[Config] = None) -> DataFlowKernel: - """Load a DataFlowKernel. - - Args: - - config (Config) : Configuration to load. This config will be passed to a - new DataFlowKernel instantiation which will be set as the active DataFlowKernel. - Returns: - - DataFlowKernel : The loaded DataFlowKernel object. - """ - if cls._dfk is not None: - raise ConfigurationError('Config has already been loaded') - - if config is None: - cls._dfk = DataFlowKernel(Config()) - else: - cls._dfk = DataFlowKernel(config) - - return cls._dfk - - @classmethod - def wait_for_current_tasks(cls) -> None: - """Waits for all tasks in the task list to be completed, by waiting for their - AppFuture to be completed. This method will not necessarily wait for any tasks - added after cleanup has started such as data stageout. 
- """ - cls.dfk().wait_for_current_tasks() - - @classmethod - def dfk(cls) -> DataFlowKernel: - """Return the currently-loaded DataFlowKernel.""" - if cls._dfk is None: - raise NoDataFlowKernelError('Must first load config') - return cls._dfk From b22efe54c4ef86e831adae1b62919b3a647d7487 Mon Sep 17 00:00:00 2001 From: Serah Nderi Date: Mon, 18 Mar 2024 16:53:28 +0300 Subject: [PATCH 4/6] Fixing files --- parsl/dataflow/dflow.py | 1448 +++++++++++++++++++++++++++++++++++++++ 1 file changed, 1448 insertions(+) create mode 100644 parsl/dataflow/dflow.py diff --git a/parsl/dataflow/dflow.py b/parsl/dataflow/dflow.py new file mode 100644 index 0000000000..f45ac37629 --- /dev/null +++ b/parsl/dataflow/dflow.py @@ -0,0 +1,1448 @@ +from __future__ import annotations +import atexit +import logging +import os +import pathlib +import pickle +import random +import time +import typeguard +import inspect +import threading +import sys +import datetime +from getpass import getuser +from typeguard import typechecked +from typing import Any, Callable, Dict, List, Optional, Sequence, Tuple, Union +from uuid import uuid4 +from socket import gethostname +from concurrent.futures import Future +from functools import partial + +import parsl +from parsl.app.errors import RemoteExceptionWrapper +from parsl.app.futures import DataFuture +from parsl.channels import Channel +from parsl.config import Config +from parsl.data_provider.data_manager import DataManager +from parsl.data_provider.files import File +from parsl.dataflow.errors import BadCheckpoint, DependencyError, JoinError +from parsl.dataflow.futures import AppFuture +from parsl.dataflow.memoization import Memoizer +from parsl.dataflow.rundirs import make_rundir +from parsl.dataflow.states import States, FINAL_STATES, FINAL_FAILURE_STATES +from parsl.dataflow.taskrecord import TaskRecord +from parsl.errors import ConfigurationError, InternalConsistencyError, NoDataFlowKernelError +from parsl.jobs.job_status_poller import JobStatusPoller +from parsl.jobs.states import JobStatus, JobState +from parsl.usage_tracking.usage import UsageTracker +from parsl.executors.base import ParslExecutor +from parsl.executors.status_handling import BlockProviderExecutor +from parsl.executors.threads import ThreadPoolExecutor +from parsl.monitoring import MonitoringHub +from parsl.process_loggers import wrap_with_logs +from parsl.providers.base import ExecutionProvider +from parsl.utils import get_version, get_std_fname_mode, get_all_checkpoints, Timer + +from parsl.monitoring.message_type import MessageType + +logger = logging.getLogger(__name__) + + +class DataFlowKernel: + """The DataFlowKernel adds dependency awareness to an existing executor. + + It is responsible for managing futures, such that when dependencies are resolved, + pending tasks move to the runnable state. + + Here is a simplified diagram of what happens internally:: + + User | DFK | Executor + ---------------------------------------------------------- + | | + Task-------+> +Submit | + App_Fu<------+--| | + | Dependencies met | + | task-------+--> +Submit + | Ex_Fu<------+----| + + """ + + @typechecked + def __init__(self, config: Config) -> None: + """Initialize the DataFlowKernel. + + Parameters + ---------- + config : Config + A specification of all configuration options. For more details see the + :class:~`parsl.config.Config` documentation. 
+ """ + + # this will be used to check cleanup only happens once + self.cleanup_called = False + + self._config = config + self.run_dir = make_rundir(config.run_dir) + + if config.initialize_logging: + parsl.set_file_logger("{}/parsl.log".format(self.run_dir), level=logging.DEBUG) + + logger.info("Starting DataFlowKernel with config\n{}".format(config)) + + logger.info("Parsl version: {}".format(get_version())) + + self.checkpoint_lock = threading.Lock() + + self.usage_tracker = UsageTracker(self) + self.usage_tracker.send_message() + + self.task_state_counts_lock = threading.Lock() + self.task_state_counts = {state: 0 for state in States} + + # Monitoring + self.run_id = str(uuid4()) + + self.monitoring: Optional[MonitoringHub] + self.monitoring = config.monitoring + + # hub address and port for interchange to connect + self.hub_address = None # type: Optional[str] + self.hub_interchange_port = None # type: Optional[int] + if self.monitoring: + if self.monitoring.logdir is None: + self.monitoring.logdir = self.run_dir + self.hub_address = self.monitoring.hub_address + self.hub_interchange_port = self.monitoring.start(self.run_id, self.run_dir, self.config.run_dir) + + self.time_began = datetime.datetime.now() + self.time_completed: Optional[datetime.datetime] = None + + logger.info("Run id is: " + self.run_id) + + self.workflow_name = None + if self.monitoring is not None and self.monitoring.workflow_name is not None: + self.workflow_name = self.monitoring.workflow_name + else: + for frame in inspect.stack(): + logger.debug("Considering candidate for workflow name: {}".format(frame.filename)) + fname = os.path.basename(str(frame.filename)) + parsl_file_names = ['dflow.py', 'typeguard.py', '__init__.py'] + # Find first file name not considered a parsl file + if fname not in parsl_file_names: + self.workflow_name = fname + logger.debug("Using {} as workflow name".format(fname)) + break + else: + logger.debug("Could not choose a name automatically") + self.workflow_name = "unnamed" + + self.workflow_version = str(self.time_began.replace(microsecond=0)) + if self.monitoring is not None and self.monitoring.workflow_version is not None: + self.workflow_version = self.monitoring.workflow_version + + workflow_info = { + 'python_version': "{}.{}.{}".format(sys.version_info.major, + sys.version_info.minor, + sys.version_info.micro), + 'parsl_version': get_version(), + "time_began": self.time_began, + 'time_completed': None, + 'run_id': self.run_id, + 'workflow_name': self.workflow_name, + 'workflow_version': self.workflow_version, + 'rundir': self.run_dir, + 'tasks_completed_count': self.task_state_counts[States.exec_done], + 'tasks_failed_count': self.task_state_counts[States.failed], + 'user': getuser(), + 'host': gethostname(), + } + + if self.monitoring: + self.monitoring.send(MessageType.WORKFLOW_INFO, + workflow_info) + + if config.checkpoint_files is not None: + checkpoints = self.load_checkpoints(config.checkpoint_files) + elif config.checkpoint_files is None and config.checkpoint_mode is not None: + checkpoints = self.load_checkpoints(get_all_checkpoints(self.run_dir)) + else: + checkpoints = {} + + self.memoizer = Memoizer(self, memoize=config.app_cache, checkpoint=checkpoints) + self.checkpointed_tasks = 0 + self._checkpoint_timer = None + self.checkpoint_mode = config.checkpoint_mode + self.checkpointable_tasks: List[TaskRecord] = [] + + # this must be set before executors are added since add_executors calls + # job_status_poller.add_executors. 
+ self.job_status_poller = JobStatusPoller(strategy=self.config.strategy, + max_idletime=self.config.max_idletime, + dfk=self) + + self.executors: Dict[str, ParslExecutor] = {} + + self.data_manager = DataManager(self) + parsl_internal_executor = ThreadPoolExecutor(max_threads=config.internal_tasks_max_threads, label='_parsl_internal') + self.add_executors(config.executors) + self.add_executors([parsl_internal_executor]) + + if self.checkpoint_mode == "periodic": + if config.checkpoint_period is None: + raise ConfigurationError("Checkpoint period must be specified with periodic checkpoint mode") + else: + try: + h, m, s = map(int, config.checkpoint_period.split(':')) + except Exception: + raise ConfigurationError("invalid checkpoint_period provided: {0} expected HH:MM:SS".format(config.checkpoint_period)) + checkpoint_period = (h * 3600) + (m * 60) + s + self._checkpoint_timer = Timer(self.checkpoint, interval=checkpoint_period, name="Checkpoint") + + self.task_count = 0 + self.tasks: Dict[int, TaskRecord] = {} + self.submitter_lock = threading.Lock() + + atexit.register(self.atexit_cleanup) + + def _send_task_log_info(self, task_record: TaskRecord) -> None: + if self.monitoring: + task_log_info = self._create_task_log_info(task_record) + self.monitoring.send(MessageType.TASK_INFO, task_log_info) + + def _create_task_log_info(self, task_record): + """ + Create the dictionary that will be included in the log. + """ + info_to_monitor = ['func_name', 'memoize', 'hashsum', 'fail_count', 'fail_cost', 'status', + 'id', 'time_invoked', 'try_time_launched', 'time_returned', 'try_time_returned', 'executor'] + + task_log_info = {"task_" + k: task_record[k] for k in info_to_monitor} + task_log_info['run_id'] = self.run_id + task_log_info['try_id'] = task_record['try_id'] + task_log_info['timestamp'] = datetime.datetime.now() + task_log_info['task_status_name'] = task_record['status'].name + task_log_info['tasks_failed_count'] = self.task_state_counts[States.failed] + task_log_info['tasks_completed_count'] = self.task_state_counts[States.exec_done] + task_log_info['tasks_memo_completed_count'] = self.task_state_counts[States.memo_done] + task_log_info['from_memo'] = task_record['from_memo'] + task_log_info['task_inputs'] = str(task_record['kwargs'].get('inputs', None)) + task_log_info['task_outputs'] = str(task_record['kwargs'].get('outputs', None)) + task_log_info['task_stdin'] = task_record['kwargs'].get('stdin', None) + stdout_spec = task_record['kwargs'].get('stdout', None) + stderr_spec = task_record['kwargs'].get('stderr', None) + try: + stdout_name, _ = get_std_fname_mode('stdout', stdout_spec) + except Exception as e: + logger.warning("Incorrect stdout format {} for Task {}".format(stdout_spec, task_record['id'])) + stdout_name = str(e) + try: + stderr_name, _ = get_std_fname_mode('stderr', stderr_spec) + except Exception as e: + logger.warning("Incorrect stderr format {} for Task {}".format(stderr_spec, task_record['id'])) + stderr_name = str(e) + task_log_info['task_stdout'] = stdout_name + task_log_info['task_stderr'] = stderr_name + task_log_info['task_fail_history'] = ",".join(task_record['fail_history']) + task_log_info['task_depends'] = None + if task_record['depends'] is not None: + task_log_info['task_depends'] = ",".join([str(t.tid) for t in task_record['depends'] + if isinstance(t, AppFuture) or isinstance(t, DataFuture)]) + task_log_info['task_joins'] = None + + if isinstance(task_record['joins'], list): + task_log_info['task_joins'] = ",".join([str(t.tid) for t in 
task_record['joins'] + if isinstance(t, AppFuture) or isinstance(t, DataFuture)]) + elif isinstance(task_record['joins'], Future): + task_log_info['task_joins'] = ",".join([str(t.tid) for t in [task_record['joins']] + if isinstance(t, AppFuture) or isinstance(t, DataFuture)]) + + return task_log_info + + def _count_deps(self, depends: Sequence[Future]) -> int: + """Count the number of unresolved futures in the list depends. + """ + count = 0 + for dep in depends: + if not dep.done(): + count += 1 + + return count + + @property + def config(self) -> Config: + """Returns the fully initialized config that the DFK is actively using. + + Returns: + - Config object + """ + return self._config + + def handle_exec_update(self, task_record: TaskRecord, future: Future) -> None: + """This function is called only as a callback from an execution + attempt reaching a final state (either successfully or failing). + + It will launch retries if necessary, and update the task + structure. + + Args: + task_record (dict) : Task record + future (Future) : The future object corresponding to the task which + makes this callback + """ + + task_id = task_record['id'] + + task_record['try_time_returned'] = datetime.datetime.now() + + if not future.done(): + raise InternalConsistencyError("done callback called, despite future not reporting itself as done") + + try: + res = self._unwrap_remote_exception_wrapper(future) + + except Exception as e: + logger.info(f"Task {task_id} try {task_record['try_id']} failed with exception of type {type(e).__name__}") + # We keep the history separately, since the future itself could be + # tossed. + task_record['fail_history'].append(repr(e)) + task_record['fail_count'] += 1 + if self._config.retry_handler: + try: + cost = self._config.retry_handler(e, task_record) + except Exception as retry_handler_exception: + logger.exception("retry_handler raised an exception - will not retry") + + # this can be any amount > self._config.retries, to stop any more + # retries from happening + task_record['fail_cost'] = self._config.retries + 1 + + # make the reported exception be the retry handler's exception, + # rather than the execution level exception + e = retry_handler_exception + else: + task_record['fail_cost'] += cost + else: + task_record['fail_cost'] += 1 + + if task_record['status'] == States.dep_fail: + logger.info("Task {} failed due to dependency failure so skipping retries".format(task_id)) + task_record['time_returned'] = datetime.datetime.now() + self._send_task_log_info(task_record) + with task_record['app_fu']._update_lock: + task_record['app_fu'].set_exception(e) + + elif task_record['fail_cost'] <= self._config.retries: + + # record the final state for this try before we mutate for retries + self.update_task_state(task_record, States.fail_retryable) + self._send_task_log_info(task_record) + + task_record['try_id'] += 1 + self.update_task_state(task_record, States.pending) + task_record['try_time_launched'] = None + task_record['try_time_returned'] = None + task_record['fail_history'] = [] + self._send_task_log_info(task_record) + + logger.info("Task {} marked for retry".format(task_id)) + + else: + logger.exception("Task {} failed after {} retry attempts".format(task_id, + task_record['try_id'])) + task_record['time_returned'] = datetime.datetime.now() + self.update_task_state(task_record, States.failed) + task_record['time_returned'] = datetime.datetime.now() + self._send_task_log_info(task_record) + with task_record['app_fu']._update_lock: + 
task_record['app_fu'].set_exception(e) + + else: + if task_record['from_memo']: + self._complete_task(task_record, States.memo_done, res) + self._send_task_log_info(task_record) + else: + if not task_record['join']: + self._complete_task(task_record, States.exec_done, res) + self._send_task_log_info(task_record) + else: + # This is a join task, and the original task's function code has + # completed. That means that the future returned by that code + # will be available inside the executor future, so we can now + # record the inner app ID in monitoring, and add a completion + # listener to that inner future. + + joinable = future.result() + + # Fail with a TypeError if the joinapp python body returned + # something we can't join on. + if isinstance(joinable, Future): + self.update_task_state(task_record, States.joining) + task_record['joins'] = joinable + task_record['join_lock'] = threading.Lock() + self._send_task_log_info(task_record) + joinable.add_done_callback(partial(self.handle_join_update, task_record)) + elif joinable == []: # got a list, but it had no entries, and specifically, no Futures. + self.update_task_state(task_record, States.joining) + task_record['joins'] = joinable + task_record['join_lock'] = threading.Lock() + self._send_task_log_info(task_record) + self.handle_join_update(task_record, None) + elif isinstance(joinable, list) and [j for j in joinable if not isinstance(j, Future)] == []: + self.update_task_state(task_record, States.joining) + task_record['joins'] = joinable + task_record['join_lock'] = threading.Lock() + self._send_task_log_info(task_record) + for inner_future in joinable: + inner_future.add_done_callback(partial(self.handle_join_update, task_record)) + else: + task_record['time_returned'] = datetime.datetime.now() + self.update_task_state(task_record, States.failed) + task_record['time_returned'] = datetime.datetime.now() + self._send_task_log_info(task_record) + with task_record['app_fu']._update_lock: + task_record['app_fu'].set_exception( + TypeError(f"join_app body must return a Future or list of Futures, got {joinable} of type {type(joinable)}")) + + self._log_std_streams(task_record) + + # it might be that in the course of the update, we've gone back to being + # pending - in which case, we should consider ourself for relaunch + if task_record['status'] == States.pending: + self.launch_if_ready(task_record) + + def handle_join_update(self, task_record: TaskRecord, inner_app_future: Optional[AppFuture]) -> None: + with task_record['join_lock']: + # inner_app_future has completed, which is one (potentially of many) + # futures the outer task is joining on. + + # If the outer task is joining on a single future, then + # use the result of the inner_app_future as the final result of + # the outer app future. + + # If the outer task is joining on a list of futures, then + # check if the list is all done, and if so, return a list + # of the results. Otherwise, this callback can do nothing and + # processing will happen in another callback (on the final Future + # to complete) + + # There is no retry handling here: inner apps are responsible for + # their own retrying, and joining state is responsible for passing + # on whatever the result of that retrying was (if any). 
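+ # As an illustration (hypothetical user code, not part of this change): a + # join_app whose body returns [fut_a, fut_b] leaves the outer task in the + # joining state until both inner futures complete; this callback then runs + # once per inner future, and only the invocation that observes all of them + # done assembles the final result list [fut_a.result(), fut_b.result()].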
+ + outer_task_id = task_record['id'] + logger.debug(f"Join callback for task {outer_task_id}, inner_app_future {inner_app_future}") + + if task_record['status'] != States.joining: + logger.debug(f"Join callback for task {outer_task_id} skipping because task is not in joining state") + return + + joinable = task_record['joins'] + + if isinstance(joinable, list): + for future in joinable: + if not future.done(): + logger.debug(f"A joinable future {future} is not done for task {outer_task_id} - skipping callback") + return # abandon this callback processing if joinables are not all done + + # now we know each joinable Future is done + # so now look for any exceptions + exceptions_tids: List[Tuple[BaseException, Optional[str]]] + exceptions_tids = [] + if isinstance(joinable, Future): + je = joinable.exception() + if je is not None: + if hasattr(joinable, 'task_record'): + tid = joinable.task_record['id'] + else: + tid = None + exceptions_tids = [(je, tid)] + elif isinstance(joinable, list): + for future in joinable: + je = future.exception() + if je is not None: + if hasattr(future, 'task_record'): + tid = future.task_record['id'] + else: + tid = None + exceptions_tids.append((je, tid)) + else: + raise TypeError(f"Unknown joinable type {type(joinable)}") + + if exceptions_tids: + logger.debug("Task {} failed due to failure of an inner join future".format(outer_task_id)) + e = JoinError(exceptions_tids, outer_task_id) + # We keep the history separately, since the future itself could be + # tossed. + task_record['fail_history'].append(repr(e)) + task_record['fail_count'] += 1 + # no need to update the fail cost because join apps are never + # retried + + self.update_task_state(task_record, States.failed) + task_record['time_returned'] = datetime.datetime.now() + with task_record['app_fu']._update_lock: + task_record['app_fu'].set_exception(e) + + else: + # all the joinables succeeded, so construct a result: + if isinstance(joinable, Future): + assert inner_app_future is joinable + res = joinable.result() + elif isinstance(joinable, list): + res = [] + for future in joinable: + res.append(future.result()) + else: + raise TypeError(f"Unknown joinable type {type(joinable)}") + self._complete_task(task_record, States.exec_done, res) + + self._log_std_streams(task_record) + + self._send_task_log_info(task_record) + + def handle_app_update(self, task_record: TaskRecord, future: AppFuture) -> None: + """This function is called as a callback when an AppFuture + is in its final state. + + It will trigger post-app processing such as checkpointing. + + Args: + task_record : Task record + future (Future) : The relevant app future (which should be + consistent with the task structure 'app_fu' entry) + + """ + + task_id = task_record['id'] + + if not task_record['app_fu'].done(): + logger.error("Internal consistency error: app_fu is not done for task {}".format(task_id)) + if not task_record['app_fu'] == future: + logger.error("Internal consistency error: callback future is not the app_fu in task structure, for task {}".format(task_id)) + + self.memoizer.update_memo(task_record, future) + + # Cover all checkpointing cases here: + # Do we need to checkpoint now, or queue for later, + # or do nothing?
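+ # In summary, as implemented below: 'task_exit' checkpoints this task + # immediately; 'manual', 'periodic' and 'dfk_exit' queue the record so that + # a later checkpoint() call (user-driven, timer-driven, or at cleanup) + # writes it; None disables checkpointing.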
+ if self.checkpoint_mode == 'task_exit': + self.checkpoint(tasks=[task_record]) + elif self.checkpoint_mode in ('manual', 'periodic', 'dfk_exit'): + with self.checkpoint_lock: + self.checkpointable_tasks.append(task_record) + elif self.checkpoint_mode is None: + pass + else: + raise InternalConsistencyError(f"Invalid checkpoint mode {self.checkpoint_mode}") + + self.wipe_task(task_id) + return + + def _complete_task(self, task_record: TaskRecord, new_state: States, result: Any) -> None: + """Set a task into a completed state + """ + assert new_state in FINAL_STATES + assert new_state not in FINAL_FAILURE_STATES + old_state = task_record['status'] + + self.update_task_state(task_record, new_state) + + logger.info(f"Task {task_record['id']} completed ({old_state.name} -> {new_state.name})") + task_record['time_returned'] = datetime.datetime.now() + + with task_record['app_fu']._update_lock: + task_record['app_fu'].set_result(result) + + def update_task_state(self, task_record: TaskRecord, new_state: States) -> None: + """Update a task record's state, recording an appropriate change + to the task state counters. + """ + + with self.task_state_counts_lock: + if 'status' in task_record: + self.task_state_counts[task_record['status']] -= 1 + self.task_state_counts[new_state] += 1 + task_record['status'] = new_state + + @staticmethod + def _unwrap_remote_exception_wrapper(future: Future) -> Any: + result = future.result() + if isinstance(result, RemoteExceptionWrapper): + result.reraise() + return result + + def wipe_task(self, task_id: int) -> None: + """Remove task with task_id from the internal tasks table + """ + if self.config.garbage_collect: + del self.tasks[task_id] + + @staticmethod + def check_staging_inhibited(kwargs: Dict[str, Any]) -> bool: + return kwargs.get('_parsl_staging_inhibit', False) + + def launch_if_ready(self, task_record: TaskRecord) -> None: + """ + launch_if_ready will launch the specified task, if it is ready + to run (for example, without dependencies, and in pending state). + + This should be called by any piece of the DataFlowKernel that + thinks a task may have become ready to run. + + It is not an error to call launch_if_ready on a task that is not + ready to run - launch_if_ready will not incorrectly launch that + task. + + It is also not an error to call launch_if_ready on a task that has + already been launched - launch_if_ready will not re-launch that + task. + + launch_if_ready is thread safe, so may be called from any thread + or callback. + """ + exec_fu = None + + task_id = task_record['id'] + with task_record['task_launch_lock']: + + if task_record['status'] != States.pending: + logger.debug(f"Task {task_id} is not pending, so launch_if_ready skipping") + return + + if self._count_deps(task_record['depends']) != 0: + logger.debug(f"Task {task_id} has outstanding dependencies, so launch_if_ready skipping") + return + + # We can now launch the task or handle any dependency failures + + new_args, kwargs, exceptions_tids = self._unwrap_futures(task_record['args'], + task_record['kwargs']) + task_record['args'] = new_args + task_record['kwargs'] = kwargs + + if not exceptions_tids: + # There are no dependency errors + try: + exec_fu = self.launch_task(task_record) + assert isinstance(exec_fu, Future) + except Exception as e: + # task launch failed somehow. the execution might + # have been launched and an exception raised after + # that, though. that's hard to detect from here. + # we don't attempt retries here.
This is an error with submission + # even though it might come from user code such as a plugged-in + # executor or memoization hash function. + + logger.debug("Got an exception launching task", exc_info=True) + exec_fu = Future() + exec_fu.set_exception(e) + else: + logger.info( + "Task {} failed due to dependency failure".format(task_id)) + # Raise a dependency exception + self.update_task_state(task_record, States.dep_fail) + + self._send_task_log_info(task_record) + + exec_fu = Future() + exec_fu.set_exception(DependencyError(exceptions_tids, + task_id)) + + if exec_fu: + assert isinstance(exec_fu, Future) + try: + exec_fu.add_done_callback(partial(self.handle_exec_update, task_record)) + except Exception: + # this exception is ignored here because it is assumed that exception + # comes from directly executing handle_exec_update (because exec_fu is + # done already). If the callback executes later, then any exception + # coming out of the callback will be ignored and not propagate anywhere, + # so this block attempts to keep the same behaviour here. + logger.error("add_done_callback got an exception which will be ignored", exc_info=True) + + task_record['exec_fu'] = exec_fu + + def launch_task(self, task_record: TaskRecord) -> Future: + """Handle the actual submission of the task to the executor layer. + + If the app task does not have the executors attribute set (default=='all'), + the task is launched on a randomly selected executor from the + list of executors. This behavior could later be updated to support + binding to executors based on user specified criteria. + + If the app task specifies a particular set of executors, it will be + targeted at those specific executors. + + Args: + task_record : The task record + + Returns: + Future that tracks the execution of the submitted function + """ + task_id = task_record['id'] + function = task_record['func'] + args = task_record['args'] + kwargs = task_record['kwargs'] + + task_record['try_time_launched'] = datetime.datetime.now() + + memo_fu = self.memoizer.check_memo(task_record) + if memo_fu: + logger.info("Reusing cached result for task {}".format(task_id)) + task_record['from_memo'] = True + assert isinstance(memo_fu, Future) + return memo_fu + + task_record['from_memo'] = False + executor_label = task_record["executor"] + try: + executor = self.executors[executor_label] + except Exception: + logger.exception("Task {} requested invalid executor {}: config is\n{}".format(task_id, executor_label, self._config)) + raise ValueError("Task {} requested invalid executor {}".format(task_id, executor_label)) + + try_id = task_record['fail_count'] + + if self.monitoring is not None and self.monitoring.resource_monitoring_enabled: + wrapper_logging_level = logging.DEBUG if self.monitoring.monitoring_debug else logging.INFO + (function, args, kwargs) = self.monitoring.monitor_wrapper(function, args, kwargs, try_id, task_id, + self.monitoring.monitoring_hub_url, + self.run_id, + wrapper_logging_level, + self.monitoring.resource_monitoring_interval, + executor.radio_mode, + executor.monitor_resources(), + self.run_dir) + + with self.submitter_lock: + exec_fu = executor.submit(function, task_record['resource_specification'], *args, **kwargs) + self.update_task_state(task_record, States.launched) + + self._send_task_log_info(task_record) + + if hasattr(exec_fu, "parsl_executor_task_id"): + logger.info(f"Parsl task {task_id} try {try_id} launched on executor {executor.label} with executor id {exec_fu.parsl_executor_task_id}") + else: + logger.info(f"Parsl
task {task_id} try {try_id} launched on executor {executor.label}") + + self._log_std_streams(task_record) + + return exec_fu + + def _add_input_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], func: Callable) -> Tuple[Sequence[Any], Dict[str, Any], + Callable]: + """Look for inputs of the app that are files. Give the data manager + the opportunity to replace a file with a data future for that file, + for example wrapping the result of a staging action. + + Args: + - executor (str) : executor where the app is going to be launched + - args (List) : Positional args to app function + - kwargs (Dict) : Kwargs to app function + """ + + # Return if the task is a data management task, rather than doing + # data management on it. + if self.check_staging_inhibited(kwargs): + logger.debug("Not performing input staging") + return args, kwargs, func + + inputs = kwargs.get('inputs', []) + for idx, f in enumerate(inputs): + (inputs[idx], func) = self.data_manager.optionally_stage_in(f, func, executor) + + for kwarg, f in kwargs.items(): + (kwargs[kwarg], func) = self.data_manager.optionally_stage_in(f, func, executor) + + newargs = list(args) + for idx, f in enumerate(newargs): + (newargs[idx], func) = self.data_manager.optionally_stage_in(f, func, executor) + + return tuple(newargs), kwargs, func + + def _add_output_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], app_fut: AppFuture, func: Callable) -> Callable: + logger.debug("Adding output dependencies") + outputs = kwargs.get('outputs', []) + app_fut._outputs = [] + for idx, f in enumerate(outputs): + if isinstance(f, File) and not self.check_staging_inhibited(kwargs): + # replace a File with a DataFuture - either completing when the stageout + # future completes, or if no stage out future is returned, then when the + # app itself completes. + + # The staging code will get a clean copy which it is allowed to mutate, + # while the DataFuture-contained original will not be modified by any staging. + f_copy = f.cleancopy() + outputs[idx] = f_copy + + logger.debug("Submitting stage out for output file {}".format(repr(f))) + stageout_fut = self.data_manager.stage_out(f_copy, executor, app_fut) + if stageout_fut: + logger.debug("Adding a dependency on stageout future for {}".format(repr(f))) + app_fut._outputs.append(DataFuture(stageout_fut, f, tid=app_fut.tid)) + else: + logger.debug("No stageout dependency for {}".format(repr(f))) + app_fut._outputs.append(DataFuture(app_fut, f, tid=app_fut.tid)) + + # this is a hook for post-task stageout + # note that nothing depends on the output - which is maybe a bug + # in the not-very-tested stageout system? + func = self.data_manager.replace_task_stage_out(f_copy, func, executor) + else: + logger.debug("Not performing output staging for: {}".format(repr(f))) + app_fut._outputs.append(DataFuture(app_fut, f, tid=app_fut.tid)) + return func + + def _gather_all_deps(self, args: Sequence[Any], kwargs: Dict[str, Any]) -> List[Future]: + """Assemble a list of all Futures passed as arguments, kwargs or in the inputs kwarg. 
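+ Note that only top-level arguments are inspected here: a Future nested + inside another data structure (for example inside a list passed as a + positional argument) will not be detected; see the note in _unwrap_futures + about futures hidden a level below.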
+ + Args: + - args: The list of args passed to the app + - kwargs: The dict of all kwargs passed to the app + + Returns: + - list of dependencies + + """ + depends: List[Future] = [] + + def check_dep(d: Any) -> None: + if isinstance(d, Future): + depends.extend([d]) + + # Check the positional args + for dep in args: + check_dep(dep) + + # Check for explicit kwargs ex, fu_1= + for key in kwargs: + dep = kwargs[key] + check_dep(dep) + + # Check for futures in inputs=[...] + for dep in kwargs.get('inputs', []): + check_dep(dep) + + return depends + + def _unwrap_futures(self, args, kwargs): + """This function should be called when all dependencies have completed. + + It will rewrite the arguments for that task, replacing each Future + with the result of that future. + + If the user hid futures a level below, we will not catch + them, and this will (most likely) result in a type error. + + Args: + args (List) : Positional args to app function + kwargs (Dict) : Kwargs to app function + + Return: + a rewritten args list + a rewritten kwargs dict + pairs of exceptions, task ids from any Futures which stored + exceptions rather than results. + """ + dep_failures = [] + + # Replace item in args + new_args = [] + for dep in args: + if isinstance(dep, Future): + try: + new_args.extend([dep.result()]) + except Exception as e: + # If this Future is associated with a task inside this DFK, + # then refer to the task ID. + # Otherwise make a repr of the Future object. + if hasattr(dep, 'task_record') and dep.task_record['dfk'] == self: + tid = "task " + repr(dep.task_record['id']) + else: + tid = repr(dep) + dep_failures.extend([(e, tid)]) + else: + new_args.extend([dep]) + + # Check for explicit kwargs ex, fu_1= + for key in kwargs: + dep = kwargs[key] + if isinstance(dep, Future): + try: + kwargs[key] = dep.result() + except Exception as e: + if hasattr(dep, 'task_record'): + tid = dep.task_record['id'] + else: + tid = None + dep_failures.extend([(e, tid)]) + + # Check for futures in inputs=[...] + if 'inputs' in kwargs: + new_inputs = [] + for dep in kwargs['inputs']: + if isinstance(dep, Future): + try: + new_inputs.extend([dep.result()]) + except Exception as e: + if hasattr(dep, 'task_record'): + tid = dep.task_record['id'] + else: + tid = None + dep_failures.extend([(e, tid)]) + + else: + new_inputs.extend([dep]) + kwargs['inputs'] = new_inputs + + return new_args, kwargs, dep_failures + + def submit(self, + func: Callable, + app_args: Sequence[Any], + executors: Union[str, Sequence[str]], + cache: bool, + ignore_for_cache: Optional[Sequence[str]], + app_kwargs: Dict[str, Any], + join: bool = False) -> AppFuture: + """Add task to the dataflow system. + + If the app task does not have the executors attribute set (default=='all'), + the task will be launched on a randomly selected executor from the + list of executors. If the app task specifies a particular set of + executors, it will be targeted at the specified executors. + + Args: + - func : A function object + + KWargs : + - app_args : Args to the function + - executors (list or string) : List of executors this call could go to. + Default='all' + - cache (Bool) : To enable memoization or not + - ignore_for_cache (sequence) : List of kwargs to be ignored for memoization/checkpointing + - app_kwargs (dict) : Rest of the kwargs to the fn passed as dict.
+ + Returns: + (AppFuture) [DataFutures,] + + """ + + if ignore_for_cache is None: + ignore_for_cache = [] + else: + # duplicate so that it can be modified safely later + ignore_for_cache = list(ignore_for_cache) + + if self.cleanup_called: + raise NoDataFlowKernelError("Cannot submit to a DFK that has been cleaned up") + + task_id = self.task_count + self.task_count += 1 + if isinstance(executors, str) and executors.lower() == 'all': + choices = list(e for e in self.executors if e != '_parsl_internal') + elif isinstance(executors, list): + choices = executors + else: + raise ValueError("Task {} supplied invalid type for executors: {}".format(task_id, type(executors))) + executor = random.choice(choices) + logger.debug("Task {} will be sent to executor {}".format(task_id, executor)) + + # The below uses func.__name__ before it has been wrapped by any staging code. + + label = app_kwargs.get('label') + for kw in ['stdout', 'stderr']: + if kw in app_kwargs: + if app_kwargs[kw] == parsl.AUTO_LOGNAME: + if kw not in ignore_for_cache: + ignore_for_cache += [kw] + app_kwargs[kw] = os.path.join( + self.run_dir, + 'task_logs', + str(int(task_id / 10000)).zfill(4), # limit logs to 10k entries per directory + 'task_{}_{}{}.{}'.format( + str(task_id).zfill(4), + func.__name__, + '' if label is None else '_{}'.format(label), + kw) + ) + + resource_specification = app_kwargs.get('parsl_resource_specification', {}) + + task_record: TaskRecord + task_record = {'depends': [], + 'dfk': self, + 'executor': executor, + 'func_name': func.__name__, + 'memoize': cache, + 'hashsum': None, + 'exec_fu': None, + 'fail_count': 0, + 'fail_cost': 0, + 'fail_history': [], + 'from_memo': None, + 'ignore_for_cache': ignore_for_cache, + 'join': join, + 'joins': None, + 'try_id': 0, + 'id': task_id, + 'task_launch_lock': threading.Lock(), + 'time_invoked': datetime.datetime.now(), + 'time_returned': None, + 'try_time_launched': None, + 'try_time_returned': None, + 'resource_specification': resource_specification} + + self.update_task_state(task_record, States.unsched) + + app_fu = AppFuture(task_record) + + # Transform remote input files to data futures + app_args, app_kwargs, func = self._add_input_deps(executor, app_args, app_kwargs, func) + + func = self._add_output_deps(executor, app_args, app_kwargs, app_fu, func) + + task_record.update({ + 'args': app_args, + 'func': func, + 'kwargs': app_kwargs, + 'app_fu': app_fu}) + + assert task_id not in self.tasks + + self.tasks[task_id] = task_record + + # Get the list of dependencies for the task + depends = self._gather_all_deps(app_args, app_kwargs) + task_record['depends'] = depends + + depend_descs = [] + for d in depends: + if isinstance(d, AppFuture) or isinstance(d, DataFuture): + depend_descs.append("task {}".format(d.tid)) + else: + depend_descs.append(repr(d)) + + if depend_descs != []: + waiting_message = "waiting on {}".format(", ".join(depend_descs)) + else: + waiting_message = "not waiting on any dependency" + + logger.info("Task {} submitted for App {}, {}".format(task_id, + task_record['func_name'], + waiting_message)) + + app_fu.add_done_callback(partial(self.handle_app_update, task_record)) + self.update_task_state(task_record, States.pending) + logger.debug("Task {} set to pending state with AppFuture: {}".format(task_id, task_record['app_fu'])) + + self._send_task_log_info(task_record) + + # at this point add callbacks to all dependencies to do a launch_if_ready + # call whenever a dependency completes. 
+
+        # We need to be careful about the order of setting the state to pending,
+        # adding the callbacks, and calling launch_if_ready explicitly, exactly
+        # once, below.
+
+        # I think as long as we call launch_if_ready once after setting pending, then
+        # we can add the callback dependencies at any point: if the callbacks all fire
+        # before then, they won't cause a launch, but the one below will. If they fire
+        # after we set it pending, then the last one will cause a launch, and the
+        # explicit one won't.
+
+        for d in depends:
+
+            def callback_adapter(dep_fut: Future) -> None:
+                self.launch_if_ready(task_record)
+
+            try:
+                d.add_done_callback(callback_adapter)
+            except Exception as e:
+                logger.error("add_done_callback got an exception {} which will be ignored".format(e))
+
+        self.launch_if_ready(task_record)
+
+        return app_fu
+
+    # it might also be interesting to assert that all DFK
+    # tasks are in a "final" state (3,4,5) when the DFK
+    # is closed down, and report some kind of warning.
+    # although really I'd like this to drain properly...
+    # and a drain function might look like this.
+    # If tasks have their states changed, this won't work properly,
+    # but we can validate that...
+    def log_task_states(self) -> None:
+        logger.info("Summary of tasks in DFK:")
+
+        with self.task_state_counts_lock:
+            for state in States:
+                logger.info("Tasks in state {}: {}".format(str(state), self.task_state_counts[state]))
+
+        logger.info("End of summary")
+
+    def _create_remote_dirs_over_channel(self, provider: ExecutionProvider, channel: Channel) -> None:
+        """Create script directories across a channel.
+
+        Parameters
+        ----------
+        provider: Provider obj
+            Provider for which script dirs are being created
+        channel: Channel obj
+            Channel over which the remote dirs are to be created
+        """
+        run_dir = self.run_dir
+        if channel.script_dir is None:
+
+            # This case will be detected as unreachable by mypy, because of
+            # the type of script_dir, which is str, not Optional[str].
+            # The type system doesn't represent the initialized/uninitialized
+            # state of a channel so cannot represent that a channel needs
+            # its script directory set or not.
+
+            channel.script_dir = os.path.join(run_dir, 'submit_scripts')  # type: ignore[unreachable]
+
+        # Only create dirs if we aren't on a shared-fs
+        if not channel.isdir(run_dir):
+            parent, child = pathlib.Path(run_dir).parts[-2:]
+            remote_run_dir = os.path.join(parent, child)
+            channel.script_dir = os.path.join(remote_run_dir, 'remote_submit_scripts')
+            provider.script_dir = os.path.join(run_dir, 'local_submit_scripts')
+
+        channel.makedirs(channel.script_dir, exist_ok=True)
+
+    def add_executors(self, executors):
+        for executor in executors:
+            executor.run_id = self.run_id
+            executor.run_dir = self.run_dir
+            executor.hub_address = self.hub_address
+            executor.hub_port = self.hub_interchange_port
+            if hasattr(executor, 'provider'):
+                if hasattr(executor.provider, 'script_dir'):
+                    executor.provider.script_dir = os.path.join(self.run_dir, 'submit_scripts')
+                    os.makedirs(executor.provider.script_dir, exist_ok=True)
+
+                if hasattr(executor.provider, 'channels'):
+                    logger.debug("Creating script_dir across multiple channels")
+                    for channel in executor.provider.channels:
+                        self._create_remote_dirs_over_channel(executor.provider, channel)
+                else:
+                    self._create_remote_dirs_over_channel(executor.provider, executor.provider.channel)
+
+            self.executors[executor.label] = executor
+            block_ids = executor.start()
+            if self.monitoring and block_ids:
+                new_status = {}
+                for bid in block_ids:
+                    new_status[bid] = JobStatus(JobState.PENDING)
+                msg = executor.create_monitoring_info(new_status)
+                logger.debug("Sending monitoring message {} to hub from DFK".format(msg))
+                self.monitoring.send(MessageType.BLOCK_INFO, msg)
+        block_executors = [e for e in executors if isinstance(e, BlockProviderExecutor)]
+        self.job_status_poller.add_executors(block_executors)
+
+    def atexit_cleanup(self) -> None:
+        if not self.cleanup_called:
+            logger.info("DFK cleanup because python process is exiting")
+            self.cleanup()
+        else:
+            logger.info("python process is exiting, but DFK has already been cleaned up")
+
+    def wait_for_current_tasks(self) -> None:
+        """Waits for all tasks in the task list to be completed, by waiting for their
+        AppFuture to be completed. This method will not necessarily wait for any tasks
+        added after cleanup has started (such as data stageout).
+        """
+
+        logger.info("Waiting for all remaining tasks to complete")
+
+        # .values is made into a list immediately to reduce (although not
+        # eliminate) a race condition where self.tasks can be modified
+        # elsewhere by a completing task being removed from the dictionary.
+        task_records = list(self.tasks.values())
+        for task_record in task_records:
+            # .exception() waits for completion in the same way as .result(),
+            # but returns the exception rather than raising it.
+            fut = task_record['app_fu']
+            if not fut.done():
+                fut.exception()
+            # Now the app future is done, poll until the DFK task state is final:
+            # a DFK state being final and the app future being done do not imply
+            # each other.
+            while task_record['status'] not in FINAL_STATES:
+                time.sleep(0.1)
+
+        logger.info("All remaining tasks completed")
+
+    @wrap_with_logs
+    def cleanup(self) -> None:
+        """DataFlowKernel cleanup.
+
+        This involves releasing all resources explicitly.
+
+        We call scale_in on each of the executors and call executor.shutdown.
+        """
+        logger.info("DFK cleanup initiated")
+
+        # This check won't detect two DFK cleanups happening from
+        # different threads extremely close in time, because of the
+        # non-atomic read/modify of self.cleanup_called.
+        if self.cleanup_called:
+            raise Exception("attempt to clean up DFK when it has already been cleaned-up")
+        self.cleanup_called = True
+
+        self.log_task_states()
+
+        # Checkpointing takes priority over the rest of the tasks:
+        # checkpoint if any valid checkpoint method is specified.
+        if self.checkpoint_mode is not None:
+            self.checkpoint()
+
+            if self._checkpoint_timer:
+                logger.info("Stopping checkpoint timer")
+                self._checkpoint_timer.close()
+
+        # Send final stats
+        self.usage_tracker.send_message()
+        self.usage_tracker.close()
+
+        logger.info("Closing job status poller")
+        self.job_status_poller.close()
+        logger.info("Terminated job status poller")
+
+        logger.info("Scaling in and shutting down executors")
+
+        for executor in self.executors.values():
+            if isinstance(executor, BlockProviderExecutor):
+                if not executor.bad_state_is_set:
+                    logger.info(f"Scaling in executor {executor.label}")
+                    if executor.provider:
+                        job_ids = executor.provider.resources.keys()
+                        block_ids = executor.scale_in(len(job_ids))
+                        if self.monitoring and block_ids:
+                            new_status = {}
+                            for bid in block_ids:
+                                new_status[bid] = JobStatus(JobState.CANCELLED)
+                            msg = executor.create_monitoring_info(new_status)
+                            logger.debug("Sending message {} to hub from DFK".format(msg))
+                            self.monitoring.send(MessageType.BLOCK_INFO, msg)
+                else:  # and bad_state_is_set
+                    logger.warning(f"Not shutting down executor {executor.label} because it is in bad state")
+            logger.info(f"Shutting down executor {executor.label}")
+            executor.shutdown()
+            logger.info(f"Shut down executor {executor.label}")
+
+        logger.info("Terminated executors")
+        self.time_completed = datetime.datetime.now()
+
+        if self.monitoring:
+            logger.info("Sending final monitoring message")
+            self.monitoring.send(MessageType.WORKFLOW_INFO,
+                                 {'tasks_failed_count': self.task_state_counts[States.failed],
+                                  'tasks_completed_count': self.task_state_counts[States.exec_done],
+                                  "time_began": self.time_began,
+                                  'time_completed': self.time_completed,
+                                  'run_id': self.run_id, 'rundir': self.run_dir,
+                                  'exit_now': True})
+
+            logger.info("Terminating monitoring")
+            self.monitoring.close()
+            logger.info("Terminated monitoring")
+
+        logger.info("DFK cleanup complete")
+
+    def checkpoint(self, tasks: Optional[Sequence[TaskRecord]] = None) -> str:
+        """Checkpoint the dfk incrementally to a checkpoint file.
+
+        When called, every task that has been completed but not yet
+        checkpointed is checkpointed to a file.
+
+        Kwargs:
+            - tasks (List of task records) : List of task records to checkpoint. Default=None;
+              if set to None, we iterate over all tasks held by the DFK.
+
+        .. note::
+            Checkpointing only works if memoization is enabled
+
+        Returns:
+            Checkpoint dir if checkpoints were written successfully.
+            By default the checkpoints are written to the RUNDIR of the current
+            run under RUNDIR/checkpoint/{tasks.pkl, dfk.pkl}
+        """
+        with self.checkpoint_lock:
+            if tasks:
+                checkpoint_queue = tasks
+            else:
+                checkpoint_queue = self.checkpointable_tasks
+                self.checkpointable_tasks = []
+
+            checkpoint_dir = '{0}/checkpoint'.format(self.run_dir)
+            checkpoint_dfk = checkpoint_dir + '/dfk.pkl'
+            checkpoint_tasks = checkpoint_dir + '/tasks.pkl'
+
+            if not os.path.exists(checkpoint_dir):
+                os.makedirs(checkpoint_dir, exist_ok=True)
+
+            with open(checkpoint_dfk, 'wb') as f:
+                state = {'rundir': self.run_dir,
+                         'task_count': self.task_count
+                         }
+                pickle.dump(state, f)
+
+            count = 0
+
+            with open(checkpoint_tasks, 'ab') as f:
+                for task_record in checkpoint_queue:
+                    task_id = task_record['id']
+
+                    app_fu = task_record['app_fu']
+
+                    if app_fu.done() and app_fu.exception() is None:
+                        hashsum = task_record['hashsum']
+                        if not hashsum:
+                            continue
+                        t = {'hash': hashsum, 'exception': None, 'result': app_fu.result()}
+
+                        # We are using pickle here since pickle dumps to a file in 'ab'
+                        # mode behave like an incremental log.
+                        pickle.dump(t, f)
+                        count += 1
+                        logger.debug("Task {} checkpointed".format(task_id))
+
+            self.checkpointed_tasks += count
+
+            if count == 0:
+                if self.checkpointed_tasks == 0:
+                    logger.warning("No tasks checkpointed so far in this run. Please ensure caching is enabled")
+                else:
+                    logger.debug("No tasks checkpointed in this pass.")
+            else:
+                logger.info("Done checkpointing {} tasks".format(count))
+
+            return checkpoint_dir
+
+    def _load_checkpoints(self, checkpointDirs: Sequence[str]) -> Dict[str, Future[Any]]:
+        """Load a checkpoint file into a lookup table.
+
+        The data being loaded from the pickle file mostly contains input
+        attributes of the task: func, args, kwargs, env...
+        To simplify the check of whether the exact task has been completed
+        in the checkpoint, we hash these input params and use the hash as the
+        key for the memoized lookup table.
+
+        Args:
+            - checkpointDirs (list) : List of filepaths to checkpoints
+              Eg. ['runinfo/001', 'runinfo/002']
+
+        Returns:
+            - memoized_lookup_table (dict)
+        """
+        memo_lookup_table = {}
+
+        for checkpoint_dir in checkpointDirs:
+            logger.info("Loading checkpoints from {}".format(checkpoint_dir))
+            checkpoint_file = os.path.join(checkpoint_dir, 'tasks.pkl')
+            try:
+                with open(checkpoint_file, 'rb') as f:
+                    while True:
+                        try:
+                            data = pickle.load(f)
+                            # Copy and hash only the input attributes
+                            memo_fu: Future = Future()
+                            assert data['exception'] is None
+                            memo_fu.set_result(data['result'])
+                            memo_lookup_table[data['hash']] = memo_fu
+
+                        except EOFError:
+                            # Done with the checkpoint file
+                            break
+            except FileNotFoundError:
+                reason = "Checkpoint file was not found: {}".format(
+                    checkpoint_file)
+                logger.error(reason)
+                raise BadCheckpoint(reason)
+            except Exception:
+                reason = "Failed to load checkpoint: {}".format(
+                    checkpoint_file)
+                logger.error(reason)
+                raise BadCheckpoint(reason)
+
+            logger.info("Completed loading checkpoint: {0} with {1} tasks".format(checkpoint_file,
+                                                                                  len(memo_lookup_table.keys())))
+        return memo_lookup_table
+
+    @typeguard.typechecked
+    def load_checkpoints(self, checkpointDirs: Optional[Sequence[str]]) -> Dict[str, Future]:
+        """Load checkpoints from the checkpoint files into a dictionary.
+
+        The results are used to pre-populate the memoizer's lookup_table
+
+        Kwargs:
+            - checkpointDirs (list) : List of run folders to use as checkpoints
+              Eg. ['runinfo/001', 'runinfo/002']
+
+        Returns:
+            - dict containing hash -> Future mappings
+        """
+        self.memo_lookup_table = None
+
+        if checkpointDirs:
+            return self._load_checkpoints(checkpointDirs)
+        else:
+            return {}
+
+    @staticmethod
+    def _log_std_streams(task_record: TaskRecord) -> None:
+        if task_record['app_fu'].stdout is not None:
+            logger.info("Standard output for task {} available at {}".format(task_record['id'], task_record['app_fu'].stdout))
+        if task_record['app_fu'].stderr is not None:
+            logger.info("Standard error for task {} available at {}".format(task_record['id'], task_record['app_fu'].stderr))
+
+
+class DataFlowKernelLoader:
+    """Manage which DataFlowKernel is active.
+
+    This is a singleton class containing only class methods. You should not
+    need to instantiate this class.
+    """
+
+    _dfk: Optional[DataFlowKernel] = None
+
+    @classmethod
+    def clear(cls) -> None:
+        """Clear the active DataFlowKernel so that a new one can be loaded."""
+        cls._dfk = None
+
+    @classmethod
+    @typeguard.typechecked
+    def load(cls, config: Optional[Config] = None) -> DataFlowKernel:
+        """Load a DataFlowKernel.
+
+        Args:
+            - config (Config) : Configuration to load. This config will be passed to a
+              new DataFlowKernel instantiation which will be set as the active DataFlowKernel.
+        Returns:
+            - DataFlowKernel : The loaded DataFlowKernel object.
+        """
+        if cls._dfk is not None:
+            raise ConfigurationError('Config has already been loaded')
+
+        if config is None:
+            cls._dfk = DataFlowKernel(Config())
+        else:
+            cls._dfk = DataFlowKernel(config)
+
+        return cls._dfk
+
+    @classmethod
+    def wait_for_current_tasks(cls) -> None:
+        """Waits for all tasks in the task list to be completed, by waiting for their
+        AppFuture to be completed. This method will not necessarily wait for any tasks
+        added after cleanup has started, such as data stageout.
+        """
+        cls.dfk().wait_for_current_tasks()
+
+    @classmethod
+    def dfk(cls) -> DataFlowKernel:
+        """Return the currently-loaded DataFlowKernel."""
+        if cls._dfk is None:
+            raise NoDataFlowKernelError('Must first load config')
+        return cls._dfk

From ed743e463c9c29a39174ebce890bfaf113eba808 Mon Sep 17 00:00:00 2001
From: Serah Nderi
Date: Tue, 19 Mar 2024 08:56:46 +0300
Subject: [PATCH 5/6] Joining dflow lines

---
 parsl/dataflow/dflow.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/parsl/dataflow/dflow.py b/parsl/dataflow/dflow.py
index f45ac37629..707e2abc23 100644
--- a/parsl/dataflow/dflow.py
+++ b/parsl/dataflow/dflow.py
@@ -730,8 +730,7 @@ def launch_task(self, task_record: TaskRecord) -> Future:
 
         return exec_fu
 
-    def _add_input_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], func: Callable) -> Tuple[Sequence[Any], Dict[str, Any],
-                        Callable]:
+    def _add_input_deps(self, executor: str, args: Sequence[Any], kwargs: Dict[str, Any], func: Callable) -> Tuple[Sequence[Any], Dict[str, Any], Callable]:
         """Look for inputs of the app that are files. Give the data manager
         the opportunity to replace a file with a data future for that file,
         for example wrapping the result of a staging action.
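The dependency scan in _gather_all_deps above is deliberately shallow: only top-level Futures in args, kwargs values, and inputs=[...] are found, which is why the _unwrap_futures docstring warns about futures hidden a level below. A minimal standalone sketch of that behaviour (not Parsl API; the names here are illustrative):

    from concurrent.futures import Future
    from typing import Any, Dict, List, Sequence

    def gather_futures(args: Sequence[Any], kwargs: Dict[str, Any]) -> List[Future]:
        """Collect every top-level Future in args, kwargs and kwargs['inputs']."""
        found: List[Future] = []

        def check(candidate: Any) -> None:
            if isinstance(candidate, Future):
                found.append(candidate)

        for a in args:
            check(a)
        for v in kwargs.values():
            check(v)
        for i in kwargs.get('inputs', []):
            check(i)
        return found

    f: Future = Future()
    assert gather_futures([f], {'x': 1}) == [f]
    # A Future nested one level deeper (inside a list) is deliberately missed,
    # matching the caveat in the _unwrap_futures docstring:
    assert gather_futures([[f]], {}) == []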
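The AUTO_LOGNAME branch in submit() shards task logs into zero-padded subdirectories so that no single directory accumulates more than 10,000 tasks' worth of files. A small sketch of the same path scheme (the run_dir value and function names below are illustrative, not fixed by Parsl):

    import os

    def task_log_path(run_dir: str, task_id: int, func_name: str, kw: str, label=None) -> str:
        # tasks 0-9999 land in 0000/, tasks 10000-19999 in 0001/, and so on
        shard = str(task_id // 10000).zfill(4)
        suffix = '' if label is None else '_{}'.format(label)
        return os.path.join(run_dir, 'task_logs', shard,
                            'task_{}_{}{}.{}'.format(str(task_id).zfill(4), func_name, suffix, kw))

    print(task_log_path('runinfo/000', 12345, 'bar', 'stdout'))
    # runinfo/000/task_logs/0001/task_12345_bar.stdout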
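The launch-ordering comment in submit() describes a guard against a lost wakeup: call launch_if_ready once explicitly after the task is set pending, and the dependency callbacks may then be added at any time. A minimal sketch of the pattern, assuming an idempotent launch_if_ready guarded by a simple flag (the real code serializes this with task_launch_lock instead):

    from concurrent.futures import Future

    def launch_if_ready(task):
        # Idempotent by flag: launches at most once, only when all deps are done.
        if task['launched']:
            return
        if all(d.done() for d in task['depends']):
            task['launched'] = True
            print("launching task", task['id'])

    early, late = Future(), Future()
    early.set_result(1)                       # completed before any callback exists
    task = {'id': 0, 'depends': [early, late], 'launched': False}

    # The order used above: mark pending, add callbacks, then call once explicitly.
    for dep in task['depends']:
        dep.add_done_callback(lambda _f: launch_if_ready(task))
    launch_if_ready(task)                     # covers deps that completed before the callbacks existed

    late.set_result(2)                        # the late completion triggers the launch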
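wait_for_current_tasks() waits via .exception() rather than .result() so that a failed task does not abort the wait loop. In sketch form:

    from concurrent.futures import Future

    fut = Future()
    fut.set_exception(ValueError("task failed"))

    # .exception() blocks until the future is done, like .result(), but it
    # returns the stored exception instead of re-raising it:
    exc = fut.exception()
    print(type(exc).__name__, exc)   # ValueError task failed
    # fut.result()                   # would raise ValueError here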
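checkpoint() and _load_checkpoints() rely on repeated pickle.dump calls to a file opened in 'ab' mode forming an append-only log, replayed with pickle.load until EOFError. A self-contained sketch of that round trip (the path here is a temporary file, not Parsl's RUNDIR layout):

    import os
    import pickle
    import tempfile

    # Writing: each dump appends one self-contained record, so the file
    # behaves like an incremental log that survives partial runs.
    path = os.path.join(tempfile.mkdtemp(), 'tasks.pkl')
    with open(path, 'ab') as f:
        pickle.dump({'hash': 'aaa', 'exception': None, 'result': 3}, f)
    with open(path, 'ab') as f:                 # a later checkpoint pass appends
        pickle.dump({'hash': 'bbb', 'exception': None, 'result': 7}, f)

    # Reading: replay the log record by record until EOFError marks the end.
    records = []
    with open(path, 'rb') as f:
        while True:
            try:
                records.append(pickle.load(f))
            except EOFError:
                break

    assert [r['hash'] for r in records] == ['aaa', 'bbb']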
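A minimal usage sketch of the DataFlowKernelLoader lifecycle defined above; note that load() with a default Config constructs a real kernel and starts its executors, so this calls cleanup() before clear():

    from parsl.config import Config
    from parsl.dataflow.dflow import DataFlowKernelLoader

    dfk = DataFlowKernelLoader.load(Config())   # builds and activates a kernel
    assert DataFlowKernelLoader.dfk() is dfk    # class methods return the singleton

    try:
        DataFlowKernelLoader.load(Config())     # a second load without clear() fails
    except Exception as err:
        print(err)                              # 'Config has already been loaded'

    dfk.cleanup()                               # release executors before reloading
    DataFlowKernelLoader.clear()                # now load() may be called again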
From 92b99ca67517ec3af8a45f056634c1cb49c6c79e Mon Sep 17 00:00:00 2001 From: Serah Nderi Date: Tue, 19 Mar 2024 09:05:34 +0300 Subject: [PATCH 6/6] Fixing memoization test file --- parsl/tests/test_python_apps/test_memoize_3.py | 3 --- 1 file changed, 3 deletions(-) diff --git a/parsl/tests/test_python_apps/test_memoize_3.py b/parsl/tests/test_python_apps/test_memoize_3.py index 4047189853..ad43f0eaa1 100644 --- a/parsl/tests/test_python_apps/test_memoize_3.py +++ b/parsl/tests/test_python_apps/test_memoize_3.py @@ -27,6 +27,3 @@ def bar(): # Sort the dictionary, it should raise a TypeError with pytest.raises(TypeError): sorted(d) - - # Create a dictionary with enum keys - d_enum = {Foo.x: 1, Foo.y: 2}
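The test change above ties back to the subject of this series: sorting a dict iterates over its keys, and Python 3 refuses to order values of unrelated types, so the memoizer must normalize keys before sorting rather than after. A short illustration (repr() below stands in for whatever serialization the memoizer actually applies; it is not Parsl's implementation):

    from enum import Enum

    class Foo(Enum):
        x = 1
        y = 2

    d = {Foo.x: 1, 'a': 2}      # heterogeneous keys, as in the test above

    try:
        sorted(d)               # compares Foo.x against 'a': unorderable in Python 3
    except TypeError as err:
        print(err)              # '<' not supported between instances of ...

    # Normalizing keys to a common form *before* sorting avoids the error:
    print(sorted(d, key=repr))  # ['a', Foo.x] -- ordered by their repr strings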