print step keys in nice format (#70)

wanghan-iapcm · Han Wang · web-flow · commit 0a27bf8b1117 · 2022-09-10T21:22:06.000+08:00
Co-authored-by: Han Wang <wang_han@iapcm.ac.cn>
diff --git a/dpgen2/entrypoint/submit.py b/dpgen2/entrypoint/submit.py
@@ -367,9 +367,8 @@ def workflow_concurrent_learning(
     return dpgen_step
 
 
-def submit_concurrent_learning(
+def wf_global_workflow(
         wf_config,
-        reuse_step = None,
 ):
     dflow_config_data = wf_config.get('dflow_config', None)
     dflow_config(dflow_config_data)
@@ -384,9 +383,18 @@ def submit_concurrent_learning(
     else :
         lebesgue_context = None
 
+    return lebesgue_context
+
+
+def submit_concurrent_learning(
+        wf_config,
+        reuse_step = None,
+):
+    context = wf_global_workflow(wf_config)
+    
     dpgen_step = workflow_concurrent_learning(wf_config)
 
-    wf = Workflow(name="dpgen", context=lebesgue_context)
+    wf = Workflow(name="dpgen", context=context)
     wf.add(dpgen_step)
 
     wf.submit(reuse_step=reuse_step)
@@ -441,20 +449,16 @@ def resubmit_concurrent_learning(
         list_steps = False,
         reuse = None,
 ):
-    # set global config
-    from dflow import config, s3_config
-    dflow_config = wf_config.get('dflow_config', None)
-    if dflow_config :
-        config["host"] = dflow_config.get('host', None)
-        s3_config["endpoint"] = dflow_config.get('s3_endpoint', None)
-        config["k8s_api_server"] = dflow_config.get('k8s_api_server', None)
-        config["token"] = dflow_config.get('token', None)    
+    context = wf_global_workflow(wf_config)
 
     old_wf = Workflow(id=wfid)
 
     all_step_keys = successful_step_keys(old_wf)
+    all_step_keys = sort_slice_ops(
+        all_step_keys, ['run-train', 'run-lmp', 'run-fp'],)
     if list_steps:
-        prt_str = print_list_steps(all_step_keys)
+        prt_str = print_keys_in_nice_format(
+            all_step_keys, ['run-train', 'run-lmp', 'run-fp'],)
         print(prt_str)
 
     if reuse is None:
@@ -465,6 +469,10 @@ def resubmit_concurrent_learning(
     for ii in reuse_idx:
         reuse_step += old_wf_info.get_step(key=all_step_keys[ii])
 
-    wf = submit_concurrent_learning(wf_config, reuse_step=reuse_step)
+    wf = submit_concurrent_learning(
+        wf_config, 
+        context=context,
+        reuse_step=reuse_step,
+    )
 
     return wf
diff --git a/dpgen2/utils/dflow_query.py b/dpgen2/utils/dflow_query.py
@@ -0,0 +1,124 @@
+import numpy as np
+import re
+from typing import (
+    List, Optional, Any,
+)
+
+def get_subkey(
+        key : str,
+        idx : Optional[int] = -1,
+):
+    """
+    split a step key on '--' and return the field at position idx (by default the last one).
+    """
+    fields = key.split('--')
+    return fields[idx]
+
+def get_last_scheduler(
+        wf : Any,
+        keys : List[str],
+):
+    """
+    return the 'exploration_scheduler' output parameter of the scheduler step
+    whose key sorts last among `keys`, or None if no key ends with the
+    'scheduler' subkey.
+    """
+    candidates = [kk for kk in keys if get_subkey(kk) == 'scheduler']
+    if not candidates:
+        return None
+    # the lexicographically largest scheduler key is taken as the last one
+    last_key = max(candidates)
+    last_step = wf.query_step(key=last_key)
+    return last_step.outputs.parameters['exploration_scheduler'].value
+
+        
+def get_last_iteration(
+        keys : List[str],
+):
+    """
+    get the index of the last iteration from a list of step keys.
+    """
+    leading = [get_subkey(kk, 0) for kk in keys]
+    leading.sort()
+    # the lexicographically largest leading subkey is expected to look like
+    # 'iter-<number>'; the number after the first '-' is the iteration index
+    last = leading[-1]
+    return int(last.split('-')[1])
+
+
+def find_slice_ranges(
+        keys : List[str],
+        sliced_subkey : str,
+):
+    """
+    find range of sliced OPs that matches the pattern 'iter-[0-9]*--{sliced_subkey}-[0-9]*'
+
+    Parameters
+    ----------
+    keys : List[str]
+        step keys, scanned in the given order.
+    sliced_subkey : str
+        subkey of the sliced OP, e.g. 'run-lmp'. It is inserted into the
+        regular expression as is (it is not escaped).
+
+    Returns
+    -------
+    found_range : List[List[int]]
+        one [begin, end] pair per run of consecutive matching keys, where
+        begin is the index of the first matching key and end is the index
+        right after the last matching key (exclusive). A run that reaches
+        the end of `keys` is closed with end = len(keys).
+    """
+    # the pattern does not change while scanning, so compile it once
+    pattern = re.compile(f'iter-[0-9]*--{sliced_subkey}-[0-9]*')
+    found_range = []
+    begin = None
+    for idx, ii in enumerate(keys):
+        matched = pattern.match(ii) is not None
+        if matched and begin is None:
+            # first key of a new run
+            begin = idx
+        elif not matched and begin is not None:
+            # first key after the run, used as the exclusive end
+            found_range.append([begin, idx])
+            begin = None
+    if begin is not None:
+        # the run extends to the last key: close it here, otherwise the
+        # trailing range would be silently dropped
+        found_range.append([begin, len(keys)])
+    return found_range
+
+
+def _sort_slice_ops(keys, sliced_subkey):
+    """
+    sort, in place, every range of `keys` reported by find_slice_ranges for
+    `sliced_subkey`, and return the same list object.
+    """
+    for begin, end in find_slice_ranges(keys, sliced_subkey):
+        chunk = keys[begin:end]
+        chunk.sort()
+        keys[begin:end] = chunk
+    return keys
+
+
+def sort_slice_ops(
+        keys : List[str],
+        sliced_subkey : List[str],
+):
+    """
+    sort the keys of the sliced ops, one subkey after the other. the keys of
+    the sliced ops contain one of the entries of sliced_subkey. a single
+    subkey given as a str is accepted as well.
+    """
+    subkeys = [sliced_subkey] if isinstance(sliced_subkey, str) else sliced_subkey
+    result = keys
+    for subkey in subkeys:
+        result = _sort_slice_ops(result, subkey)
+    return result
+
+
+def print_keys_in_nice_format(
+        keys : List[str],
+        sliced_subkey : List[str],
+        idx_fmt_len : int = 8,
+):
+    """
+    format the step keys as one line per key, collapsing every run of sliced
+    ops into a single 'first -> last' line.
+
+    Parameters
+    ----------
+    keys : List[str]
+        step keys. They are passed through sort_slice_ops before printing.
+    sliced_subkey : List[str]
+        subkeys of the sliced ops. A single subkey given as a str is
+        accepted as well, as in sort_slice_ops.
+    idx_fmt_len : int
+        the index column is idx_fmt_len*2+4 characters wide.
+
+    Returns
+    -------
+    str
+        the formatted lines joined by newlines, with a trailing newline.
+    """
+    if isinstance(sliced_subkey, str):
+        # without this a plain str would be iterated character by character
+        sliced_subkey = [sliced_subkey]
+    keys = sort_slice_ops(keys, sliced_subkey)
+
+    # index of the first key of a sliced range -> index of its last key
+    range_last = {}
+    for subkey in sliced_subkey:
+        for begin, end in find_slice_ranges(keys, subkey):
+            # keep the first range found for a given begin index
+            range_last.setdefault(begin, end - 1)
+
+    width = idx_fmt_len * 2 + 4
+    normal_fmt = f'%{width}d : %s'
+    range_fmt = f'%{width}s : %s -> %s'
+
+    ret = []
+    idx = 0
+    while idx < len(keys):
+        if idx in range_last:
+            last = range_last[idx]
+            range_str = '%d -> %d' % (idx, last)
+            ret.append(range_fmt % (range_str, keys[idx], keys[last]))
+            # continue with the first key after the collapsed range
+            idx = last + 1
+        else:
+            ret.append(normal_fmt % (idx, keys[idx]))
+            idx += 1
+    return '\n'.join(ret + [''])
+
+
diff --git a/tests/utils/test_dflow_query.py b/tests/utils/test_dflow_query.py
@@ -0,0 +1,186 @@
+import os, textwrap
+import numpy as np
+import unittest
+
+from typing import Set, List
+from pathlib import Path
+try:
+    from exploration.context import dpgen2
+except ModuleNotFoundError:
+    # case of upload everything to argo, no context needed
+    pass
+from dflow.python import (
+    FatalError,
+)
+from dpgen2.exploration.scheduler import (
+    ConvergenceCheckStageScheduler,
+    ExplorationScheduler,
+)
+from dpgen2.exploration.report import ExplorationReport
+from dpgen2.exploration.task import ExplorationTaskGroup, ExplorationStage
+from dpgen2.exploration.selector import TrustLevel, ConfSelectorLammpsFrames
+from mocked_ops import (
+    MockedExplorationReport,
+    MockedExplorationTaskGroup,
+    MockedExplorationTaskGroup1,
+    MockedStage,
+    MockedStage1,
+)
+from dpgen2.utils.dflow_query import (
+    get_last_scheduler,
+    get_subkey,
+    get_last_iteration,
+    find_slice_ranges,
+    sort_slice_ops,
+    print_keys_in_nice_format,
+)
+
+# step keys of two iterations used as input by the tests below; several runs
+# of sliced ops (run-train, run-lmp, run-fp) are listed out of order
+dpgen_keys = [
+    'init--scheduler',
+    'init--id',
+    'iter-000000--prep-train',
+    'iter-000000--run-train-0002',
+    'iter-000000--run-train-0000',
+    'iter-000000--run-train-0001',
+    'iter-000000--prep-run-train',
+    'iter-000000--prep-lmp',
+    'iter-000000--run-lmp-000001',
+    'iter-000000--run-lmp-000004',
+    'iter-000000--run-lmp-000005',
+    'iter-000000--run-lmp-000002',
+    'iter-000000--run-lmp-000003',
+    'iter-000000--run-lmp-000000',
+    'iter-000000--prep-run-lmp',
+    'iter-000000--select-confs',
+    'iter-000000--prep-fp',
+    'iter-000000--run-fp-000001',
+    'iter-000000--run-fp-000000',
+    'iter-000000--prep-run-fp',
+    'iter-000000--collect-data',
+    'iter-000000--block',
+    'iter-000000--scheduler',
+    'iter-000000--id',
+    'iter-000001--prep-train',
+    'iter-000001--run-train-0000',
+    'iter-000001--run-train-0001',
+    'iter-000001--run-train-0002',
+    'iter-000001--prep-run-train',
+    'iter-000001--prep-lmp',
+    'iter-000001--run-lmp-000003',
+    'iter-000001--run-lmp-000000',
+    'iter-000001--run-lmp-000001',
+    'iter-000001--run-lmp-000005',
+    'iter-000001--run-lmp-000002',
+    'iter-000001--run-lmp-000004',
+    'iter-000001--prep-run-lmp',
+    'iter-000001--select-confs',
+    'iter-000001--prep-fp',
+    'iter-000001--run-fp-000001',
+    'iter-000001--run-fp-000000',
+    'iter-000001--prep-run-fp',
+    'iter-000001--collect-data',
+    'iter-000001--block',
+    'iter-000001--scheduler',
+    'iter-000001--id',
+    'iter-000000--loop',
+]
+
+class MockedTar:
+    """stand-in for an output parameter: only carries a `value`."""
+    value = 10
+
+class MockedFoo:
+    """stand-in for the outputs of a step: exposes the 'exploration_scheduler' parameter."""
+    parameters = dict(
+        exploration_scheduler = MockedTar(),
+    )
+
+class MockedBar:
+    """stand-in for a queried step: only carries `outputs`."""
+    # the class object itself (not an instance) is exposed as the outputs
+    outputs = MockedFoo
+
+class MockedWF:
+    """stand-in for a workflow: query_step only accepts the key 'iter1--scheduler'."""
+    def query_step(self, key=None):
+        expected_key = 'iter1--scheduler'
+        assert key == expected_key
+        return MockedBar()
+
+class TestDflowQuery(unittest.TestCase):
+    """unit tests of the helpers in dpgen2.utils.dflow_query."""
+
+    def test_get_subkey(self):
+        """get_subkey splits on '--' and returns the requested field (last by default)."""
+        self.assertEqual(get_subkey('aa--bb--cc', 0),  'aa')
+        self.assertEqual(get_subkey('aa--bb--cc', 1),  'bb')
+        self.assertEqual(get_subkey('aa--bb--cc', 2),  'cc')
+        self.assertEqual(get_subkey('aa--bb--cc'),  'cc')
+        self.assertEqual(get_subkey('aa'),  'aa')
+        self.assertEqual(get_subkey('aa---bb'),  '-bb')
+        self.assertEqual(get_subkey('aa----bb', 1),  '')
+        self.assertEqual(get_subkey(''),  '')
+
+    def test_get_last_scheduler(self):
+        """the scheduler key that sorts last ('iter1--scheduler') is the one queried."""
+        value = get_last_scheduler(
+            MockedWF(),
+            ['iter1--scheduler', 'foo', 'bar', 'iter0--scheduler'],
+        )
+        self.assertEqual(value, 10)
+
+    def test_get_last_iteration(self):
+        """dpgen_keys contains iterations 0 and 1, so the last one is 1."""
+        last = get_last_iteration(dpgen_keys)
+        self.assertEqual(last, 1)
+
+    # this method used to be named test_sort_slice_ops as well; the later
+    # definition with the same name replaced it in the class, so it never ran
+    def test_find_slice_ranges(self):
+        """the run-lmp keys occupy the index ranges [8, 14) and [30, 36) of dpgen_keys."""
+        idxes = find_slice_ranges(dpgen_keys, 'run-lmp')
+        self.assertEqual(idxes, [[8, 14], [30, 36]])
+
+    def test_sort_slice_ops(self):
+        """every run of sliced ops is sorted, all other keys keep their position."""
+        expected_output = [
+            'init--scheduler',
+            'init--id',
+            'iter-000000--prep-train',
+            'iter-000000--run-train-0000',
+            'iter-000000--run-train-0001',
+            'iter-000000--run-train-0002',
+            'iter-000000--prep-run-train',
+            'iter-000000--prep-lmp',
+            'iter-000000--run-lmp-000000',
+            'iter-000000--run-lmp-000001',
+            'iter-000000--run-lmp-000002',
+            'iter-000000--run-lmp-000003',
+            'iter-000000--run-lmp-000004',
+            'iter-000000--run-lmp-000005',
+            'iter-000000--prep-run-lmp',
+            'iter-000000--select-confs',
+            'iter-000000--prep-fp',
+            'iter-000000--run-fp-000000',
+            'iter-000000--run-fp-000001',
+            'iter-000000--prep-run-fp',
+            'iter-000000--collect-data',
+            'iter-000000--block',
+            'iter-000000--scheduler',
+            'iter-000000--id',
+            'iter-000001--prep-train',
+            'iter-000001--run-train-0000',
+            'iter-000001--run-train-0001',
+            'iter-000001--run-train-0002',
+            'iter-000001--prep-run-train',
+        ]
+        ncheck = len(expected_output)
+        # a slice is passed so that the module-level dpgen_keys is not modified
+        self.assertEqual(
+            sort_slice_ops(dpgen_keys[:ncheck], ['run-train', 'run-lmp', 'run-fp']),
+            expected_output,
+        )
+
+    def test_print_keys(self):
+        """a run of sliced ops is collapsed into one 'first -> last' line."""
+        expected_output = [
+            '                   0 : init--scheduler',
+            '                   1 : init--id',
+            '                   2 : iter-000000--prep-train',
+            '              3 -> 5 : iter-000000--run-train-0000 -> iter-000000--run-train-0002',
+            '                   6 : iter-000000--prep-run-train',
+        ]
+        expected_output = '\n'.join(expected_output + [''])
+
+        ret = print_keys_in_nice_format(
+            dpgen_keys[:7],
+            ['run-train', 'run-lmp', 'run-fp'],
+            idx_fmt_len = 8,
+        )
+
+        self.assertEqual(expected_output, ret)
+
+