graph.py 17.7 KB
Newer Older
1
import collections
2 3 4
import os
from enum import Enum, auto
from functools import partial
5
import importlib as imp
6

7
import comsdk.aux as aux
8 9 10

# Record describing one branch of an implicitly parallelized part of the graph:
#   array_keys_mapping -- the keys mapping of the state that started the branches
#   branches_number    -- how many branches were created in total
#   branch_i           -- index of the branch this record belongs to
ImplicitParallelizationInfo = collections.namedtuple('ImplicitParallelizationInfo', ['array_keys_mapping', 'branches_number', 'branch_i'])

11 12 13 14 15 16
class Func():
    """Wrapper around a callable identified by a module name and an attribute name.

    The callable is stored in ``func`` and is resolved in this order:

    1. ``func`` passed explicitly to the constructor;
    2. an identity function (``data -> data``) when ``dummy`` is requested or
       when ``module`` or ``name`` is an empty string;
    3. the attribute ``name`` of the imported module ``module``.
    """
    __slots__ = (
        'module',
        'func',
        'name',
    )

    def __init__(self, module="", name="", dummy=False, func=None):
        self.module = module
        self.name = name
        # Nothing can be imported unless both the module and the name are given.
        use_identity = dummy or module == "" or name == ""
        if func is not None:
            self.func = func
            return
        if use_identity:
            self.func = lambda data: data
            return
        print(module, name, "loading")
        loaded_module = imp.import_module(module)
        self.func = getattr(loaded_module, name)

    def __str__(self):
        """Return the textual form ``<module>.<name>()``."""
        return "{}.{}()".format(self.module, self.name)

class Selector(Func):
    """Func that receives the list of predicate values of a state's transfers.

    ``ntransf`` is the number of transfers the selector is built for.  When
    neither ``module`` nor ``name`` is given (or ``dummy`` is set) the selector
    returns ``True`` for each of the ``ntransf`` transfers regardless of its
    argument.
    """
    # A single string declares a single slot.
    __slots__ = 'ntransf'

    def __init__(self, ntransf, module="", name="", dummy=False):
        self.ntransf = ntransf
        select_everything = dummy or (module == "" and name == "")

        def _all_true(x):
            return [True for _ in range(ntransf)]

        chosen = _all_true if select_everything else None
        super().__init__(module, name, func=chosen)
42 43


44
class Transfer:
    """Outgoing connection of a state: an edge together with the state it leads to.

    Attributes:
        edge: object providing ``morph(data, dynamic_keys_mapping)``.
        output_state: state returned by :meth:`transfer` after the edge is applied.
        order: value stored as given by the caller (defaults to 0).
    """

    def __init__(self, edge, output_state, order=0):
        self.edge = edge
        self.output_state = output_state
        self.order = order

    def transfer(self, data, dynamic_keys_mapping=None):
        """Apply the edge to ``data`` and return the output state.

        Args:
            data: data object handed to ``edge.morph``.
            dynamic_keys_mapping: optional mapping handed to ``edge.morph``;
                a fresh empty dict is used when omitted.

        Returns:
            ``self.output_state``.
        """
        # A new dict per call: a shared default would carry over any changes
        # made to it by ``edge.morph`` into later calls.
        if dynamic_keys_mapping is None:
            dynamic_keys_mapping = {}
        self.edge.morph(data, dynamic_keys_mapping)
        return self.output_state

class IdleRunType(Enum):
    """Kind of idle (non-executing) pass made over the graph by ``State.idle_run``."""

    # Used by Graph.init_graph on the first initialization of a graph.
    INIT = auto()
    # Used by Graph.init_graph on every later initialization.
    CLEANUP = auto()

class PluralState:
    """Group of states that is connected to another group of states pairwise."""

    def __init__(self, states):
        self.states = states

    def connect_to(self, term_states, edge):
        """Connect the i-th state of this group to the i-th of ``term_states``.

        Every connection uses the same ``edge``.  Pairing is done with ``zip``,
        so surplus states in the longer sequence are left unconnected.
        """
        for source, target in zip(self.states, term_states):
            link = Transfer(edge, target)
            source.transfers.append(link)
68 69

class Graph:
    '''
    Class describing a graph-based computational method. Graph execution must start from this object.

    init_state is the state the traversal starts from; term_state, if given,
    is flagged as terminal (its ``is_term_state`` attribute is set to True).
    '''
    def __init__(self, init_state,
                 term_state=None,
                 ):
        self.init_state = init_state
        self.term_state = term_state
        if self.term_state is not None:
            self.term_state.is_term_state = True
        self._initialized = False

    def run(self, data):
        '''
        Goes through the graph and returns boolean denoting whether the graph has finished successfully.
        Before the traversal, init_graph makes an idle run over the graph (initialization on the first
        call, cleanup on every later call).
        The input data will be augmented by metadata:
        1) '__CURRENT_WORKING_DIR__' -- absolute path to the current working directory as defined by the OS
        2) '__WORKING_DIR__' -- absolute path to the directory from which external binaries or resources will be launched.
        It will be set only if it is not yet set in data
        3) '__EXCEPTION__' if any error occurs

        Returns False as soon as '__EXCEPTION__' appears in data, True once the traversal yields no next state.
        '''
        self.init_graph(data)
        cur_state = self.init_state
        implicit_parallelization_info = None
        while cur_state is not None:
            transfer_f, implicit_parallelization_info = _run_state(cur_state, data, implicit_parallelization_info)
            if '__EXCEPTION__' in data:
                return False
            # NOTE(review): a state that is still waiting for incoming edges yields
            # transfer_f == None without setting '__EXCEPTION__'; the call below
            # would then fail with TypeError -- confirm this cannot happen here.
            cur_state = transfer_f(data)
            if '__EXCEPTION__' in data:
                return False
        return True

    def init_graph(self, data=None):
        '''
        Makes an idle run over the graph (INIT on the first call, CLEANUP afterwards) and
        stores the working-directory metadata in data.

        data defaults to a fresh dictionary on every call, so metadata written during
        one call is never carried over to another.
        '''
        if data is None:
            data = {}
        if not self._initialized:
            self.init_state.idle_run(IdleRunType.INIT, [self.init_state.name])
            self._initialized = True
        else:
            self.init_state.idle_run(IdleRunType.CLEANUP, [self.init_state.name])
        data['__CURRENT_WORKING_DIR__'] = os.getcwd()
        if '__WORKING_DIR__' not in data:
            data['__WORKING_DIR__'] = data['__CURRENT_WORKING_DIR__']
118 119 120 121

class State:
    """Node of the graph: holds outgoing transfers and input-edge bookkeeping.

    ``input_edges_number`` and ``looped_edges_number`` are filled in by
    ``idle_run`` with ``IdleRunType.INIT``.  ``run`` compares them with
    ``activated_input_edges_number`` to decide whether the state may pass
    control further.  Under implicit parallelization (non-terminal states only)
    ``activated_input_edges_number`` is turned into a list with one counter
    per branch.
    """
    __slots__ = [
        'name',
        'input_edges_number',  # output_edges_number == len(transfers)
        'looped_edges_number',
        'activated_input_edges_number',
        'transfers',
        'parallelization_policy',
        'selector',
        'is_term_state',
        'array_keys_mapping',
        '_branching_states_history',
        '_proxy_state',
    ]

    def __init__(self, name,
                 parallelization_policy=None,
                 selector=None,
                 array_keys_mapping=None,  # if array_keys_mapping is not None, we have implicit parallelization in this state
                 ):
        self.name = name
        if parallelization_policy is None:
            parallelization_policy = SerialParallelizationPolicy()
        self.parallelization_policy = parallelization_policy
        if selector is None:
            selector = Selector(1)
        self.selector = selector
        self.array_keys_mapping = array_keys_mapping
        self.input_edges_number = 0
        self.looped_edges_number = 0
        self.activated_input_edges_number = 0
        self.transfers = []
        self.is_term_state = False
        self._branching_states_history = None
        self._proxy_state = None

    def idle_run(self, idle_run_type, branching_states_history):
        """Walk the graph from this state without executing any edge.

        The transfers are first sorted by ``edge.order`` and printed.  With
        ``IdleRunType.INIT`` the input/looped edge counters are accumulated;
        with ``IdleRunType.CLEANUP`` the activation counter is reset.  The
        walk then continues recursively into the output states.
        ``branching_states_history`` is the list of state names describing the
        branch through which this state was reached.
        """
        self.transfers.sort(key=lambda tr: tr.edge.order)
        print(self.name)
        for tr in self.transfers:
            print("\t", tr.edge.order, tr.edge.pred_name, tr.edge.morph_name)
        proxy = self._proxy_state
        if proxy is not None:
            return proxy.idle_run(idle_run_type, branching_states_history)

        if idle_run_type == IdleRunType.INIT:
            self.input_edges_number += 1
            if self.input_edges_number != 1:
                if self._is_looped_branch(branching_states_history):
                    self.looped_edges_number += 1
                return  # no need to go further if we already were there
            if self._branching_states_history is None:
                self._branching_states_history = branching_states_history
        elif idle_run_type == IdleRunType.CLEANUP:
            self.activated_input_edges_number = 0
            history_known = self._branching_states_history is not None
            if history_known and self._is_looped_branch(branching_states_history):
                self._branching_states_history = None
                return
            if not history_known:
                self._branching_states_history = branching_states_history
        else:
            self.activated_input_edges_number += 1  # BUG: here we need to choose somehow whether we proceed or not

        if len(self.transfers) == 1:
            # A single successor does not open a new branch: history is passed as is.
            only_successor = self.transfers[0].output_state
            only_successor.idle_run(idle_run_type, branching_states_history)
            return
        for transfer in self.transfers:
            successor = transfer.output_state
            successor.idle_run(idle_run_type, branching_states_history + [successor.name])

    def connect_to(self, term_state, edge=None):
        """Append a transfer leading to ``term_state`` through ``edge``."""
        link = Transfer(edge, term_state)
        self.transfers.append(link)

    def replace_with_graph(self, graph):
        """Delegate this state to ``graph``.

        ``graph.init_state`` becomes the proxy of this state and the terminal
        state of ``graph`` takes over this state's transfers.
        """
        self._proxy_state = graph.init_state
        graph.term_state.transfers = self.transfers

    def run(self, data, implicit_parallelization_info=None):
        """Activate one input edge and, if the state is ready, pick what runs next.

        Returns a pair ``(transfer function, implicit parallelization info)``.
        The pair is ``(None, None)`` while the state still waits for other
        incoming edges, and ``(transfer_to_termination, None)`` when the state
        has no transfers.

        Raises GraphUnexpectedTermination when the selector returns a falsy
        value.
        """
        print('STATE {}, just entered, implicit_parallelization_info: {}'.format(self.name, implicit_parallelization_info))
        proxy = self._proxy_state
        if proxy is not None:
            return proxy.run(data, implicit_parallelization_info)

        self._activate_input_edge(implicit_parallelization_info)
        print('STATE {}, required input: {}, active: {}, looped: {}'.format(self.name, self.input_edges_number, self.activated_input_edges_number, self.looped_edges_number))
        if not self._ready_to_transfer(implicit_parallelization_info):
            # it means that this state waits for some incoming edges (it is a point of collision of several edges)
            return None, None
        self._reset_activity(implicit_parallelization_info)
        if self.is_term_state:
            implicit_parallelization_info = None
        if len(self.transfers) == 0:
            return transfer_to_termination, None

        dynamic_keys_mapping = build_dynamic_keys_mapping(implicit_parallelization_info)
        predicate_values = [
            transfer.edge.predicate(data, dynamic_keys_mapping)
            for transfer in self.transfers
        ]
        selected_edges = self.selector.func(predicate_values)
        print(selected_edges)
        if not selected_edges:
            raise GraphUnexpectedTermination(
                'State {}: Predicate values {} do not conform selection policy'.format(self.name, predicate_values))
        selected_transfers = [
            self.transfers[idx]
            for idx, flag in enumerate(selected_edges)
            if flag == True
        ]
        print( selected_transfers)
        transfer_func = self.parallelization_policy.make_transfer_func(
            selected_transfers,
            array_keys_mapping=self.array_keys_mapping,
            implicit_parallelization_info=implicit_parallelization_info,
        )
        return transfer_func, implicit_parallelization_info

    def _activate_input_edge(self, implicit_parallelization_info=None):
        """Count one more activated input edge (per branch when parallelized)."""
        if implicit_parallelization_info is None or self.is_term_state:
            self.activated_input_edges_number += 1
            return
        if isinstance(self.activated_input_edges_number, int):
            # First activation inside a parallelized part: switch to per-branch counters.
            self.activated_input_edges_number = [0] * implicit_parallelization_info.branches_number
        self.activated_input_edges_number[implicit_parallelization_info.branch_i] += 1

    def _ready_to_transfer(self, implicit_parallelization_info=None):
        """Tell whether enough input edges are activated to leave this state.

        Looped edges are not required.  A terminal state reached under implicit
        parallelization needs one activation per branch instead.
        """
        required = self.input_edges_number - self.looped_edges_number
        if implicit_parallelization_info is None:
            return self.activated_input_edges_number == required
        if self.is_term_state:
            return self.activated_input_edges_number == implicit_parallelization_info.branches_number
        return self.activated_input_edges_number[implicit_parallelization_info.branch_i] == required

    def _reset_activity(self, implicit_parallelization_info=None):
        """Forget the branching history and reset the activation counter.

        The counter is decremented by one when the state is ready and has a
        looped edge; otherwise it is set to zero.
        """
        self._branching_states_history = None
        per_branch = implicit_parallelization_info is not None and not self.is_term_state
        keep_rest = self._ready_to_transfer(implicit_parallelization_info) and self._has_loop()
        if keep_rest:
            if per_branch:
                self.activated_input_edges_number[implicit_parallelization_info.branch_i] -= 1
            else:
                self.activated_input_edges_number -= 1
        elif per_branch:
            self.activated_input_edges_number[implicit_parallelization_info.branch_i] = 0
        else:
            self.activated_input_edges_number = 0

    def _is_looped_branch(self, branching_states_history):
        """Tell whether the stored history is contained in ``branching_states_history``."""
        stored = set(self._branching_states_history)
        return stored.issubset(branching_states_history)

    def _has_loop(self):
        """Tell whether at least one looped input edge was counted."""
        return self.looped_edges_number != 0
274

275
def transfer_to_termination(data):
    """Transfer function that leads nowhere: always yields ``None`` as the next state."""
    next_state = None
    return next_state

class SerialParallelizationPolicy:
    """Policy that executes the selected transfers of a state one after another."""

    def __init__(self):
        pass

    def make_transfer_func(self, morphisms, array_keys_mapping=None, implicit_parallelization_info=None):
        """Build the function that performs ``morphisms`` and returns the next state.

        Args:
            morphisms: transfers selected in the state; each must provide
                ``transfer(data, dynamic_keys_mapping=...)`` returning the
                state it leads to.
            array_keys_mapping: when not None, the single transfer is executed
                once per element of the array found in ``data`` under that
                mapping (implicit parallelization).
            implicit_parallelization_info: info of the branch the state was
                reached in, or None.

        Returns:
            A function ``f(data)`` returning the next state, or None when a
            transfer leads to no state or ``'__EXCEPTION__'`` appears in
            ``data``.

        Raises (from the returned function):
            BadGraphStructure: ``array_keys_mapping`` is given but the number
                of transfers is not exactly one.
            Exception: no transfer function is left to run.
        """
        def _morph(data):
            print("\tmorphisms:",len(morphisms))
            if array_keys_mapping is None:
                dynamic_keys_mapping = build_dynamic_keys_mapping(implicit_parallelization_info)
                next_morphs = [partial(morphism.transfer, dynamic_keys_mapping=dynamic_keys_mapping) for morphism in morphisms]
                next_impl_para_infos = [implicit_parallelization_info for _ in morphisms]
            else:
                if len(morphisms) != 1:
                    raise BadGraphStructure('Impossible to create implicit paralleilzation in the state with {} output edges'.format(len(morphisms)))
                proxy_data = aux.ProxyDict(data, keys_mappings=array_keys_mapping)
                # Any mapped key will do: only the length of the array is needed.
                anykey = next(iter(array_keys_mapping.keys()))
                implicit_branches_number = len(proxy_data[anykey])
                next_morphs = []
                next_impl_para_infos = []
                for branch_i in range(implicit_branches_number):
                    implicit_parallelization_info_ = ImplicitParallelizationInfo(array_keys_mapping, implicit_branches_number, branch_i)
                    dynamic_keys_mapping = build_dynamic_keys_mapping(implicit_parallelization_info_)
                    # The selected morphisms are transfers, so the bound method
                    # has to be ``transfer`` exactly as in the serial branch above.
                    next_morphs.append(partial(morphisms[0].transfer, dynamic_keys_mapping=dynamic_keys_mapping))
                    next_impl_para_infos.append(implicit_parallelization_info_)
            # Run the pending transfers level by level until a single one is
            # left and no implicit branches remain to be joined.
            while len(next_morphs) != 1 or _requires_joint_of_implicit_parallelization(array_keys_mapping, next_impl_para_infos):
                if next_impl_para_infos == []:
                    raise Exception(str(len(next_morphs)))
                cur_morphs, next_morphs = next_morphs, []
                cur_impl_para_infos, next_impl_para_infos = next_impl_para_infos, []
                for morph, impl_para_info in zip(cur_morphs, cur_impl_para_infos):
                    next_state = morph(data)
                    if next_state is None:
                        return None
                    next_morph, next_impl_para_info = _run_state(next_state, data, impl_para_info)
                    if '__EXCEPTION__' in data:
                        return None
                    # A state still waiting for other incoming edges yields no
                    # transfer function and is simply skipped here.
                    if next_morph is not None:
                        next_morphs.append(next_morph)
                        next_impl_para_infos.append(next_impl_para_info)
            next_state = next_morphs[0](data)
            return next_state
        return _morph

338

339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364
class OnlyOneSelectionPolicy:
    """Selection policy accepting predicate values with exactly one ``True``."""

    def __init__(self):
        pass

    def select(self, predicate_values):
        """Return the one-element list with the index of the true predicate, else None."""
        hits = _get_trues(predicate_values)
        return hits if len(hits) == 1 else None

class AllSelectionPolicy:
    """Selection policy accepting predicate values only when all of them are ``True``."""

    def __init__(self):
        pass

    def select(self, predicate_values):
        """Return the indices of all predicates if every one is true, else None."""
        hits = _get_trues(predicate_values)
        return hits if len(hits) == len(predicate_values) else None

class BadGraphStructure(Exception):
    """Raised when the structure of the graph does not allow the requested execution."""

class GraphUnexpectedTermination(Exception):
    """Raised when a state cannot select any transfer to continue with."""

365 366 367 368 369 370 371 372
def _requires_joint_of_implicit_parallelization(array_keys_mapping, impl_para_infos):
    """Tell whether implicitly parallelized branches still have to be joined.

    This is the case only when ``array_keys_mapping`` is given and at least one
    item of ``impl_para_infos`` is not None.
    """
    if array_keys_mapping is None:
        return False
    return any(info is not None for info in impl_para_infos)

373 374 375
def _get_trues(boolean_list):
    """Return the positions of the items of ``boolean_list`` that are equal to True."""
    # The comparison with True is intentional: merely truthy values such as
    # 2 or 'a' are not counted.
    return [
        position
        for position, item in enumerate(boolean_list)
        if item == True
    ]

376 377 378 379 380 381 382 383 384
#def _run_state(state, data, implicit_parallelization_info=None):
#    try:
#        next_morphism = state.run(data, implicit_parallelization_info)
#    except GraphUnexpectedTermination as e:
#        data['__EXCEPTION__'] = str(e)
#        return None
#    return next_morphism

def _run_state(state, data, implicit_parallelization_info=None):
    """Run ``state`` and return its ``(transfer function, parallelization info)`` pair.

    A GraphUnexpectedTermination raised by the state is not propagated: its
    message is stored in ``data['__EXCEPTION__']`` and ``(None, None)`` is
    returned instead.
    """
    try:
        transfer_func, impl_para_info = state.run(data, implicit_parallelization_info)
    except GraphUnexpectedTermination as err:
        data['__EXCEPTION__'] = str(err)
        return None, None
    else:
        return transfer_func, impl_para_info


def build_dynamic_keys_mapping(implicit_parallelization_info=None):
    """Build the keys mapping for one branch of implicit parallelization.

    Returns an empty dict when no info is given.  Otherwise every key of
    ``array_keys_mapping`` is mapped to an ``aux.ArrayItemGetter`` built from
    the key's path and the index of the branch.
    """
    if implicit_parallelization_info is None:
        return {}
    return {
        key: aux.ArrayItemGetter(keys_path, implicit_parallelization_info.branch_i)
        for key, keys_path in implicit_parallelization_info.array_keys_mapping.items()
    }