import json
import time
import itertools

import dask
import dask.array as da
from dask.distributed import Client, Event, Future, Queue, Variable, comm, get_client


class metadata:
    # Lightweight record describing a published array.
    def __init__(self, name):
        self.name = name
        self.index = []   # instance attribute, so it is not shared between objects
        self.data = ""
        self.shap = None  # shape of the described array
        self.typ = ""     # dtype name


def connect(sched_file):
    # The scheduler-file path arrives from the simulation side as a
    # sequence of character codes (e.g. when called through a C or
    # Fortran binding); decode it and drop the trailing terminator
    # before reading the JSON scheduler file.
    sched = ''.join(chr(i) for i in sched_file)
    with open(sched[:-1]) as f:
        s = json.load(f)
    client = get_client(s["address"])
    return client


def init(sched_file, rank, size, arrays, deisa_arrays_dtype):
    # Entry point for each simulation process: connect to the Dask
    # scheduler and build this rank's bridge to the analytics side.
    client = connect(sched_file)
    return Bridge(client, size, rank, arrays, deisa_arrays_dtype)


class Bridge:
    def __init__(self, client, size, rank, arrays, deisa_arrays_dtype):
        self.client = client
        self.rank = rank
        listw = Variable("workers").get()
        if size > len(listw):
            # More simulation processes than workers: ranks share workers
            # round-robin (e.g. with 4 workers, ranks 0 and 4 both map to
            # worker 0).
            self.workers = [listw[rank % len(listw)]]
        else:
            # More workers than processes: each rank gets a contiguous
            # block of k workers.
            k = len(listw) // size
            self.workers = listw[rank * k:rank * k + k]
        self.arrays = arrays
        self.positions = {}
        for name in self.arrays:
            self.arrays[name]["dtype"] = str(deisa_arrays_dtype[name])
            self.arrays[name]["timedim"] = self.arrays[name]["timedim"][0]
            # Chunk position of this rank in each dimension of this array;
            # assumes a perfect domain decomposition (each start divisible
            # by the corresponding subsize).
            self.positions[name] = [
                self.arrays[name]["starts"][i] // self.arrays[name]["subsizes"][i]
                for i in range(len(self.arrays[name]["sizes"]))
            ]
        if rank == 0:
            # Publish the array descriptions once for the analytics side.
            Queue("Arrays").put(self.arrays)

    def create_key(self, timestep, name):
        # Key of this rank's chunk of `name` at the given timestep: the
        # time-dimension entry of the chunk position is replaced by the
        # timestep.
        position = list(self.positions[name])
        position[self.arrays[name]["timedim"]] = timestep
        return ("deisa-" + name, tuple(position))

    def publish_data(self, data, data_name, timestep):
        if timestep == 0:
            # Wait until the analytics client has built its dask arrays
            # (it sets the "Done" event in Adaptor.get_data).
            Event("Done").wait()
        key = self.create_key(timestep, data_name)
        # Insert a time dimension of size 1 in place; assigning to .shape
        # never copies, and raises an AttributeError if a copy would be
        # required, so such a failure surfaces immediately.
        shap = list(data.shape)
        timedim = self.arrays[data_name]["timedim"]
        data.shape = tuple(shap[:timedim] + [1] + shap[timedim:])
        # `keys=` and `deisa=True` are not standard Client.scatter
        # arguments; they require the patched dask.distributed that Deisa
        # is built against.  Retry until the scatter succeeds.
        f = self.client.scatter(data, direct=True, workers=self.workers,
                                keys=[key], deisa=True)
        while f.status != 'finished':
            f = self.client.scatter(data, direct=True, workers=self.workers,
                                    keys=[key], deisa=True)
        data = None
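

# Example (sketch): simulation-side usage on one MPI rank.  The encoded
# scheduler-file path, rank/size values and the array description below are
# hypothetical placeholders, not part of this module.  `sizes` includes the
# time dimension (here 100 timesteps), and `local_chunk` is this rank's
# (32, 32) numpy block at each step.
#
#   bridge = init(encoded_path, rank, size,
#                 arrays={"temperature": {"sizes": [100, 64, 64],
#                                         "subsizes": [1, 32, 32],
#                                         "starts": [0, 0, 0],
#                                         "timedim": [0]}},
#                 deisa_arrays_dtype={"temperature": "float64"})
#   for t in range(100):
#       bridge.publish_data(local_chunk, "temperature", t)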


class Adaptor:
    def __init__(self, Sworker, scheduler_info):
        with open(scheduler_info) as f:
            s = json.load(f)
        self.adr = s["address"]
        # msgpack cannot serialize very large messages, so restrict the
        # client to the dask and pickle serializers.
        self.client = Client(self.adr, serializers=['dask', 'pickle'])
        dask.config.set({
            "distributed.deploy.lost-worker-timeout": 60,
            "distributed.worker.memory.target": 0.95,
            "distributed.worker.memory.spill": 0.97,
            "distributed.worker.memory.terminate": 0.99,
        })
        # Poll the scheduler until all expected workers have joined, then
        # publish their addresses for the simulation-side bridges.
        self.workers = [comm.get_address_host_port(i, strict=False)
                        for i in self.client.scheduler_info()["workers"].keys()]
        while len(self.workers) != Sworker:
            time.sleep(0.5)  # avoid hammering the scheduler while waiting
            self.workers = [comm.get_address_host_port(i, strict=False)
                            for i in self.client.scheduler_info()["workers"].keys()]
        Variable("workers").set(self.workers)

    def create_array(self, name, shape, chunksize, dtype, timedim):
        # One future per chunk: each key matches the one the corresponding
        # simulation rank uses in Bridge.publish_data, so the future
        # resolves when that chunk is scattered.  `deisa=True` is not a
        # standard Future argument; it requires Deisa's patched
        # dask.distributed.
        chunks_in_each_dim = [shape[i] // chunksize[i] for i in range(len(shape))]
        positions = itertools.product(*[range(i) for i in chunks_in_each_dim])
        items = []
        for m in positions:
            f = Future(key=("deisa-" + name, m), inform=True, deisa=True)
            d = da.from_delayed(dask.delayed(f), shape=chunksize, dtype=dtype)
            items.append([list(m), d])
        # Assemble the per-chunk arrays into one dask array.
        return da.block(self.array_sort(items))

    def create_array_list(self, name, shape, chunksize, dtype, timedim):
        # Same as create_array, but returns a list of dask arrays, one per
        # timestep, instead of a single array with a time dimension.
        chunks_in_each_dim = [shape[i] // chunksize[i] for i in range(len(shape))]
        positions = itertools.product(*[range(i) for i in chunks_in_each_dim])
        items = []
        for m in positions:
            f = Future(key=("deisa-" + name, m), inform=True, deisa=True)
            d = da.from_delayed(dask.delayed(f), shape=chunksize, dtype=dtype)
            items.append([list(m), d])
        arrays = []
        for i in self.array_sort(items):
            arrays.append(da.block(i))
        return arrays

    def array_sort(self, ListDs):
        # Recursively turn flat [position, chunk] pairs into the nested
        # list-of-lists layout that da.block expects, sorted along each
        # dimension.
        if len(ListDs[0][0]) == 0:
            return ListDs[0][1]
        dico = dict()
        for e in ListDs:
            # Group by the first coordinate, recurse on the remaining ones.
            dico.setdefault(e[0][0], []).append([e[0][1:], e[1]])
        return [self.array_sort(dico[k]) for k in sorted(dico.keys())]
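
    # For example, with hypothetical chunks a..d on a 2 x 2 grid:
    #   array_sort([[[0, 0], a], [[0, 1], b], [[1, 0], c], [[1, 1], d]])
    #   -> [[a, b], [c, d]]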

    def get_data(self, as_list=False):
        # Block until the simulation's rank 0 has published the array
        # descriptions, then build one lazy dask array per variable.
        arrays = dict()
        self.arrays_desc = Queue("Arrays").get()
        for name in self.arrays_desc:
            desc = self.arrays_desc[name]
            if not as_list:
                arrays[name] = self.create_array(
                    name, desc["sizes"], desc["subsizes"],
                    desc["dtype"], desc["timedim"])
            else:  # TODO test this
                arrays[name] = self.create_array_list(
                    name, desc["sizes"], desc["subsizes"],
                    desc["dtype"], desc["timedim"])
        # Barrier after the creation of all the dask arrays: signal the
        # simulation-side bridges that they may start publishing.
        Event("Done").set()
        return arrays


def Initialization(Sworker, scheduler_info):
    # Entry point for the analytics script.
    return Adaptor(Sworker, scheduler_info)
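

# Example (sketch): analytics-side usage.  The scheduler file name, worker
# count and variable name below are hypothetical placeholders.
#
#   adaptor = Initialization(4, "scheduler.json")
#   arrays = adaptor.get_data()          # blocks until descriptions arrive
#   temperature = arrays["temperature"]  # lazy dask array over all timesteps
#   print(temperature.mean().compute())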