GitList - GitList

Browse code

using asyncio and create user interface

Bas Nijholt authored on 16/08/2017 18:18:11
Showing 2 changed files

Learner-parallel-plotter.ipynb index 7f4a4e3..c51db09 100644
learner.py index e605779..23fc339 100644

@@ -25,12 +25,43 @@
                         "outputs": [],
                         "source": [
                          "import numpy as np\n",
                     -    "import learner\n",
                     +    "import adalearner\n",
                          "from time import sleep\n",
                          "from random import randint\n",
                          "from functools import partial\n",
                     +    "import ipyparallel\n",
                     +    "import concurrent.futures\n",
                          "import importlib\n",
                     -    "importlib.reload(learner)"
                     +    "importlib.reload(adalearner)"
                     +   ]
                     +  },
                     +  {
                     +   "cell_type": "code",
                     +   "execution_count": null,
                     +   "metadata": {
                     +    "collapsed": true
                     +   },
                     +   "outputs": [],
                     +   "source": [
                     +    "import asyncio\n",
                     +    "from ipykernel.eventloops import register_integration\n",
                     +    "\n",
                     +    "@register_integration('asyncio')\n",
                     +    "def loop_asyncio(kernel):\n",
                     +    "    '''Start a kernel with asyncio event loop support.'''\n",
                     +    "    loop = asyncio.get_event_loop()\n",
                     +    "\n",
                     +    "    def kernel_handler():\n",
                     +    "        loop.call_soon(kernel.do_one_iteration)\n",
                     +    "        loop.call_later(kernel._poll_interval, kernel_handler)\n",
                     +    "\n",
                     +    "    loop.call_soon(kernel_handler)\n",
                     +    "    try:\n",
                     +    "        if not loop.is_running():\n",
                     +    "            loop.run_forever()\n",
                     +    "    finally:\n",
                     +    "        loop.run_until_complete(loop.shutdown_asyncgens())\n",
                     +    "        loop.close()"
+                        ]
                        },
+                       {
@@ -38,13 +69,27 @@
                         "execution_count": null,
                         "metadata": {},
                         "outputs": [],
                     +   "source": [
                     +    "%gui asyncio"
                     +   ]
                     +  },
                     +  {
                     +   "cell_type": "code",
                     +   "execution_count": null,
                     +   "metadata": {
                     +    "collapsed": true
                     +   },
                     +   "outputs": [],
                         "source": [
                          "def func(x, wait=True):\n",
                     +    "    \"\"\"Function with a sharp peak on a smooth background\"\"\"\n",
                     +    "    import numpy as np\n",
                     +    "    from time import sleep\n",
                          "    x = np.asarray(x)\n",
                     -    "    a = 10\n",
                     +    "    a = 0.001\n",
                          "    if wait:\n",
                     -    "        sleep(randint(1, 3))\n",
                     -    "    return np.sin(x) + 0.0001/(0.0001 + x**2)"
                     +    "        sleep(np.random.randint(1, 3))\n",
                     +    "    return x + a**2/(a**2 + (x)**2)"
+                        ]
                        },
+                       {
@@ -60,33 +105,21 @@
                         "metadata": {},
                         "outputs": [],
                         "source": [
                     -    "import tornado\n",
                     -    "from distributed import Client\n",
                     +    "learner = adalearner.Learner1D(func, client=ipyparallel.Client())\n",
                          "\n",
                     -    "io = tornado.ioloop.IOLoop.current()\n",
                     -    "\n",
                     -    "# Initialize the learner\n",
                     -    "learner1d = learner.Learner1D()\n",
                     -    "learner1d.add_point(-1, func(-1))\n",
                     -    "learner1d.add_point(1, func(1))"
                     +    "learner.add_point(-1, func(-1))\n",
                     +    "learner.add_point(1, func(1))"
+                        ]
                        },
+                       {
                         "cell_type": "code",
                         "execution_count": null,
                     -   "metadata": {},
                     +   "metadata": {
                     +    "collapsed": true
                     +   },
                         "outputs": [],
                         "source": [
                     -    "async def dask_run(learner):\n",
                     -    "    async with Client(asynchronous=True) as client:\n",
                     -    "        await learner.run(func, client, learner1d ,goal=lambda learner1d: learner1d.loss() < 0.000001)\n",
                     -    "\n",
                     -    "def plot(data):\n",
                     -    "        xy = [(k, v) for k, v in sorted(data.items()) if v is not None]\n",
                     -    "        if not xy:\n",
                     -    "            return hv.Scatter([])\n",
                     -    "        x, y  = np.array(xy, dtype=float).T\n",
                     -    "        return hv.Scatter((x, y))"
                     +    "learner.start()"
+                        ]
                        },
+                       {
@@ -96,7 +129,7 @@
                         "outputs": [],
                         "source": [
                          "data_stream = Stream.define('data', data=param.ObjectSelector(default=dict()))\n",
                     -    "dm = hv.DynamicMap(plot, streams=[data_stream()])\n",
                     +    "dm = hv.DynamicMap(learner.plot, streams=[data_stream()])\n",
                          "dm"
+                        ]
                        },
@@ -106,9 +139,12 @@
                         "metadata": {},
                         "outputs": [],
                         "source": [
                     -    "pc = tornado.ioloop.PeriodicCallback(lambda: dm.event(data=learner1d.data), 100)\n",
                     -    "pc.start()\n",
                     -    "io.add_callback(dask_run, learner)"
                     +    "async def monitor(delay=1):\n",
                     +    "    while True:\n",
                     +    "        dm.event(data=learner.data)\n",
                     +    "        await asyncio.sleep(delay)\n",
                     +    "        \n",
                     +    "monitor_task = learner.ioloop.create_task(monitor())"
+                        ]
                        },
+                       {
@@ -116,7 +152,9 @@
                         "execution_count": null,
                         "metadata": {},
                         "outputs": [],
                     -   "source": []
                     +   "source": [
                     +    "learner.task.print_stack()"
                     +   ]
+                       }
                       ],
                       "metadata": {

learner.py

History View file @ e3a7009

                     similarity index 67%
                     rename from learner.py
                     rename to adalearner.py
@@ -1,20 +1,74 @@
+                    +
                     +import abc
                     +import asyncio
                      import heapq
                     -from math import sqrt
                      import itertools
                     -import multiprocessing
                     +import os
                     +from math import sqrt
                     +import concurrent
                     +import distributed
                     +import holoviews as hv
                     +import ipyparallel
                      import numpy as np
                     -import tornado
                     -def add_arg(func):
                     -    """Make func return (arg, func(arg))."""
                     -    def wrapper(*args):
                     -        return (args[0], func(*args))
                     -    return wrapper
                     class BaseLearner(metaclass=abc.ABCMeta):
                         """Abstract base for learners that keep their points in a dict.

                         ``self.data`` maps every x to its y.  A y of ``None`` marks a point
                         whose value has not been provided yet.  Subclasses must implement
                         ``loss``, ``choose_points`` and ``interpolate``.
                         """

                         def __init__(self, xdata=None, ydata=None):
                             """Initialize the learner.

                             Parameters
                             ----------
                             xdata : number or iterable of numbers, optional
                                 x coordinate(s) of the initial data.  Nothing is added when
                                 this is None.
                             ydata : number, None, or iterable of numbers and None, optional
                                 y value(s) belonging to `xdata`; passed to `add_data`
                                 together with `xdata`.
                             """
                             # A dict {x_n: y_n} for quick checking of local
                             # properties.
                             self.data = {}

                             # Add initial data if provided
                             if xdata is not None:
                                 self.add_data(xdata, ydata)

                         def add_data(self, xvalues, yvalues):
                             """Add data to the intervals.

                             Parameters
                             ----------
                             xvalues : iterable of numbers
                                 Values of the x coordinate.
                             yvalues : iterable of numbers and None
                                 Values of the y coordinate. `None` means that the value will be
                                 provided later.

                             Notes
                             -----
                             If the arguments cannot be zipped (for example two plain
                             numbers), they are added as one single point.  A ``TypeError``
                             raised by `add_point` itself is not caught.
                             """
                             try:
                                 # zip() rejects a non-iterable argument right away, so this
                                 # only catches the "a single point was passed" case and not
                                 # errors coming from add_point().
                                 pairs = zip(xvalues, yvalues)
                             except TypeError:
                                 self.add_point(xvalues, yvalues)
                                 return

                             for x, y in pairs:
                                 self.add_point(x, y)

                         def add_point(self, x, y):
                             """Update the data: store `y` under the key `x`."""
                             self.data[x] = y

                         def remove_unfinished(self):
                             """Drop every point whose y value is still ``None``."""
                             self.data = {k: v for k, v in self.data.items() if v is not None}

                         @abc.abstractmethod
                         def loss(self):
                             """Must be implemented by subclasses."""
                             pass

                         @abc.abstractmethod
                         def choose_points(self, n=10):
                             """Must be implemented by subclasses."""
                             pass

                         @abc.abstractmethod
                         def interpolate(self):
                             """Must be implemented by subclasses."""
                             pass
                     -class Learner1D(object):
                     +class _Learner1D(BaseLearner):
                          """ Learns and predicts a 1D function.
                          Description
@@ -38,6 +92,7 @@ class Learner1D(object):
                              """
                              # Set internal variables
                     +        super().__init__(xdata, ydata)
                              # A dict storing the loss function for each interval x_n.
                              self.losses = {}
@@ -45,9 +100,6 @@ class Learner1D(object):
                              # A dict {x_n: [x_{n-1}, x_{n+1}]} for quick checking of local
                              # properties.
                              self.neighbors = {}
                     -        # A dict {x_n: y_n} for quick checking of local
                     -        # properties.
                     -        self.data = {}
                              # Bounding box [[minx, maxx], [miny, maxy]].
                              self._bbox = [[np.inf, -np.inf], [np.inf, -np.inf]]
@@ -55,10 +107,6 @@ class Learner1D(object):
                              self._scale = [0, 0]
                              self._oldscale = [0, 0]
                     -        # Add initial data if provided
                     -        if xdata is not None:
                     -            self.add_data(xdata, ydata)
+                    -
                          def interval_loss(self, x_left, x_right):
                              """Calculate loss in the interval x_left, x_right.
@@ -76,26 +124,10 @@ class Learner1D(object):
                              else:
                                  return max(self.losses.values())
                     -    def add_data(self, xvalues, yvalues):
                     -        """Add data to the intervals.
+                    -
                     -        Parameters
                     -        ----------
                     -        xvalues : iterable of numbers
                     -            Values of the x coordinate.
                     -        yvalues : iterable of numbers and None
                     -            Values of the y coordinate. `None` means that the value will be
                     -            provided later.
                     -        """
                     -        try:
                     -            for x, y in zip(xvalues, yvalues):
                     -                self.add_point(x, y)
                     -        except TypeError:
                     -            self.add_point(xvalues, yvalues)
                          def add_point(self, x, y):
                              """Update the data."""
                     -        self.data[x] = y
                     +        super().add_point(x, y)
                              # Update the scale.
                              self._bbox[0][0] = min(self._bbox[0][0], x)
@@ -138,7 +170,7 @@ class Learner1D(object):
                              return xs
                          def remove_unfinished(self):
                     -        self.data = {k: v for k, v in self.data.items() if v is not None}
                     +        super().remove_unfinished()
                              # Update the scale.
                              self._bbox[0][0] = min(self.data.keys())
                              self._bbox[0][1] = max(self.data.keys())
@@ -149,13 +181,6 @@ class Learner1D(object):
                              self.interpolate()
                     -    def get_largest_interval(self):
                     -        xs = sorted(x for x, y in self.data.items() if y is not None)
                     -        if len(xs) < 2:
                     -            return np.inf
                     -        else:
                     -            return np.diff(xs).max()
+                    -
                          def interpolate(self):
                              xdata = []
                              ydata = []
@@ -200,19 +225,79 @@ class Learner1D(object):
                                      pass
                     -# We can't use API that is specific to any particular asynchronous
                     -# framework, so we have to roll our own utility functions.
                     class AsyncExecutor:
                         """Give an executor a ``submit`` method that goes through an event loop.

                         Parameters
                         ----------
                         executor :
                             Object passed as the executor argument of
                             ``ioloop.run_in_executor``.
                         ioloop :
                             Event loop whose ``run_in_executor`` schedules the calls.
                         """

                         def __init__(self, executor, ioloop):
                             self.executor = executor
                             self.ioloop = ioloop

                         def submit(self, f, *args, **kwargs):
                             """Schedule ``f(*args, **kwargs)`` and return the loop's future.

                             Returns whatever ``ioloop.run_in_executor`` returns.
                             """
                             if kwargs:
                                 # run_in_executor() only forwards positional arguments, so
                                 # keyword arguments have to be bound to the callable first.
                                 from functools import partial
                                 f = partial(f, **kwargs)
                             return self.ioloop.run_in_executor(self.executor, f, *args)
+                    +
+                    +
                     def ensure_async_executor(client, ioloop):
                         """Return an object with a ``submit`` method for the given client.

                         Parameters
                         ----------
                         client : ipyparallel.Client, distributed.Client or None
                             * ``ipyparallel.Client``: its ``executor()`` is wrapped in an
                               `AsyncExecutor`.
                             * ``distributed.Client``: returned unchanged.
                             * ``None``: a ``ThreadPoolExecutor`` with ``os.cpu_count()``
                               workers is created and wrapped in an `AsyncExecutor`.
                         ioloop :
                             Event loop handed to `AsyncExecutor`.

                         Raises
                         ------
                         NotImplementedError
                             If `client` is of any other type.
                         """
                         if isinstance(client, ipyparallel.Client):
                             return AsyncExecutor(client.executor(), ioloop)

                         if isinstance(client, distributed.Client):
                             # The original assigned the (still unbound) local name to
                             # itself here, which raises UnboundLocalError.  Using the
                             # client directly is presumably what was intended -- TODO
                             # confirm that its futures can be awaited by the caller.
                             return client

                         if client is None:
                             # Import the submodule explicitly: ``import concurrent`` alone
                             # does not guarantee that ``concurrent.futures`` is loaded.
                             import concurrent.futures
                             pool = concurrent.futures.ThreadPoolExecutor(
                                 max_workers=os.cpu_count())
                             return AsyncExecutor(pool, ioloop)

                         raise NotImplementedError(
                             'Unsupported client type: {!r}'.format(type(client)))
+                    +
+                    +
                     +def runner(learner):
                     +    if isinstance(learner.client, ipyparallel.Client):
                     +        ncores = len(learner.client)
                     +    elif isinstance(learner.client, distributed.Client):
                     +        ncores = sum(learner.client.ncores().values())
                     +    elif learner.client is None:
                     +        ncores = os.cpu_count()
                     +    else:
                     +        raise NotImplementedError('Blabla')
                     -async def any_complete(futures):
                     -    total = tornado.concurrent.Future()
                     -    for f in futures:
                     -        f.add_done_callback(lambda f: total.set_result(None)
                     -                            if not total.done() else None)
                     -    await total
                     -    return [f for f in futures if f.done()]
                     +    return run_asyncio(learner.func, learner.executor, learner, ncores=ncores,
                     +                       goal=lambda learner: learner.loss() < 0.1)
                     -async def run(f, executor, learner, goal, ncores=multiprocessing.cpu_count()):
                     class LearnerMixin:
                         """Mixin that runs a learner as a task on an event loop.

                         It is meant to be listed before a learner class in the bases, so
                         that ``super().__init__`` reaches that learner's constructor.
                         """

                         def __init__(self, func, *, client=None, goal=None, ioloop=None, **learner_kwargs):
                             """Store the run configuration and initialize the learner.

                             Parameters
                             ----------
                             func : callable
                                 Function to learn; stored as ``self.func``.
                             client : optional
                                 Passed to `ensure_async_executor` and stored as
                                 ``self.client``.
                             goal : optional
                                 Stored as ``self.goal``.  Previously this argument was
                                 dropped.  Note that `runner` in this module still applies
                                 its own stopping criterion.
                             ioloop : optional
                                 Event loop to use; ``asyncio.get_event_loop()`` when falsy.
                             **learner_kwargs
                                 Forwarded to the next ``__init__`` in the MRO.
                             """
                             self.ioloop = ioloop if ioloop else asyncio.get_event_loop()
                             # ensure_async_executor() returns an object with a ``submit``
                             # method suited to the kind of client that was passed.
                             self.executor = ensure_async_executor(client, self.ioloop)
                             self.client = client
                             self.func = func
                             self.goal = goal
                             self.task = None
                             super().__init__(**learner_kwargs)

                         def start(self):
                             """Create the task running `runner` for this learner on the loop."""
                             self.task = self.ioloop.create_task(runner(self))

                         def cancel(self):
                             """Cancel the task, if any.

                             Returns the result of ``task.cancel()``, or False when there
                             is no task.
                             """
                             if not self.task:
                                 return False
                             return self.task.cancel()
+                    +
+                    +
                     class Learner1D(LearnerMixin, _Learner1D):
                         """1D learner combined with the event-loop machinery of LearnerMixin."""

                         def plot(self, data=None):
                             """Return a ``hv.Scatter`` of the finished points.

                             Parameters
                             ----------
                             data : dict, optional
                                 Mapping {x: y} to plot; ``self.data`` is used when None.
                                 Entries whose y is None are left out.

                             The scatter is sliced with ``[-1.1:1.1, -1.1:1.1]`` before it
                             is returned.
                             """
                             points = self.data if data is None else data
                             finished = [item for item in sorted(points.items())
                                         if item[1] is not None]
                             if finished:
                                 xs, ys = np.array(finished, dtype=float).T
                                 scatter = hv.Scatter((xs, ys))
                             else:
                                 scatter = hv.Scatter([])
                             return scatter[-1.1:1.1, -1.1:1.1]
+                    +
+                    +
                     +async def run_asyncio(f, executor, learner, goal,
                     +                      ncores=os.cpu_count()):
                          xs = dict()
                          done = [None] * ncores
@@ -224,8 +309,7 @@ async def run(f, executor, learner, goal, ncores=multiprocessing.cpu_count()):
                              # Collect the results and add them to the learner
                              futures = list(xs.keys())
                     -        await any_complete(futures)
                     -        done = [fut for fut in futures if fut.done()]
                     +        done, _ = await asyncio.wait(futures, return_when=asyncio.FIRST_COMPLETED)
                              for fut in done:
                                  x = xs.pop(fut)
                                  # Need to explicitly await the future (even though we know the
@@ -234,7 +318,8 @@ async def run(f, executor, learner, goal, ncores=multiprocessing.cpu_count()):
                                  y = await fut
                                  learner.add_point(x, y)
                     -    # cancel any outstanding tasks
                     -    for fut in xs.keys():
                     -        fut.cancel()
                          learner.remove_unfinished()
                     +    # cancel any outstanding tasks
                     +    cancelled = all(fut.cancel() for fut in xs.keys())
                     +    if not cancelled:
                     +        raise RuntimeError('Some futures remain uncancelled')