Hello Folks:

I am trying to add a new function, stackless.select() to the Stackless.py 
module. This select() is loosely based on the select() in Newsqueak/Go. Once I 
get this select() to work, I would like to figure out some Python 
syntax to support it. One step deeper into PyPy :-)

For the most part, select() is pretty straightforward to implement. 
In two of my test cases, test4.py and test5.py, the select() function seems to 
work. Unfortunately, I get a sys.exit() error. 

I invoke the programme with 

python ../bin/py.py --withmod_-stackless testX.py

and I get
(test4.py)
THE RESULT FROM SELECT -> hello world
schedule(): returned from _schedule_switch
schedule(): about to _schedule_switch
schedule(): returned from _schedule_switch

File "../py.py", line 171, in <module>
    sys.exit(main_(sys.argv))
  File "../py.py", line 142, in main_
    verbose=interactiveconfig.verbose):
  File "/home/andrew/lab/pypy-dist/pypy/interpreter/main.py", line 103, in 
run_toplevel
    f()
....

 File "/home/andrew/lab/pypy-dist/pypy/interpreter/executioncontext.py", line 
48, in leave
    self.framestack.pop()
  File "/home/andrew/lab/pypy-dist/pypy/interpreter/miscutils.py", line 34, in 
pop
    return self.items.pop()
IndexError: pop from empty list

and

(test5.py)
THE RESULT FROM SELECT -> hello world
schedule(): returned from _schedule_switch
schedule(): about to _schedule_switch
XXX error, nesting_level = 1
Traceback (most recent call last):
  File "../py.py", line 171, in <module>
    sys.exit(main_(sys.argv))
  File "../py.py", line 142, in main_
    verbose=interactiveconfig.verbose):
  File "/home/andrew/lab/pypy-dist/pypy/interpreter/main.py", line 103, in 
run_toplevel
    f()
...

 File "/home/andrew/lab/pypy-dist/pypy/interpreter/gateway.py", line 513, in 
funcrun_obj
    w_result = activation._run(space, scope_w)
  File "<codegen /home/andrew/lab/pypy-dist/pypy/tool/sourcetools.py:177>", 
line 3, in _run_UWS_AppCoroutine
  File "/home/andrew/lab/pypy-dist/pypy/module/_stackless/interp_coroutine.py", 
line 90, in w_switch
    self.switch()
  File "/home/andrew/lab/pypy-dist/pypy/rlib/rcoroutine.py", line 256, in switch
    incoming_frame = state.update(self).switch()
AttributeError: 'tuple' object has no attribute 'switch'


I wrote a third test, test6.py which blocks select() and then terminates 
because there is no tasklet on the other end. I do this on purpose. Test6.py 
works correctly making me suspect something is going wrong with the switching. 
Although I understand most of the Stackless.py module's code, I am still very 
green when it comes to PyPy and  the various coroutine packages.

I understand the PyPy team has not being developing Stackless.py for
a while. However I would greatly appreciate insights into figuring out
what is going  wrong. I would also appreciate insights into how to effectively 
debug PyPy. Eventually I would like to get into a position where I could 
support Stackless.py and continue its development. 

I have enclosed my copy of Stackless.py, the output, and some test
scripts. 

Cheers,
Andrew


      
"""
The Stackless module allows you to do multitasking without using threads.
The essential objects are tasklets and channels.
Please refer to their documentation.
"""

DEBUG = True
RECEIVE = -1
SEND = 1

def debug(message):
    if DEBUG:
       print message

def dprint(*args):
    for arg in args:
        print arg,
    print

import traceback
import sys
import random

try:
    from _stackless import coroutine, greenlet
except ImportError: # we are running from CPython
    from greenlet import greenlet
    try:
        from functools import partial
    except ImportError: # we are not running python 2.5
        class partial(object):
            # just enough of 'partial' to be usefull
            def __init__(self, func, *argl, **argd):
                self.func = func
                self.argl = argl
                self.argd = argd

            def __call__(self):
                return self.func(*self.argl, **self.argd)

    class GWrap(greenlet):
        """This is just a wrapper around greenlets to allow
           to stick additional attributes to a greenlet.
           To be more concrete, we need a backreference to
           the coroutine object"""

    class MWrap(object):
        def __init__(self,something):
            self.something = something

        def __getattr__(self, attr):
            return getattr(self.something, attr)

    class coroutine(object):
        "we can't have greenlet as a base, because greenlets can't be rebound"

        def __init__(self):
            self._frame = None
            self.is_zombie = False

        def __getattr__(self, attr):
            return getattr(self._frame, attr)

        def __del__(self):
            self.is_zombie = True
            del self._frame
            self._frame = None

        def bind(self, func, *argl, **argd):
            """coro.bind(f, *argl, **argd) -> None.
               binds function f to coro. f will be called with
               arguments *argl, **argd
            """
            if self._frame is None or self._frame.dead:
                self._frame = frame = GWrap()
                frame.coro = self
            if hasattr(self._frame, 'run') and self._frame.run:
                raise ValueError("cannot bind a bound coroutine")
            self._frame.run = partial(func, *argl, **argd)

        def switch(self):
            """coro.switch() -> returnvalue
               switches to coroutine coro. If the bound function
               f finishes, the returnvalue is that of f, otherwise
               None is returned
            """
            try:
                return greenlet.switch(self._frame)
            except TypeError, exp: # self._frame is the main coroutine
                return greenlet.switch(self._frame.something)

        def kill(self):
            """coro.kill() : kill coroutine coro"""
            self._frame.throw()

        def _is_alive(self):
            if self._frame is None:
                return False
            return not self._frame.dead
        is_alive = property(_is_alive)
        del _is_alive

        def getcurrent():
            """coroutine.getcurrent() -> the currently running coroutine"""
            try:
                return greenlet.getcurrent().coro
            except AttributeError:
                return _maincoro
        getcurrent = staticmethod(getcurrent)

        def __reduce__(self):
            raise TypeError, 'pickling is not possible based upon greenlets'

    _maincoro = coroutine()
    maingreenlet = greenlet.getcurrent()
    _maincoro._frame = frame = MWrap(maingreenlet)
    frame.coro = _maincoro
    del frame
    del maingreenlet

from collections import deque

import operator
__all__ = 'run getcurrent getmain schedule tasklet channel coroutine \
                TaskletExit greenlet'.split()

_global_task_id = 0
_squeue = None
_main_tasklet = None
_main_coroutine = None
_last_task = None
_channel_callback = None
_schedule_callback = None

def _scheduler_remove(value):
    try:
        del _squeue[operator.indexOf(_squeue, value)]
    except ValueError:pass

def _scheduler_append(value, normal=True):
    if normal:
        _squeue.append(value)
    else:
        _squeue.rotate(-1)
        _squeue.appendleft(value)
        _squeue.rotate(1)

def _scheduler_contains(value):
    try:
        operator.indexOf(_squeue, value)
        return True
    except ValueError:
        return False

def _scheduler_switch(current, next):
    global _last_task
    prev = _last_task
    if (_schedule_callback is not None and
        prev is not next):
        _schedule_callback(prev, next)
    _last_task = next
    assert not next.blocked
    if next is not current:
        next.switch()
    return current


class TaskletExit(Exception):pass

def set_schedule_callback(callback):
    global _schedule_callback
    _schedule_callback = callback

def set_channel_callback(callback):
    global _channel_callback
    _channel_callback = callback

def getruncount():
    return len(_squeue)

class bomb(object):
    def __init__(self, exp_type=None, exp_value=None, exp_traceback=None):
        self.type = exp_type
        self.value = exp_value
        self.traceback = exp_traceback

    def raise_(self):
        raise self.type, self.value, self.traceback

#
# helpers for pickling
#

_stackless_primitive_registry = {}

def register_stackless_primitive(thang, retval_expr='None'):
    import types
    func = thang

    debug("I am in the registry")
    if isinstance(thang, types.MethodType):
        func = thang.im_func
    code = func.func_code
    _stackless_primitive_registry[code] = retval_expr
    # It is not too nice to attach info via the code object, but
    # I can't think of a better solution without a real transform.
    debug("I am leaving the registry")

def rewrite_stackless_primitive(coro_state, alive, tempval):
    flags, state, thunk, parent = coro_state
    for i, frame in enumerate(state):
        retval_expr = _stackless_primitive_registry.get(frame.f_code)
        if retval_expr:
            # this tasklet needs to stop pickling here and return its value.
            tempval = eval(retval_expr, globals(), frame.f_locals)
            state = state[:i]
            coro_state = flags, state, thunk, parent
    return coro_state, alive, tempval

#
#

class channel(object):
    """
    A channel object is used for communication between tasklets.
    By sending on a channel, a tasklet that is waiting to receive
    is resumed. If there is no waiting receiver, the sender is suspended.
    By receiving from a channel, a tasklet that is waiting to send
    is resumed. If there is no waiting sender, the receiver is suspended.

    Attributes:

    preference
    ----------
    -1: prefer receiver
     0: don't prefer anything
     1: prefer sender

    Pseudocode that shows in what situation a schedule happens:

    def send(arg):
        if !receiver:
            schedule()
        elif schedule_all:
            schedule()
        else:
            if (prefer receiver):
                schedule()
            else (don't prefer anything, prefer sender):
                pass

        NOW THE INTERESTING STUFF HAPPENS

    def receive():
        if !sender:
            schedule()
        elif schedule_all:
            schedule()
        else:
            if (prefer sender):
                schedule()
            else (don't prefer anything, prefer receiver):
                pass

        NOW THE INTERESTING STUFF HAPPENS

    schedule_all
    ------------
    True: overwrite preference. This means that the current tasklet always
          schedules before returning from send/receive (it always blocks).
          (see Stackless/module/channelobject.c)
    """

    def __init__(self, label=''):
        self.balance = 0
        self.closing = False
        self.queue = deque()
        self.label = label
        self.preference = -1
        self.schedule_all = False

    def __str__(self):
        return 'channel[%s](%s,%s)' % (self.label, self.balance, self.queue)

    def close(self):
        """
        channel.close() -- stops the channel from enlarging its queue.
        
        If the channel is not empty, the flag 'closing' becomes true.
        If the channel is empty, the flag 'closed' becomes true.
        """
        self.closing = True

    @property
    def closed(self):
        return self.closing and not self.queue

    def open(self):
        """
        channel.open() -- reopen a channel. See channel.close.
        """
        self.closing = False

    def _channel_action(self, arg, d):
        """
        d == -1 : receive
        d ==  1 : send

        the original CStackless has an argument 'stackl' which is not used
        here.

        'target' is the peer tasklet to the current one
        """
        do_schedule=False
        assert abs(d) == 1
        source = getcurrent()
        source.tempval = arg
        if d > 0:
            cando = self.balance < 0
            dir = d
        else:
            cando = self.balance > 0
            dir = 0

        if _channel_callback is not None:
            _channel_callback(self, source, dir, not cando)
        self.balance += d
        if cando:
            # communication 1): there is somebody waiting
            target = self.queue.popleft()
            source.tempval, target.tempval = target.tempval, source.tempval
            target.selected = self
            target.blocked = 0
            if self.schedule_all:
                # always schedule 
                _scheduler_append(target)
                do_schedule = True
            elif self.preference == -d:
                _scheduler_append(target, False)
                do_schedule = True
            else:
                _scheduler_append(target)
        else:
            # communication 2): there is nobody waiting
#            if source.block_trap:
#                raise RuntimeError("this tasklet does not like to be blocked")
#            if self.closing:
#                raise StopIteration()
            source.blocked = d
            self.queue.append(source)
            _scheduler_remove(getcurrent())
            do_schedule = True

        if do_schedule:
            schedule()

        retval = source.tempval


        if isinstance(retval, bomb):
            retval.raise_()
        return retval

    def receive(self):
        """
        channel.receive() -- receive a value over the channel.
        If no other tasklet is already sending on the channel,
        the receiver will be blocked. Otherwise, the receiver will
        continue immediately, and the sender is put at the end of
        the runnables list.
        The above policy can be changed by setting channel flags.
        """
        return self._channel_action(None, -1)

    register_stackless_primitive(receive, retval_expr='receiver.tempval')

    def send_exception(self, exp_type, msg):
        self.send(bomb(exp_type, exp_type(msg)))

    def send_sequence(self, iterable):
        for item in iterable:
            self.send(item)

    def send(self, msg):
        """
        channel.send(value) -- send a value over the channel.
        If no other tasklet is already receiving on the channel,
        the sender will be blocked. Otherwise, the receiver will
        be activated immediately, and the sender is put at the end of
        the runnables list.
        """
        return self._channel_action(msg, 1)
            
    register_stackless_primitive(send)
            
class tasklet(coroutine):
    """
    A tasklet object represents a tiny task in a Python thread.
    At program start, there is always one running main tasklet.
    New tasklets can be created with methods from the stackless
    module.
    """
    tempval = None
    def __new__(cls, func=None, label=''):
        res = coroutine.__new__(cls)
        res.label = label
        res._task_id = None
        return res

    def __init__(self, func=None, label=''):
        coroutine.__init__(self)
        self._init(func, label)

        """
        add new attribute to support select
        principle is that a tasklet using select should be able to be
        serialised
        """
        self.selected = None
        self.selectedChannels = {}

    def _init(self, func=None, label=''):
        global _global_task_id
        self.func = func
        self.alive = False
        self.blocked = False
        self._task_id = _global_task_id
        self.label = label
        _global_task_id += 1

    def __str__(self):
        return '<tasklet[%s, %s]>' % (self.label,self._task_id)

    __repr__ = __str__

    def __call__(self, *argl, **argd):
        return self.setup(*argl, **argd)

    def bind(self, func):
        """
        Binding a tasklet to a callable object.
        The callable is usually passed in to the constructor.
        In some cases, it makes sense to be able to re-bind a tasklet,
        after it has been run, in order to keep its identity.
        Note that a tasklet can only be bound when it doesn't have a frame.
        """
        if not callable(func):
            raise TypeError('tasklet function must be a callable')
        self.func = func

    def kill(self):
        """
        tasklet.kill -- raise a TaskletExit exception for the tasklet.
        Note that this is a regular exception that can be caught.
        The tasklet is immediately activated.
        If the exception passes the toplevel frame of the tasklet,
        the tasklet will silently die.
        """
        if not self.is_zombie:
            coroutine.kill(self)
            _scheduler_remove(self)
            self.alive = False

    def setup(self, *argl, **argd):
        """
        supply the parameters for the callable
        """
        if self.func is None:
            raise TypeError('cframe function must be callable')
        func = self.func
        def _func():
            try:
                try:
                    func(*argl, **argd)
                except TaskletExit:
                    pass
            finally:
                _scheduler_remove(self)
                self.alive = False

        self.func = None
        coroutine.bind(self, _func)
        self.alive = True
        _scheduler_append(self)
        return self

    def run(self):
        self.insert()
        _scheduler_switch(getcurrent(), self)

    def insert(self):
        if self.blocked:
            raise RuntimeError, "You cannot run a blocked tasklet"
            if not self.alive:
                raise RuntimeError, "You cannot run an unbound(dead) tasklet"
        _scheduler_append(self)

    def remove(self):
        if self.blocked:
            raise RuntimeError, "You cannot remove a blocked tasklet."
        if self is getcurrent():
            raise RuntimeError, "The current tasklet cannot be removed."
            # not sure if I will revive this  " Use t=tasklet().capture()"
        _scheduler_remove(self)
        
    def __reduce__(self):
        one, two, coro_state = coroutine.__reduce__(self)
        assert one is coroutine
        assert two == ()
        # we want to get rid of the parent thing.
        # for now, we just drop it
        a, b, c, d = coro_state
        if d:
            assert isinstance(d, coroutine)
        coro_state = a, b, c, None
        coro_state, alive, tempval = rewrite_stackless_primitive(coro_state, self.alive, self.tempval)
        inst_dict = self.__dict__.copy()
        inst_dict.pop('tempval', None)
        return self.__class__, (), (coro_state, alive, tempval, inst_dict)

    def __setstate__(self, (coro_state, alive, tempval, inst_dict)):
        coroutine.__setstate__(self, coro_state)
        self.__dict__.update(inst_dict)
        self.alive = alive
        self.tempval = tempval



def getmain():
    """
    getmain() -- return the main tasklet.
    """
    return _main_tasklet

def getcurrent():
    """
    getcurrent() -- return the currently executing tasklet.
    """

    curr = coroutine.getcurrent()
    if curr is _main_coroutine:
        return _main_tasklet
    else:
        return curr

_run_calls = []
def run():
    """
    run_watchdog(timeout) -- run tasklets until they are all
    done, or timeout instructions have passed. Tasklets must
    provide cooperative schedule() calls.
    If the timeout is met, the function returns.
    The calling tasklet is put aside while the tasklets are running.
    It is inserted back after the function stops, right before the
    tasklet that caused a timeout, if any.
    If an exception occours, it will be passed to the main tasklet.

    Please note that the 'timeout' feature is not yet implemented
    """
    curr = getcurrent()
    _run_calls.append(curr)
    _scheduler_remove(curr)
    try:
        schedule()
        assert not _squeue
    finally:
        _scheduler_append(curr)
    
def schedule_remove(retval=None):
    """
    schedule(retval=stackless.current) -- switch to the next runnable tasklet.
    The return value for this call is retval, with the current
    tasklet as default.
    schedule_remove(retval=stackless.current) -- ditto, and remove self.
    """
    _scheduler_remove(getcurrent())
    r = schedule(retval)
    return r


def schedule(retval=None):
    """
    schedule(retval=stackless.current) -- switch to the next runnable tasklet.
    The return value for this call is retval, with the current
    tasklet as default.
    schedule_remove(retval=stackless.current) -- ditto, and remove self.
    """
    mtask = getmain()
    curr = getcurrent()
    if retval is None:
        retval = curr
    while True:
        if _squeue:
            if _squeue[0] is curr:
                # If the current is at the head, skip it.
                _squeue.rotate(-1)
                
            task = _squeue[0]
            #_squeue.rotate(-1)
        elif _run_calls:
            task = _run_calls.pop()
        else:
            raise RuntimeError('No runnable tasklets left.')
        debug("schedule(): about to _schedule_switch")
        _scheduler_switch(curr, task)
        debug("schedule(): returned from _schedule_switch")
        if curr is _last_task:
            # We are in the tasklet we want to resume at this point.
            return retval


def select(list):
    debug("I have entered select")
    result = None
    ready = []
    source = getcurrent()

    # is there a channel that will not block? If so, put it on the
    # ready list
    for channel, operation, value in list:
        if (channel.balance > 0 and operation == RECEIVE) or \
           (channel.balance < 0 and operation == SEND): \
              ready.append((channel,operation, value))

    # if there are ready channels, randomly select one
    # and return from select()
    l = len(ready)
    if l != 0:
       unblockedChannel, operation, value = ready[random.randint(0, l - 1)]
       debug("unblocked channel and operation " + str(unblockedChannel) +\
            str(operation)) 
       debug("going into channel action")
       result = unblockedChannel._channel_action(value, operation)
       debug("returning from channel action")
    else:
       debug("getting ready to block")

       source.blocked = operation

       for channel, operation, value in list:
           channel.queue.append(source)
           channel.balance += operation
           source.selectedChannels[channel] = (operation, value)

       debug("suspending")
               
       _scheduler_remove(source)

       schedule()
       debug("resuming")

       result = source.tempval

       unblockedChannel = source.selected
       debug('source selected ->' + str(source.selected))
       debug("unblockedChannel ->" + str(source.selected))
       source.selected = None
       source.blocked = False
       del(source.selectedChannels[unblockedChannel])

       debug("removing tasklet from channels")
       # now remove self from all the other channels, ouch
       for channel, (operation, value) in source.selectedChannels.items():
           print "removal ", channel, operation, value
           channel.balance -= operation
           channel.queue.remove(source)
           print "removal ", channel, operation, value

    return unblockedChannel, result

register_stackless_primitive(select, retval_expr='selector.tempval')

def _init():
    global _main_tasklet
    global _global_task_id
    global _squeue
    global _last_task
    _global_task_id = 0
    _main_tasklet = coroutine.getcurrent()
    try:
        _main_tasklet.__class__ = tasklet
    except TypeError: # we are running pypy-c
        class TaskletProxy(object):
            """TaskletProxy is needed to give the _main_coroutine tasklet behaviour"""
            def __init__(self, coro):
                self._coro = coro

            def __getattr__(self,attr):
                return getattr(self._coro,attr)

            def __str__(self):
                return '<tasklet %s a:%s>' % (self._task_id, self.is_alive)

            def __reduce__(self):
                return getmain, ()

            __repr__ = __str__


        global _main_coroutine
        _main_coroutine = _main_tasklet
        _main_tasklet = TaskletProxy(_main_tasklet)
        assert _main_tasklet.is_alive and not _main_tasklet.is_zombie
    _last_task = _main_tasklet
    tasklet._init.im_func(_main_tasklet, label='main')
    _squeue = deque()
    _scheduler_append(_main_tasklet)

_init()
import stackless

"""
test5.py

the purpose of this test is to check whether select will properly
block, unblock and return the correct value
"""
RECEIVE = -1
SEND = 1

def sender(ch):
    stackless.schedule()      #ensure that selector goes first
    ch.send("hello world")
    print "Sender done"


def selector(list):
    channel, result = stackless.select(list)
    print "THE RESULT FROM SELECT ->", result


if __name__ == "__main__":
   list = []

   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))

   stackless.tasklet(selector)(list)
   stackless.tasklet(sender)(list[0][0])
   stackless.run()
   print "THE PROGRAMMING IS ENDING"
   

import stackless

RECEIVE = -1
SEND = 1

def sender(ch):
    stackless.schedule()      #ensure that selector goes first
    ch.send("hello world")
    print "Sender done"


def selector(list):
    channel, result = stackless.select(list)
    print "THE RESULT FROM SELECT ->", result


if __name__ == "__main__":
   list = []

   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))
   list.append((stackless.channel(),RECEIVE, None))

   stackless.tasklet(selector)(list)
   stackless.run()
   print "THE PROGRAMMING IS ENDING"
   

Attachment: results4
Description: Binary data

Attachment: results5
Description: Binary data

_______________________________________________
[email protected]
http://codespeak.net/mailman/listinfo/pypy-dev

Reply via email to