在 Popen.stdin 上轮询/等待 HUP

Polling/awaiting HUP on Popen.stdin

提问人:JamesTheAwesomeDude 提问时间:11/7/2020 最后编辑:JamesTheAwesomeDude 更新时间:1/12/2021 访问量:248

问:

我正在用 Python 为 GNU dd(1) 编写一个基于 Zenity 的状态监视器。 由于我所针对的系统的限制,包装器必须在 Python 2 上运行,并且不能拉入外部库。

其中的要求是 Zenity 的“取消”按钮在尚未完成时终止 dd。

我必须毫不拖延地执行以下操作(即触发/驱动/立即);如果同时满足/触发以下多个条件,则按所列顺序执行:

  • 当 Zenity 退出时,终止 dd
  • 当 dd 向其 stderr 写入数据时,对该数据进行处理(munge)并转发给 Zenity 的 stdin
  • 当 dd 退出时,如果其返回码不为 0,则终止 Zenity

但是,epoll 对象似乎只在 dd 的输出上触发;它永远不会在 Zenity 退出时触发,尽管我已在 Zenity 的 stdin 上注册了 EPOLLHUP。

这应该/如何做到?我知道 epoll 是唯一可用于正确触发 dd 的输出的原语(通过 EPOLLIN);我也明白它是一个笨拙的原语,可能不适合在 Zenity 退出时触发。(如果需要,我可以在这个文件中实现更多的逻辑;这样做比引入任何第三方库要好得多,无论它有多小或“常见”。我重申,我知道 epoll 使用起来很笨拙,可能需要大量的胶合逻辑。)

或者:如果 epoll 不是监控子进程退出的正确原语,那么以兼容 Python 2 的方式,在监控一个 subprocess 的输出的同时监控另一个 subprocess 的退出,正确的方法是什么?

(我本身并不需要多线程功能;按顺序执行所有操作将完全符合规范;但是,如果在这种情况下,为了避免繁忙循环,多线程编程是绝对必要的,那就这样吧。)


以下是我到目前为止的完整代码。

#!/usr/bin/env python
from __future__ import division
import sys,os,stat,fcntl,select,subprocess,re

def main(args=sys.argv[1:]):
    '''Runs dd with the given arguments and mirrors its progress into a Zenity progress dialog.

    args -- dd's own argument list (defaults to this script's command-line arguments)

    While dd is running, three things are handled, in this order of priority:
      1. Zenity exits (e.g. "Cancel" was pressed): dd is terminated.
      2. dd writes a progress line to its stderr: a percentage is forwarded to Zenity's stdin.
      3. dd exits: on a non-zero return code, Zenity is terminated.
    '''
    fname = parseifname(args)
    n = sizeof(fname)

    dcmd = ['dd'] + args + ['status=progress']
    zcmd = ['zenity', '--progress', '--time-remaining']

    #Launch dd
    dd = subprocess.Popen(dcmd, stderr=subprocess.PIPE)
    set_nonblocking(dd.stderr)

    #Launch Zenity
    zenity = subprocess.Popen(zcmd, stdin=subprocess.PIPE)
    #NOTE(review): O_SYNC is a kernel-level flag and does not control any
    #buffering done by the Python file object itself, so the explicit flush()
    #calls below are kept -- confirm whether this call is needed at all.
    set_direct(zenity.stdin)

    #set title/status
    zenity.stdin.write(('#%s\n' % ' '.join(dcmd)).encode())
    zenity.stdin.flush()

    #When the reading side of a pipe goes away, the kernel reports EPOLLERR
    #(not EPOLLHUP) on the writing side, so both flags must be treated as
    #"Zenity exited". epoll reports both regardless of the registered mask.
    zenityGone = select.EPOLLHUP | select.EPOLLERR

    #We want to trigger on all of the following:
    toPoll = [
        (dd.stderr, select.EPOLLIN       #dd status update
                  | select.EPOLLHUP),    #dd exit
        (zenity.stdin, zenityGone),      #Zenity exit
    ]

    calcPercent = genCalcPercent(n)

    with ePoll(toPoll) as E:
        rBytes = re.compile(r'\r(\d+) bytes'.encode())
        ddFd = dd.stderr.fileno()
        zenityFd = zenity.stdin.fileno()
        while dd.poll() is None:
            #With no timeout, epoll.poll() blocks until an event arrives,
            #so this is not a busy loop.
            evs = E.poll()

            #Zenity's exit takes priority over everything else; checking it
            #first also avoids writing progress into an already-broken pipe.
            if any(fn == zenityFd and (ev & zenityGone) for fn, ev in evs):
                dd.terminate()
                dd.wait()#reap dd so that it does not linger as a zombie
                return

            for fn, ev in evs:
                if fn == ddFd and (ev & select.EPOLLIN):
                    #dd sent some output
                    line = dd.stderr.read()
                    #A non-blocking read may yield nothing; skip it then
                    m = rBytes.match(line) if line else None
                    if m:
                        x = int(m.groups()[0])
                        zenity.stdin.write(('%f\n' % calcPercent(x)).encode())
                        zenity.stdin.flush()
                #EPOLLHUP on dd's stderr (dd exited) needs no action here:
                #the containing loop's dd.poll() check handles it.
        if dd.returncode == 0:
            #dd exited successfully
            zenity.stdin.write('100\n'.encode())
            zenity.stdin.flush()
        else:
            zenity.terminate()

# Functions below here #

def parseifname(argv=sys.argv[:1], default='/dev/stdin'):
    '''Returns the value of the last "if=" operand found in argv, or default when there is none.

    argv    -- dd's argument list
    default -- the name returned when no "if=" operand is present
    '''
    #NOTE(review): the default for argv is sys.argv[:1] (the program name only),
    #whereas main() defaults to sys.argv[1:] -- confirm which one is intended.
    operand = re.compile(r'^if=(.*)$')
    found = [hit.group(1) for hit in map(operand.match, argv) if hit]
    #When several "if=" operands are given, the last one wins
    return found[-1] if found else default

def sizeof(fname):
    '''Attempts to find the length, in bytes, of the given file or block device

    fname -- path of the file or block device to measure

    Returns the size as an integer, or None when fname is neither a regular
    file nor a block device, or when lsblk cannot be run or its output cannot
    be parsed. Raises OSError when fname cannot be stat()ed at all.
    '''
    s = os.stat(fname)
    m = s.st_mode
    if stat.S_ISREG(m):
        #Regular File
        return s.st_size
    if stat.S_ISBLK(m):
        #Block Device
        try:
            return int(subprocess.check_output(['lsblk', '-b', '-n', '-l', '-o', 'SIZE', '-d', fname]))
        except (OSError, ValueError, subprocess.CalledProcessError):
            #lsblk is missing, failed, or printed something that is not a number.
            #Only these are swallowed, so Ctrl-C and SystemExit still propagate.
            return None
    #Unidentifiable
    return None

def genCalcPercent(n):
    '''Builds the function that maps a byte count x to a progress percentage.

    n -- total input size in bytes; any falsy value (None, 0) means "unknown"

    Both formulas rely on true division (this file enables it for Python 2
    through "from __future__ import division").
    '''
    def exactPercent(x):
        #Input file size was identified: plain percentage of the total
        return 100 * x / n

    def asymptoticPercent(x):
        #Input file size was unidentifiable, zero, or otherwise falsy:
        #show visible progress that climbs towards, but never reaches, 100
        return 99.99999 * (1 - 0.5 ** (x / 2**32))

    return exactPercent if n else asymptoticPercent

def set_nonblocking(fd=sys.stdin):
    '''Adds os.O_NONBLOCK to the status flags of the given file (or descriptor).

    Returns whatever the F_SETFL fcntl call returns.
    '''
    #Read the current flags first so that the existing ones are preserved
    currentFlags = fcntl.fcntl(fd, fcntl.F_GETFL)
    return fcntl.fcntl(fd, fcntl.F_SETFL, currentFlags | os.O_NONBLOCK)

def set_direct(fd=sys.stdout):
    '''Requests os.O_SYNC in the status flags of the given file (or descriptor).

    Returns whatever the F_SETFL fcntl call returns.
    '''
    #NOTE(review): fcntl(2) states that on Linux F_SETFL can only change
    #O_APPEND, O_ASYNC, O_DIRECT, O_NOATIME and O_NONBLOCK, so this request may
    #be silently ignored there -- confirm on the target system.
    currentFlags = fcntl.fcntl(fd, fcntl.F_GETFL)
    return fcntl.fcntl(fd, fcntl.F_SETFL, currentFlags | os.O_SYNC)

class ePoll:
    '''Thin context-manager wrapper around select.epoll; allows tersely watching multiple events

    fdSpecs is an iterable of (fd, eventmask) pairs; each one is registered on
    a fresh epoll object. Entering the context yields that raw select.epoll
    object; leaving it unregisters every fd and closes the epoll object.
    '''
    def __init__(self, fdSpecs):
        self._E = select.epoll()
        self._fds = []
        try:
            for fd,opt in fdSpecs:
                self._E.register(fd,opt)
                self._fds.append(fd)
        except Exception:
            #Do not leak the epoll descriptor when a registration fails
            self._E.close()
            raise
    def __enter__(self):
        return self._E
    def __exit__(self, exc_type, exc_value, traceback):
        try:
            for fd in self._fds:
                self._E.unregister(fd)
        finally:
            #Always release the epoll descriptor, even when an unregister
            #fails (e.g. because the watched fd was closed in the meantime)
            self._E.close()

#Run the monitor only when this file is executed as a script, not when it is imported
if __name__=='__main__':
    main()
python 子进程 管道 epoll

评论

0赞 JamesTheAwesomeDude 11/7/2020
虽然它不会直接回答这个问题,但如果(正如我所怀疑的那样)整个事情可以用例如两行 Perl 来完成,我将非常高兴看到它是如何完成的,并且这个问题将成为历史。

答:

0赞 JamesTheAwesomeDude 11/14/2020 #1

事实证明,答案很简单:使用 EPOLLERR 而不是 EPOLLHUP。

我严重怀疑这是否是正确的解决方案*,但它似乎确实有效

import select, subprocess, time

# Minimal demonstration: detect that a child process went away by watching
# the write end of the pipe connected to its stdin for EPOLLERR.
E = select.epoll()

# The child holds the read end of the pipe for about 3 seconds, then exits.
p = subprocess.Popen(["sh", "-c", "sleep 3"], stdin=subprocess.PIPE)

#time.sleep(5) #Uncomment this line to convince yourself there is no race-condition here
# Per epoll_ctl(2), EPOLLERR is what the write end of a pipe reports once the
# read end has been closed.
E.register(p.stdin, select.EPOLLERR)

print("Polling...")
# No timeout is given, so this call blocks until an event is reported.
evs = E.poll()
print("Caught events!")

# The only expected event is EPOLLERR on our end of the child's stdin pipe.
assert (p.stdin.fileno(), select.EPOLLERR) in evs

E.close()

*如果这不是正确的解决方案,那么即使是现在,我也非常想发现正确的解决方案是什么。


(如果有人关心的话,这是原始问题的脚本的完整版本