提问人:JamesTheAwesomeDude 提问时间:11/7/2020 最后编辑:JamesTheAwesomeDude 更新时间:1/12/2021 访问量:248
在 Popen.stdin 上轮询/等待 HUP
Polling/awaiting HUP on Popen.stdin
问:
我正在用 Python 为 GNU dd(1)
编写一个基于 Zenity 的状态监视器。
由于我所针对的系统的限制,包装器必须在 Python 2 上运行,并且不能拉入外部库。
其中的要求是 Zenity 的“取消”按钮在尚未完成时终止 dd。
我必须毫不拖延地执行以下操作(即触发/驱动/立即);如果同时满足/触发以下多个条件,则按所列顺序执行:
- 当 Zenity 退出时,终止 dd
- 当 dd 写入其时,munge+转发该数据给 Zenity 的
stderr
stdin
- 当 dd 退出时,如果其返回码不为 0,则终止 Zenity
但是,epoll 对象似乎只在 dd 的输出上触发;它永远不会在 Zenity 退出时触发,尽管我在 Zenity 上注册了.EPOLLHUP
stdin
这应该/如何做到?我知道 epoll 是唯一可用于正确触发 的输出的原语(通过);我也明白它是一个不奇怪的原语,可能不适合在 Zenity 退出时触发。(如果需要,我可以在这个文件中实现更多的逻辑;这样做比引入任何第三方库要好得多,无论它有多小或“常见”。我重申,我知道 epoll 使用起来很笨拙,可能需要大量的胶合逻辑。dd
EPOLLIN
或者:如果 epoll 不是监控其出口的正确原语,那么在以 Python 2 兼容的方式监控子进程的输出的同时监控退出子进程的正确方法是什么?subprocess
(我本身并不需要多线程功能;按顺序执行所有操作将完全符合规范;但是,如果在这种情况下,为了避免繁忙循环,多线程编程是绝对必要的,那就这样吧。
以下是我到目前为止的完整代码。
#!/usr/bin/env python
from __future__ import division
import sys,os,stat,fcntl,select,subprocess,re
def main(args=sys.argv[1:]):
fname = parseifname(args)
n = sizeof(fname)
dcmd = ['dd'] + args + ['status=progress']
zcmd = ['zenity', '--progress', '--time-remaining']
#Launch dd
dd = subprocess.Popen(dcmd, stderr=subprocess.PIPE)
set_nonblocking(dd.stderr)
#Launch Zenity
zenity = subprocess.Popen(zcmd, stdin=subprocess.PIPE)
set_direct(zenity.stdin)#TODO: why doesn't this line work?*
#set title/status
zenity.stdin.write(('#%s\n' % ' '.join(dcmd)).encode())
zenity.stdin.flush()#*i.e. instances of this line shouldn't be necessary...
#We want to trigger on all of the following:
toPoll = [
(dd.stderr, select.EPOLLIN #dd status update
| select.EPOLLHUP), #dd exit
(zenity.stdin, select.EPOLLHUP), #Zenity exit
]
calcPercent = genCalcPercent(n)
with ePoll(toPoll) as E:
rBytes = re.compile(r'\r(\d+) bytes'.encode())
while dd.poll() is None:
evs = E.poll()#TODO: I'm not sure if this is blocking, or if I've induced a busy loop...
for fn,ev in evs:
if fn == dd.stderr.fileno():
if (ev & select.EPOLLIN):
#dd sent some output
line = dd.stderr.read()
m = rBytes.match(line)
#sys.stderr.buffer.write(line)
if m:
x = int(m.groups()[0])
zenity.stdin.write(('%f\n' % calcPercent(x)).encode())
zenity.stdin.flush()
if (ev & select.EPOLLHUP):
#dd exited
pass#The containing loop will handle this; don't need to take action
if fn == zenity.stdin.fileno():
if (ev & select.EPOLLHUP):#TODO: WHY DOESN'T THIS ACTIVATE??
#Zenity exited
dd.terminate()
if dd.returncode == 0:
#dd exited successfully
zenity.stdin.write('100\n'.encode())
zenity.stdin.flush()
else:
zenity.terminate()
# Functions below here #
def parseifname(argv=sys.argv[:1], default='/dev/stdin'):
'''Given dd's argument list, attempts to return the name of that file which dd would use as its input file'''
M = re.compile(r'^if=(.*)$')
ifname = default
for x in argv:
m = M.match(x)
if m:
ifname = m.groups()[0]
return ifname
def sizeof(fname):
'''Attempts to find the length, in bytes, of the given file or block device'''
s = os.stat(fname)
m = s.st_mode
try:
if stat.S_ISREG(m):
#Regular File
n = s.st_size
elif stat.S_ISBLK(m):
#Block Device
n = int(subprocess.check_output(['lsblk', '-b', '-n', '-l', '-o', 'SIZE', '-d', fname]))
else:
raise ValueError("file is neither a standard nor block file")
except:
#Unidentifiable
n = None
return n
def genCalcPercent(n):
'''Given n, returns a function which, given x, returns either x as a percentage of n, or some sane stand-in for such'''
if n:
#Input file size was identified
return lambda x: 100 * x / n
else:
#Input file size was unidentifiable, zero, or otherwise falsy
#we'll at least try to visually show progress
return lambda x: 99.99999 * (1 - 0.5 ** (x / 2**32))
def set_nonblocking(fd=sys.stdin):
'''Appends os.O_NONBLOCK to the given file descriptor's flags.'''
return fcntl.fcntl(
fd,
fcntl.F_SETFL,
fcntl.fcntl(fd,fcntl.F_GETFL)
| os.O_NONBLOCK
)
def set_direct(fd=sys.stdout):
'''Appends os.O_SYNC to the given file descriptor's flags.'''
return fcntl.fcntl(
fd,
fcntl.F_SETFL,
fcntl.fcntl(fd,fcntl.F_GETFL)
| os.O_SYNC
)
class ePoll:
'''Thin contextlib wrapper around select.epoll; allows tersely watching multiple events'''
def __init__(self, fdSpecs):
self._E = select.epoll()
self._fds = []
for fd,opt in fdSpecs:
self._E.register(fd,opt)
self._fds.append(fd)
def __enter__(self):
return self._E
def __exit__(self, exc_type, exc_value, traceback):
for fd in self._fds:
self._E.unregister(fd)
self._E.close()
if __name__=='__main__':
main()
答:
事实证明,答案很简单:使用而不是 .EPOLLERR
EPOLLHUP
我严重怀疑这是否是正确的解决方案*,但它似乎确实有效:
import select, subprocess, time
E = select.epoll()
p = subprocess.Popen(["sh", "-c", "sleep 3"], stdin=subprocess.PIPE)
#time.sleep(5) #Uncomment this line to convince yourself there is no race-condition here
E.register(p.stdin, select.EPOLLERR)
print("Polling...")
evs = E.poll()
print("Caught events!")
assert (p.stdin.fileno(), select.EPOLLERR) in evs
E.close()
*如果这不是正确的解决方案,那么即使是现在,我也非常想发现正确的解决方案是什么。
(如果有人关心的话,这是原始问题的脚本的完整版本。
评论