Twisted spawnProcess,将一个进程的输出发送到另一个进程的输入

时间:2014-12-16 20:38:42

标签: python process twisted

我正在尝试使用twisted spawnProcess来复制这样的行为:

cat <input.txt | wc -w

这只是两个命令的一个例子,实际上我有自己的进程(比如python或bash脚本或外部程序),其中每个进程从stdin读取并写入stdout。就像上面的例子一样,我想把stdout从一个进程管道到另一个进程的stdin,我想用spawnProcess来做这个。我在这里使用了一些提示:

Twisted pipe two processes with spawnProcess

但我无法让它发挥作用。它只是在第二个spawnProcess协议上从stdin读取时挂起。我的代码在下面。我做错了什么?我怎样才能实现这个目标?从第一个中调用第二个spawnProcess是否更好?

#!/usr/bin/env python

from twisted.internet import protocol
from twisted.internet import reactor
import re
import os
import sys

class CatPP(protocol.ProcessProtocol):
    def __init__(self,input_data):
        self.input_data=input_data
        self.data = ""

    def connectionMade(self):
        print "connectionMade in CatPP! Now writing to stdin of cat"
        print "   writing this data: %s" % self.input_data
        self.transport.write(self.input_data+'\n')
        print "   closing stdin"
        self.transport.closeStdin() # tell them we're done
        print "   stdin closed"

    def outReceived(self, data):
        print "outReceived from cat! with %d bytes!" % len(data)
        self.data = self.data + data
        print "    received this: %s" % self.data

    def errReceived(self, data):
        print "errReceived from cat! with %d bytes!" % len(data)

    def inConnectionLost(self):
        print "inConnectionLost for cat! stdin is closed! (we probably did it)"

    def outConnectionLost(self):
        print "outConnectionLost for cat! The child closed their stdout!"
        # now is the time to examine what they wrote
        print "I saw cat write this:", self.data

    def errConnectionLost(self):
        print "errConnectionLost for cat! The child closed their stderr."

    def processExited(self, reason):
        print "processExited for cat, status %d" % (reason.value.exitCode,)

    def processEnded(self, reason):
        print "processEnded for cat, status %d" % (reason.value.exitCode,)

class WcPP(protocol.ProcessProtocol):
    def __init__(self):
        self.data = ""

    def connectionMade(self):
        print "connectionMade! Now reading from pipe to get stdin for wp"
        print "    reading from stdin"
        txt = sys.stdin.read()
        print "  Read this from stdin: %s" % (txt,)
        self.transport.write(txt)
        self.transport.closeStdin() # tell them we're done

    def outReceived(self, data):
        print "outReceived from cat! with %d bytes!" % len(data)
        self.data = self.data + data

    def errReceived(self, data):
        print "errReceived from cat! with %d bytes!" % len(data)

    def inConnectionLost(self):
        print "inConnectionLost for cat! stdin is closed! (we probably did it)"

    def outConnectionLost(self):
        print "outConnectionLost for cat! The child closed their stdout!"
        # now is the time to examine what they wrote
        print "Final output:", self.data
        #(dummy, lines, words, chars, file) = re.split(r'\s+', self.data)
        #print "I saw %s lines" % lines

    def errConnectionLost(self):
        print "errConnectionLost for cat! The child closed their stderr."

    def processExited(self, reason):
        print "processExited for cat, status %d" % (reason.value.exitCode,)

    def processEnded(self, reason):
        print "processEnded for cat, status %d" % (reason.value.exitCode,)
        reactor.stop()

readPipe, writePipe = os.pipe()

handle=open('junkin.txt','r')
cat_txt=handle.read()
handle.close()

pp1 = CatPP(cat_txt)
pp2 = WcPP()
reactor.spawnProcess(pp1, "cat", ["cat"], {}, childFDs={1: writePipe})
reactor.spawnProcess(pp2, "wc", ["wc", "-w"], {},childFDs={0: readPipe})
reactor.run()
try:
    os.close(readPipe)
except:
    print "Exception closing readPipe"
try:
    os.close(writePipe)
except:
    print "Exception closing writePipe"

2 个答案:

答案 0 :(得分:1)

这是一个有效的例子。

如果通过cat | wc进行管道传输,spawnProcess会复制管道,因此您需要关闭它们。

from twisted.internet import protocol
from twisted.internet import reactor
import os

class Writer(protocol.ProcessProtocol):
  def __init__(self, data):
    self.data = data
  def connectionMade(self):
    print "Writer -- connection made"
    self.transport.writeToChild(0, self.data)
    self.transport.closeChildFD(0)
  def childDataReceived(self, fd, data):
    pass
  def processEnded(self, status):
    pass

class Reader(protocol.ProcessProtocol):
  def __init__(self):
    pass
  def connectionMade(self):
    print "Reader -- connection made"
    pass
  def childDataReceived(self, fd, data):
    print "Reader -- childDataReceived"
    self.received = data
  def processEnded(self, status):
    print "process ended, got:", self.received

class WriteRead(protocol.ProcessProtocol):
  def __init__(self, data):
    self.data = data
  def connectionMade(self):
    self.transport.writeToChild(0, self.data)
    self.transport.closeChildFD(0)
  def childDataReceived(self, fd, data):
    self.received = data
    print "got data:", data
  def processEnded(self, status):
    print "process ended - now what?"

def test1(data):
    # just call wc
    p2 = reactor.spawnProcess(WriteRead(data), "wc", ["wc"], env=None, childFDs={0: "w", 1: "r"})
    reactor.run()

def test2(data):
    rfd, wfd = os.pipe()
    p1 = reactor.spawnProcess(Writer(data), "cat", ["cat"], env=None, childFDs={0:"w", 1: wfd })
    p2 = reactor.spawnProcess(Reader(),     "wc", ["wc", "-w"], env=None, childFDs={0: rfd, 1: "r"})
    os.close(rfd)
    os.close(wfd)
    reactor.run()

test2("this is a test")

答案 1 :(得分:0)

好的我想出了如何做到但没有使用来自Twisted pipe two processes with spawnProcess的管道方法,我从来没有开始工作。相反,我使用了一个ChainableProcessProtocol类,它将另一个ChainableProcessProtocol作为参数。这种方式可以将这些链接在一起,先前协议的输出写入下一个协议的stdin。当next_protocol为None时,此链接将停止。最终输出是最终协议的数据。这是我的例子:

#!/usr/bin/env python

from twisted.internet import protocol
from twisted.internet import reactor, defer
import re
import os
import sys
import json

def shutdown(x):
    print "Shutdown called"
    reactor.stop()

class ChainableProcessProtocol(protocol.ProcessProtocol):
    def __init__(self,cmd,cmdargs,input_data,next_protocol):
        self.cmd=cmd
        self.cmdargs=cmdargs
        self.input_data=input_data
        self.next_protocol=next_protocol
        self.data = ""

    def set_input_data(self,new_input_data):
        self.input_data=new_input_data

    def connectionMade(self):
        print "connectionMade in %s! Now writing to stdin of cat" % self.cmd
        print "   writing this data: %s" % self.input_data
        self.transport.write(self.input_data+'\n')
        print "   closing stdin"
        self.transport.closeStdin() # tell them we're done
        print "   stdin closed"

    def outReceived(self, data):
        print "outReceived from %s! with %d bytes!" % (self.cmd,len(data))
        self.data = self.data + data
        print "    received this: %s" % self.data

    def errReceived(self, data):
        print "errReceived from %s! with %d bytes!" % (self.cmd,len(data))

    def inConnectionLost(self):
        print "inConnectionLost for %s! stdin is closed! (we probably did it)" %(self.cmd,)

    def outConnectionLost(self):
        print "outConnectionLost for %s! The child closed their stdout!" %(self.cmd,)
        # now is the time to examine what they wrote
        print "I saw %s write this: %s" % (self.cmd,self.data)
        #
        # cmd is done, now write to next_protocol if set
        #
        if self.next_protocol:
            print "Calling chained protocol"
            self.next_protocol.set_input_data(self.data)
            npcmd=self.next_protocol.cmd
            npcmdargs=self.next_protocol.cmdargs
            print "npcmd is %s" % (npcmd,)
            print "npcmdargs is %s" % (json.dumps(npcmdargs),)
            reactor.spawnProcess(self.next_protocol, npcmd, npcmdargs, {})
        else:
            print "No chained protocol"

    def errConnectionLost(self):
        print "errConnectionLost for %s! The child closed their stderr." % (self.cmd,)

    def processExited(self, reason):
        print "processExited for %s, status %d" % (self.cmd,reason.value.exitCode,)

    def processEnded(self, reason):
        print "processEnded for %s, status %d" % (self.cmd,reason.value.exitCode,)

handle=open('junkin.txt','r')
in_txt=handle.read()
handle.close()

#
# Create the last protocol first because earlier protocol(s) need it
#
pp2 = ChainableProcessProtocol("wc",["wc","-w"],'',None)
#
# The first process takes an instance of the second process as an argument
#
pp1 = ChainableProcessProtocol("cat",["cat"],in_txt,pp2)
#
# before using spawnProcess, lets create a deferred to shut down the reactor in 2 seconds
# This should give us enough time. This is only so our test script does not run forever
#
d=defer.Deferred()
d.addCallback(shutdown)
reactor.callLater(2, d.callback, '')
#
# Now spawn the first process
#
reactor.spawnProcess(pp1, pp1.cmd, pp1.cmdargs, {})
reactor.run()
print "Final output is data in pp2: %s" % (pp2.data.strip(),)
print "Done!"