如何使用Python和PyObjC捕获Apple iSight的帧?

11
我正在尝试使用Python(版本2.7或2.6)和PyObjC(版本2.2)从内置在Macbook Pro中的Apple iSight相机中捕获单个帧。作为起点,我使用了这个旧的StackOverflow问题。为了验证它是否有意义,我交叉参考了苹果的MyRecorder示例,看起来它是基于此构建的。不幸的是,我的脚本无法正常工作。我的主要问题是:
  • 我是否正确初始化了相机?
  • 我是否正确启动了事件循环?
  • 是否还有其他设置我应该做?
在下面粘贴的示例脚本中,预期操作是在调用startImageCapture()后,我应该从CaptureDelegate开始打印“Got a frame…”消息。然而,相机的灯从未亮起,委托的回调也从未执行。此外,在startImageCapture()期间没有失败,所有函数都声称成功,并且它成功找到了iSight设备。在pdb中分析会话对象显示它具有有效的输入和输出对象,输出对象已分配委托,设备未被其他进程使用,并且在调用startRunning()后会话标记为运行状态。以下是代码:
#!/usr/bin/env python2.7

import sys
import os
import time
import objc
import QTKit
import AppKit
from Foundation import NSObject
from Foundation import NSTimer
from PyObjCTools import AppHelper
objc.setVerbose(True)

class CaptureDelegate(NSObject):
    def captureOutput_didOutputVideoFrame_withSampleBuffer_fromConnection_(self, captureOutput, 
                                                                           videoFrame, sampleBuffer, 
                                                                           connection):
        # This should get called for every captured frame
        print "Got a frame: %s" % videoFrame

class QuitClass(NSObject):
    def quitMainLoop_(self, aTimer):
        # Just stop the main loop.
        print "Quitting main loop."
        AppHelper.stopEventLoop()


def startImageCapture():
    error = None

    # Create a QT Capture session
    session = QTKit.QTCaptureSession.alloc().init()

    # Find iSight device and open it
    dev = QTKit.QTCaptureDevice.defaultInputDeviceWithMediaType_(QTKit.QTMediaTypeVideo)
    print "Device: %s" % dev
    if not dev.open_(error):
        print "Couldn't open capture device."
        return

    # Create an input instance with the device we found and add to session
    input = QTKit.QTCaptureDeviceInput.alloc().initWithDevice_(dev)
    if not session.addInput_error_(input, error):
        print "Couldn't add input device."
        return

    # Create an output instance with a delegate for callbacks and add to session
    output = QTKit.QTCaptureDecompressedVideoOutput.alloc().init()
    delegate = CaptureDelegate.alloc().init()
    output.setDelegate_(delegate)
    if not session.addOutput_error_(output, error):
        print "Failed to add output delegate."
        return

    # Start the capture
    print "Initiating capture..."
    session.startRunning()


def main():
    # Open camera and start capturing frames
    startImageCapture()

    # Setup a timer to quit in 10 seconds (hack for now)
    quitInst = QuitClass.alloc().init()
    NSTimer.scheduledTimerWithTimeInterval_target_selector_userInfo_repeats_(10.0, 
                                                                             quitInst, 
                                                                             'quitMainLoop:', 
                                                                             None, 
                                                                             False)
    # Start Cocoa's main event loop
    AppHelper.runConsoleEventLoop(installInterrupt=True)

    print "After event loop"


if __name__ == "__main__":
    main()

感谢您能提供的任何帮助!
2个回答

15

好的,我花了一天时间深入研究PyObjC并让它正常工作。

为了记录,问题中的代码无法正常工作的原因是变量作用域和垃圾回收。当session变量超出作用域时被删除,而这发生在事件处理器运行之前。必须采取措施来保留它,以便在运行之前不被释放。

将所有内容移动到一个类中,并使session成为一个类变量即可使回调开始工作。此外,下面的代码演示了如何通过Cocoa调用将帧的像素数据转换为位图格式并保存,以及如何将其复制回Python的视图中作为缓冲区或字符串。

下面的脚本将捕获单个帧。

#!/usr/bin/env python2.7
#
# camera.py -- by Trevor Bentley (02/04/2011)
# 
# This work is licensed under a Creative Commons Attribution 3.0 Unported License.
#
# Run from the command line on an Apple laptop running OS X 10.6, this script will
# take a single frame capture using the built-in iSight camera and save it to disk
# using three methods.
#

import sys
import os
import time
import objc
import QTKit
from AppKit import *
from Foundation import NSObject
from Foundation import NSTimer
from PyObjCTools import AppHelper

class NSImageTest(NSObject):
    def init(self):
        self = super(NSImageTest, self).init()
        if self is None:
            return None

        self.session = None
        self.running = True

        return self

    def captureOutput_didOutputVideoFrame_withSampleBuffer_fromConnection_(self, captureOutput, 
                                                                           videoFrame, sampleBuffer, 
                                                                           connection):
        self.session.stopRunning() # I just want one frame

        # Get a bitmap representation of the frame using CoreImage and Cocoa calls
        ciimage = CIImage.imageWithCVImageBuffer_(videoFrame)
        rep = NSCIImageRep.imageRepWithCIImage_(ciimage)
        bitrep = NSBitmapImageRep.alloc().initWithCIImage_(ciimage)
        bitdata = bitrep.representationUsingType_properties_(NSBMPFileType, objc.NULL)

        # Save image to disk using Cocoa
        t0 = time.time()
        bitdata.writeToFile_atomically_("grab.bmp", False)
        t1 = time.time()
        print "Cocoa saved in %.5f seconds" % (t1-t0)

        # Save a read-only buffer of image to disk using Python
        t0 = time.time()
        bitbuf = bitdata.bytes()
        f = open("python.bmp", "w")
        f.write(bitbuf)
        f.close()
        t1 = time.time()
        print "Python saved buffer in %.5f seconds" % (t1-t0)

        # Save a string-copy of the buffer to disk using Python
        t0 = time.time()
        bitbufstr = str(bitbuf)
        f = open("python2.bmp", "w")
        f.write(bitbufstr)
        f.close()
        t1 = time.time()
        print "Python saved string in %.5f seconds" % (t1-t0)

        # Will exit on next execution of quitMainLoop_()
        self.running = False

    def quitMainLoop_(self, aTimer):
        # Stop the main loop after one frame is captured.  Call rapidly from timer.
        if not self.running:
            AppHelper.stopEventLoop()

    def startImageCapture(self, aTimer):
        error = None
        print "Finding camera"

        # Create a QT Capture session
        self.session = QTKit.QTCaptureSession.alloc().init()

        # Find iSight device and open it
        dev = QTKit.QTCaptureDevice.defaultInputDeviceWithMediaType_(QTKit.QTMediaTypeVideo)
        print "Device: %s" % dev
        if not dev.open_(error):
            print "Couldn't open capture device."
            return

        # Create an input instance with the device we found and add to session
        input = QTKit.QTCaptureDeviceInput.alloc().initWithDevice_(dev)
        if not self.session.addInput_error_(input, error):
            print "Couldn't add input device."
            return

        # Create an output instance with a delegate for callbacks and add to session
        output = QTKit.QTCaptureDecompressedVideoOutput.alloc().init()
        output.setDelegate_(self)
        if not self.session.addOutput_error_(output, error):
            print "Failed to add output delegate."
            return

        # Start the capture
        print "Initiating capture..."
        self.session.startRunning()


    def main(self):
        # Callback that quits after a frame is captured
        NSTimer.scheduledTimerWithTimeInterval_target_selector_userInfo_repeats_(0.1, 
                                                                                 self, 
                                                                                 'quitMainLoop:', 
                                                                                 None, 
                                                                                 True)

        # Turn on the camera and start the capture
        self.startImageCapture(None)

        # Start Cocoa's main event loop
        AppHelper.runConsoleEventLoop(installInterrupt=True)

        print "Frame capture completed."

if __name__ == "__main__":
    test = NSImageTest.alloc().init()
    test.main()

这个脚本运行得很好,但在写入字节文件时失败了。你应该将 open('filename', 'w') 更改为 open('filename', 'wb') 以打开一个字节模式的文件,然后它就可以工作了。 - andli

0

QTKit已被弃用,PyObjC是一个巨大的依赖项(如果您想在HomeBrew中使用它,则似乎很棘手)。此外,PyObjC没有大部分AVFoundation,因此我创建了Python的简单相机扩展,它使用AVFoundation来记录视频或拍照片,不需要任何依赖项(Cython中间文件已提交以避免大多数用户需要Cython)。

应该可以像这样构建它:

pip install -e git+https://github.com/dashesy/pyavfcam.git

然后我们可以使用它来拍照

import pyavfcam

# Open the default video source
cam = pyavfcam.AVFCam(sinks='image')
frame = cam.snap_picture('test.jpg')  # frame is a memory buffer np.asarray(frame) can retrieve

与这个问题无关,但如果AVFCam类被子类化,则覆盖的方法将使用结果调用。


pip 安装失败: ``pip install -e git+https://github.com/dashesy/pyavfcam.git--editable=git+https://github.com/dashesy/pyavfcam.git 不是正确的格式; 必须有 #egg=Package。`` - DanHickstein

网页内容由stack overflow 提供, 点击上面的
可以查看英文原文,
原文链接