カメラ（またはWebカメラ）からPythonでビデオ（およびオーディオ）をキャプチャする方法

Question

私はLinuxまたはWindowsのいずれかで、私にできる解決策を探しています

webカメラとマイクから同時にビデオ（+オーディオ）を記録します。
それをfile.AVI（またはmpgなど）として保存します。
録画中に画面にビデオを表示する

私の場合、圧縮は問題ではなく、実際にはRAWをキャプチャして後で圧縮することを好みます。

これまでのところ、すべてを処理するVBのActiveXコンポーネントを使用してそれを実行しました。python（VBソリューションで進めたいと思います不安定で、信頼できません）。

これまでのところ、ビデオのみ、または個々のフレームをキャプチャするコードを見てきました...

これまで見てきました

OpenCV-そこにオーディオキャプチャが見つかりませんでした
PyGame-同時音声キャプチャなし（AFAIK）
VideoCapture-単一フレームのみを提供します。
SimpleCV-音声なし
VLC-VideoLANプログラムをwxPthonにバインド-うまくいけば（まだこのオプションを調査中）
kivy-それについて聞いたばかりで、windows SO FARで動作させることができませんでした。

質問-Python用のビデオとオーディオのキャプチャライブラリはありますか？

または-他にどんなオプションがありますか？

JRodrigoF · Answer

回答：いいえ。ビデオ/オーディオの録音を同時に行うには、python=に単一のライブラリ/ソリューションはありません。両方を個別に実装し、オーディオとビデオの信号をスマートな方法でマージして、ビデオ/オーディオファイルで。

あなたが提示する問題の解決策を得ました。私のコードはあなたの3つの問題に対処します：

ウェブカメラとマイクから同時にビデオとオーディオを記録します。
最終的なビデオ/オーディオファイルを.AVIとして保存します
コメント行76、77、78のコメントを外すと、録画中にビデオが画面に表示されます。

私のソリューションでは、オーディオ録音にpyaudio、ビデオ録音にopencv、2つの信号の多重化にffmpegを使用しています。両方を同時に記録できるように、私はマルチスレッドを使用しています。 1つのスレッドはビデオを記録し、2番目のスレッドはオーディオを記録します。私は自分のコードをgithubにアップロードし、すべての重要な部分をここに含めました。

https://github.com/JRodrigoF/AVrecordeR

注：opencvは、ウェブカメラが記録を行うfpsを制御できません。ファイルのエンコーディングで目的の最終的なfpsを指定することしかできませんが、通常、Webカメラの動作は仕様と照明条件に応じて異なります（私が見つけました）。したがって、fpsはコードのレベルで制御する必要があります。

import cv2 import pyaudio import wave import threading import time import subprocess import os class VideoRecorder(): # Video class based on openCV def __init__(self): self.open = True self.device_index = 0 self.fps = 6 # fps should be the minimum constant rate at which the camera can self.fourcc = "MJPG" # capture images (with no decrease in speed over time; testing is required) self.frameSize = (640,480) # video formats and sizes also depend and vary according to the camera used self.video_filename = "temp_video.avi" self.video_cap = cv2.VideoCapture(self.device_index) self.video_writer = cv2.VideoWriter_fourcc(*self.fourcc) self.video_out = cv2.VideoWriter(self.video_filename, self.video_writer, self.fps, self.frameSize) self.frame_counts = 1 self.start_time = time.time() # Video starts being recorded def record(self): # counter = 1 timer_start = time.time() timer_current = 0 while(self.open==True): ret, video_frame = self.video_cap.read() if (ret==True): self.video_out.write(video_frame) # print str(counter) + " " + str(self.frame_counts) + " frames written " + str(timer_current) self.frame_counts += 1 # counter += 1 # timer_current = time.time() - timer_start time.sleep(0.16) # gray = cv2.cvtColor(video_frame, cv2.COLOR_BGR2GRAY) # cv2.imshow('video_frame', gray) # cv2.waitKey(1) else: break # 0.16 delay -> 6 fps # # Finishes the video recording therefore the thread too def stop(self): if self.open==True: self.open=False self.video_out.release() self.video_cap.release() cv2.destroyAllWindows() else: pass # Launches the video recording function using a thread def start(self): video_thread = threading.Thread(target=self.record) video_thread.start() class AudioRecorder(): # Audio class based on pyAudio and Wave def __init__(self): self.open = True self.rate = 44100 self.frames_per_buffer = 1024 self.channels = 2 self.format = pyaudio.Paint16 self.audio_filename = "temp_audio.wav" self.audio = pyaudio.PyAudio() self.stream = self.audio.open(format=self.format, channels=self.channels, rate=self.rate, input=True, frames_per_buffer = self.frames_per_buffer) self.audio_frames = [] # Audio starts being recorded def record(self): self.stream.start_stream() while(self.open == True): data = self.stream.read(self.frames_per_buffer) self.audio_frames.append(data) if self.open==False: break # Finishes the audio recording therefore the thread too def stop(self): if self.open==True: self.open = False self.stream.stop_stream() self.stream.close() self.audio.terminate() waveFile = wave.open(self.audio_filename, 'wb') waveFile.setnchannels(self.channels) waveFile.setsampwidth(self.audio.get_sample_size(self.format)) waveFile.setframerate(self.rate) waveFile.writeframes(b''.join(self.audio_frames)) waveFile.close() pass # Launches the audio recording function using a thread def start(self): audio_thread = threading.Thread(target=self.record) audio_thread.start() def start_AVrecording(filename): global video_thread global audio_thread video_thread = VideoRecorder() audio_thread = AudioRecorder() audio_thread.start() video_thread.start() return filename def start_video_recording(filename): global video_thread video_thread = VideoRecorder() video_thread.start() return filename def start_audio_recording(filename): global audio_thread audio_thread = AudioRecorder() audio_thread.start() return filename def stop_AVrecording(filename): audio_thread.stop() frame_counts = video_thread.frame_counts elapsed_time = time.time() - video_thread.start_time recorded_fps = frame_counts / elapsed_time print "total frames " + str(frame_counts) print "elapsed time " + str(elapsed_time) print "recorded fps " + str(recorded_fps) video_thread.stop() # Makes sure the threads have finished while threading.active_count() > 1: time.sleep(1) # Merging audio and video signal if abs(recorded_fps - 6) >= 0.01: # If the fps rate was higher/lower than expected, re-encode it to the expected print "Re-encoding" cmd = "ffmpeg -r " + str(recorded_fps) + " -i temp_video.avi -pix_fmt yuv420p -r 6 temp_video2.avi" subprocess.call(cmd, Shell=True) print "Muxing" cmd = "ffmpeg -ac 2 -channel_layout stereo -i temp_audio.wav -i temp_video2.avi -pix_fmt yuv420p " + filename + ".avi" subprocess.call(cmd, Shell=True) else: print "Normal recording
Muxing" cmd = "ffmpeg -ac 2 -channel_layout stereo -i temp_audio.wav -i temp_video.avi -pix_fmt yuv420p " + filename + ".avi" subprocess.call(cmd, Shell=True) print ".." # Required and wanted processing of final files def file_manager(filename): local_path = os.getcwd() if os.path.exists(str(local_path) + "/temp_audio.wav"): os.remove(str(local_path) + "/temp_audio.wav") if os.path.exists(str(local_path) + "/temp_video.avi"): os.remove(str(local_path) + "/temp_video.avi") if os.path.exists(str(local_path) + "/temp_video2.avi"): os.remove(str(local_path) + "/temp_video2.avi") if os.path.exists(str(local_path) + "/" + filename + ".avi"): os.remove(str(local_path) + "/" + filename + ".avi")

bunkus · Answer

上記の質問に対して：はい、コードはPython3でも動作するはずです。私はそれを少し調整してpython2とpython3で動作するようになりました（2.7と3.6のWindows7でテストしましたが、少なくとも同じディレクトリにffmpegがインストールされているか実行可能ファイルffmpeg.exeが必要ですが、ここから入手できます：- https://www.ffmpeg.org/download.html ）。もちろん、他のすべてのライブラリcv2、numpy、pyaudioも必要です。

pip install opencv-python numpy pyaudio

これで、コードを直接実行できます。

#!/usr/bin/env python # -*- coding: utf-8 -*- # VideoRecorder.py from __future__ import print_function, division import numpy as np import cv2 import pyaudio import wave import threading import time import subprocess import os class VideoRecorder(): "Video class based on openCV" def __init__(self, name="temp_video.avi", fourcc="MJPG", sizex=640, sizey=480, camindex=0, fps=30): self.open = True self.device_index = camindex self.fps = fps # fps should be the minimum constant rate at which the camera can self.fourcc = fourcc # capture images (with no decrease in speed over time; testing is required) self.frameSize = (sizex, sizey) # video formats and sizes also depend and vary according to the camera used self.video_filename = name self.video_cap = cv2.VideoCapture(self.device_index) self.video_writer = cv2.VideoWriter_fourcc(*self.fourcc) self.video_out = cv2.VideoWriter(self.video_filename, self.video_writer, self.fps, self.frameSize) self.frame_counts = 1 self.start_time = time.time() def record(self): "Video starts being recorded" # counter = 1 timer_start = time.time() timer_current = 0 while self.open: ret, video_frame = self.video_cap.read() if ret: self.video_out.write(video_frame) # print(str(counter) + " " + str(self.frame_counts) + " frames written " + str(timer_current)) self.frame_counts += 1 # counter += 1 # timer_current = time.time() - timer_start time.sleep(1/self.fps) # gray = cv2.cvtColor(video_frame, cv2.COLOR_BGR2GRAY) # cv2.imshow('video_frame', gray) # cv2.waitKey(1) else: break def stop(self): "Finishes the video recording therefore the thread too" if self.open: self.open=False self.video_out.release() self.video_cap.release() cv2.destroyAllWindows() def start(self): "Launches the video recording function using a thread" video_thread = threading.Thread(target=self.record) video_thread.start() class AudioRecorder(): "Audio class based on pyAudio and Wave" def __init__(self, filename="temp_audio.wav", rate=44100, fpb=1024, channels=2): self.open = True self.rate = rate self.frames_per_buffer = fpb self.channels = channels self.format = pyaudio.Paint16 self.audio_filename = filename self.audio = pyaudio.PyAudio() self.stream = self.audio.open(format=self.format, channels=self.channels, rate=self.rate, input=True, frames_per_buffer = self.frames_per_buffer) self.audio_frames = [] def record(self): "Audio starts being recorded" self.stream.start_stream() while self.open: data = self.stream.read(self.frames_per_buffer) self.audio_frames.append(data) if not self.open: break def stop(self): "Finishes the audio recording therefore the thread too" if self.open: self.open = False self.stream.stop_stream() self.stream.close() self.audio.terminate() waveFile = wave.open(self.audio_filename, 'wb') waveFile.setnchannels(self.channels) waveFile.setsampwidth(self.audio.get_sample_size(self.format)) waveFile.setframerate(self.rate) waveFile.writeframes(b''.join(self.audio_frames)) waveFile.close() def start(self): "Launches the audio recording function using a thread" audio_thread = threading.Thread(target=self.record) audio_thread.start() def start_AVrecording(filename="test"): global video_thread global audio_thread video_thread = VideoRecorder() audio_thread = AudioRecorder() audio_thread.start() video_thread.start() return filename def start_video_recording(filename="test"): global video_thread video_thread = VideoRecorder() video_thread.start() return filename def start_audio_recording(filename="test"): global audio_thread audio_thread = AudioRecorder() audio_thread.start() return filename def stop_AVrecording(filename="test"): audio_thread.stop() frame_counts = video_thread.frame_counts elapsed_time = time.time() - video_thread.start_time recorded_fps = frame_counts / elapsed_time print("total frames " + str(frame_counts)) print("elapsed time " + str(elapsed_time)) print("recorded fps " + str(recorded_fps)) video_thread.stop() # Makes sure the threads have finished while threading.active_count() > 1: time.sleep(1) # Merging audio and video signal if abs(recorded_fps - 6) >= 0.01: # If the fps rate was higher/lower than expected, re-encode it to the expected print("Re-encoding") cmd = "ffmpeg -r " + str(recorded_fps) + " -i temp_video.avi -pix_fmt yuv420p -r 6 temp_video2.avi" subprocess.call(cmd, Shell=True) print("Muxing") cmd = "ffmpeg -y -ac 2 -channel_layout stereo -i temp_audio.wav -i temp_video2.avi -pix_fmt yuv420p " + filename + ".avi" subprocess.call(cmd, Shell=True) else: print("Normal recording
Muxing") cmd = "ffmpeg -y -ac 2 -channel_layout stereo -i temp_audio.wav -i temp_video.avi -pix_fmt yuv420p " + filename + ".avi" subprocess.call(cmd, Shell=True) print("..") def file_manager(filename="test"): "Required and wanted processing of final files" local_path = os.getcwd() if os.path.exists(str(local_path) + "/temp_audio.wav"): os.remove(str(local_path) + "/temp_audio.wav") if os.path.exists(str(local_path) + "/temp_video.avi"): os.remove(str(local_path) + "/temp_video.avi") if os.path.exists(str(local_path) + "/temp_video2.avi"): os.remove(str(local_path) + "/temp_video2.avi") # if os.path.exists(str(local_path) + "/" + filename + ".avi"): # os.remove(str(local_path) + "/" + filename + ".avi") if __name__ == '__main__': start_AVrecording() time.sleep(5) stop_AVrecording() file_manager()

Tuim · Answer

私はffmpegをお勧めします。 pythonラッパーがあります。

http://code.google.com/p/pyffmpeg/

Kevin Hill · Answer

私はこれに対する良い答えを探していました、そしてそれは GStreamer ...だと思います.

pythonバインディングのドキュメントは非常に軽量であり、そのほとんどは新しい1.Xバージョンではなく古い0.10バージョンのGStreamerを中心としたものでしたが、GStreamerは非常に強力なクロスほぼ何でもストリーミング、マルチプレクサ、トランスコード、表示できるプラットフォームマルチメディアフレームワーク。