mirror of
https://github.com/openlibrecommunity/olcrtc.git
synced 2026-05-26 07:08:11 +00:00
- Add -ffmpeg flag for custom path - Allow FFMPEG_BIN env var to set path - Update ffmpeg
597 lines
14 KiB
Go
597 lines
14 KiB
Go
package videochannel
|
|
|
|
import (
|
|
"bytes"
|
|
"context"
|
|
"encoding/binary"
|
|
"errors"
|
|
"fmt"
|
|
"io"
|
|
"os"
|
|
"os/exec"
|
|
"strconv"
|
|
"strings"
|
|
"sync"
|
|
"sync/atomic"
|
|
"time"
|
|
|
|
"github.com/pion/rtp"
|
|
"github.com/pion/rtp/codecs"
|
|
"github.com/pion/webrtc/v4"
|
|
"github.com/pion/webrtc/v4/pkg/media/ivfreader"
|
|
)
|
|
|
|
const (
|
|
ffmpegFrameTimeout = 10 * time.Second
|
|
|
|
argCodecVideo = "-c:v"
|
|
argPixFmt = "-pix_fmt"
|
|
codecLibVPX = "libvpx"
|
|
pixFmtYUV420P = "yuv420p"
|
|
)
|
|
|
|
var (
|
|
// ErrFFmpegUnavailable is returned when ffmpeg is not available on PATH.
|
|
ErrFFmpegUnavailable = errors.New("ffmpeg is required for videochannel")
|
|
// ErrUnsupportedVideoCodec is returned when videochannel cannot decode the negotiated codec.
|
|
ErrUnsupportedVideoCodec = errors.New("unsupported video codec")
|
|
// ErrEncoderTimeout is returned when the encoder does not produce a frame within the deadline.
|
|
ErrEncoderTimeout = errors.New("encoder timeout")
|
|
// ErrPopFrameTimeout is returned when no decoded frame is available within the deadline.
|
|
ErrPopFrameTimeout = errors.New("pop frame timeout")
|
|
// ErrUnexpectedFrameSize is returned when the raw frame size does not match expectations.
|
|
ErrUnexpectedFrameSize = errors.New("unexpected encoder frame size")
|
|
)
|
|
|
|
// FFmpegPath defines the path to the ffmpeg executable.
|
|
var FFmpegPath = "ffmpeg"
|
|
|
|
type codecSpec struct {
|
|
mimeType string
|
|
fourCC string
|
|
encoder string
|
|
capability webrtc.RTPCodecCapability
|
|
depacketizer func() rtp.Depacketizer
|
|
encodeArgs []string
|
|
}
|
|
|
|
func codecSpecForCarrier(_ string) codecSpec {
|
|
return vp8CodecSpec()
|
|
}
|
|
|
|
func codecSpecForMime(mimeType string) (codecSpec, bool) {
|
|
switch strings.ToLower(mimeType) {
|
|
case strings.ToLower(webrtc.MimeTypeH264):
|
|
return h264CodecSpec(), true
|
|
case strings.ToLower(webrtc.MimeTypeVP9):
|
|
return vp9CodecSpec(), true
|
|
case strings.ToLower(webrtc.MimeTypeVP8):
|
|
return vp8CodecSpec(), true
|
|
default:
|
|
return codecSpec{}, false
|
|
}
|
|
}
|
|
|
|
func h264CodecSpec() codecSpec {
|
|
return codecSpec{
|
|
mimeType: webrtc.MimeTypeH264,
|
|
fourCC: "H264",
|
|
encoder: "libx264",
|
|
capability: webrtc.RTPCodecCapability{
|
|
MimeType: webrtc.MimeTypeH264,
|
|
ClockRate: 90000,
|
|
},
|
|
depacketizer: func() rtp.Depacketizer { return &codecs.H264Packet{} },
|
|
encodeArgs: []string{
|
|
argCodecVideo, "libx264",
|
|
"-preset", "ultrafast",
|
|
"-tune", "zerolatency",
|
|
"-g", "1",
|
|
argPixFmt, pixFmtYUV420P,
|
|
},
|
|
}
|
|
}
|
|
|
|
func vp9CodecSpec() codecSpec {
|
|
return codecSpec{
|
|
mimeType: webrtc.MimeTypeVP9,
|
|
fourCC: "VP90",
|
|
encoder: "libvpx-vp9",
|
|
capability: webrtc.RTPCodecCapability{
|
|
MimeType: webrtc.MimeTypeVP9,
|
|
ClockRate: 90000,
|
|
},
|
|
depacketizer: func() rtp.Depacketizer { return &codecs.VP9Packet{} },
|
|
encodeArgs: []string{
|
|
argCodecVideo, "libvpx-vp9",
|
|
"-deadline", "realtime",
|
|
"-cpu-used", "8",
|
|
"-error-resilient", "1",
|
|
"-static-thresh", "0",
|
|
"-g", "1",
|
|
argPixFmt, pixFmtYUV420P,
|
|
},
|
|
}
|
|
}
|
|
|
|
func vp8CodecSpec() codecSpec {
|
|
return codecSpec{
|
|
mimeType: webrtc.MimeTypeVP8,
|
|
fourCC: "VP80",
|
|
encoder: codecLibVPX,
|
|
capability: webrtc.RTPCodecCapability{
|
|
MimeType: webrtc.MimeTypeVP8,
|
|
ClockRate: 90000,
|
|
},
|
|
depacketizer: func() rtp.Depacketizer { return &codecs.VP8Packet{} },
|
|
encodeArgs: []string{
|
|
argCodecVideo, codecLibVPX,
|
|
"-deadline", "realtime",
|
|
"-cpu-used", "8",
|
|
"-error-resilient", "1",
|
|
"-static-thresh", "0",
|
|
"-g", "1",
|
|
argPixFmt, pixFmtYUV420P,
|
|
},
|
|
}
|
|
}
|
|
|
|
func resolveEncoderCodec(spec codecSpec, hw string) string {
|
|
if hw != "nvenc" {
|
|
return spec.encoder
|
|
}
|
|
switch spec.mimeType {
|
|
case webrtc.MimeTypeH264:
|
|
return "h264_nvenc"
|
|
case webrtc.MimeTypeVP8:
|
|
return "vp8_nvenc"
|
|
case webrtc.MimeTypeVP9:
|
|
return "vp9_nvenc"
|
|
case webrtc.MimeTypeAV1:
|
|
return "av1_nvenc"
|
|
default:
|
|
return spec.encoder
|
|
}
|
|
}
|
|
|
|
func buildEncoderArgs(spec codecSpec, vcodec string, width, height, fps int, bitrate string) []string {
|
|
args := []string{
|
|
"-loglevel", "error", "-threads", "1",
|
|
"-f", "rawvideo",
|
|
argPixFmt, "gray",
|
|
"-video_size", strconv.Itoa(width) + "x" + strconv.Itoa(height),
|
|
"-framerate", strconv.Itoa(fps),
|
|
"-i", "pipe:0",
|
|
"-an",
|
|
}
|
|
|
|
if strings.HasSuffix(vcodec, "_nvenc") {
|
|
args = append(args, argCodecVideo, vcodec, "-preset", "p1", "-tune", "ull", "-rc", "vbr")
|
|
} else {
|
|
args = append(args, spec.encodeArgs...)
|
|
}
|
|
|
|
args = append(args, "-g", "1", argPixFmt, pixFmtYUV420P, "-b:v", bitrate)
|
|
|
|
if spec.mimeType == webrtc.MimeTypeH264 {
|
|
return append(args, "-f", "h264", "pipe:1")
|
|
}
|
|
return append(args, "-f", "ivf", "pipe:1")
|
|
}
|
|
|
|
type ffmpegEncoder struct {
|
|
cmd *exec.Cmd
|
|
stdin io.WriteCloser
|
|
stderr *bytes.Buffer
|
|
frames chan []byte
|
|
width int
|
|
height int
|
|
frameSize int
|
|
closed atomic.Bool
|
|
closeOnce sync.Once
|
|
errMu sync.Mutex
|
|
err error
|
|
}
|
|
|
|
func newFFmpegEncoder(
|
|
ctx context.Context,
|
|
spec codecSpec,
|
|
width, height, fps int,
|
|
bitrate, hw string,
|
|
) (*ffmpegEncoder, error) {
|
|
ffmpegBin := FFmpegPath
|
|
if envBin := os.Getenv("FFMPEG_BIN"); envBin != "" {
|
|
ffmpegBin = envBin
|
|
}
|
|
|
|
if ffmpegBin == "ffmpeg" {
|
|
if _, err := exec.LookPath("ffmpeg"); err != nil {
|
|
return nil, ErrFFmpegUnavailable
|
|
}
|
|
} else {
|
|
if _, err := os.Stat(ffmpegBin); err != nil {
|
|
return nil, fmt.Errorf("%w: %v", ErrFFmpegUnavailable, err)
|
|
}
|
|
}
|
|
|
|
vcodec := resolveEncoderCodec(spec, hw)
|
|
args := buildEncoderArgs(spec, vcodec, width, height, fps, bitrate)
|
|
|
|
cmd := exec.CommandContext(ctx, ffmpegBin, args...) //nolint:gosec
|
|
stdin, err := cmd.StdinPipe()
|
|
if err != nil {
|
|
return nil, fmt.Errorf("encoder stdin: %w", err)
|
|
}
|
|
stdout, err := cmd.StdoutPipe()
|
|
if err != nil {
|
|
return nil, fmt.Errorf("encoder stdout: %w", err)
|
|
}
|
|
stderr := &bytes.Buffer{}
|
|
cmd.Stderr = stderr
|
|
|
|
if err := cmd.Start(); err != nil {
|
|
return nil, fmt.Errorf("start encoder: %w", err)
|
|
}
|
|
|
|
enc := &ffmpegEncoder{
|
|
cmd: cmd,
|
|
stdin: stdin,
|
|
stderr: stderr,
|
|
frames: make(chan []byte, 8),
|
|
width: width,
|
|
height: height,
|
|
frameSize: width * height,
|
|
}
|
|
|
|
if spec.mimeType == webrtc.MimeTypeH264 {
|
|
go enc.readRawH264(stdout)
|
|
} else {
|
|
go enc.readIVF(stdout)
|
|
}
|
|
return enc, nil
|
|
}
|
|
|
|
func (e *ffmpegEncoder) EncodeFrame(frame []byte) ([]byte, error) {
|
|
if len(frame) != e.frameSize {
|
|
return nil, fmt.Errorf("%w: got %d expected %d", ErrUnexpectedFrameSize, len(frame), e.frameSize)
|
|
}
|
|
if err := e.processErr(); err != nil {
|
|
return nil, err
|
|
}
|
|
if err := writeAll(e.stdin, frame); err != nil {
|
|
return nil, fmt.Errorf("write encoder frame: %w", err)
|
|
}
|
|
|
|
select {
|
|
case sample, ok := <-e.frames:
|
|
if !ok {
|
|
return nil, e.processErr()
|
|
}
|
|
return sample, nil
|
|
case <-time.After(ffmpegFrameTimeout):
|
|
if err := e.processErr(); err != nil {
|
|
return nil, err
|
|
}
|
|
return nil, ErrEncoderTimeout
|
|
}
|
|
}
|
|
|
|
func (e *ffmpegEncoder) Close() error {
|
|
e.closeOnce.Do(func() {
|
|
e.closed.Store(true)
|
|
_ = e.stdin.Close()
|
|
if e.cmd.Process != nil {
|
|
_ = e.cmd.Process.Kill()
|
|
}
|
|
_ = e.cmd.Wait()
|
|
})
|
|
return nil
|
|
}
|
|
|
|
func (e *ffmpegEncoder) readIVF(stdout io.Reader) {
|
|
defer close(e.frames)
|
|
reader, _, err := ivfreader.NewWith(stdout)
|
|
if err != nil {
|
|
e.setErr(fmt.Errorf("encoder ivf header: %w", err))
|
|
return
|
|
}
|
|
for {
|
|
frame, _, err := reader.ParseNextFrame()
|
|
if err != nil {
|
|
if !e.closed.Load() {
|
|
e.setErr(fmt.Errorf("encoder ivf read: %w", err))
|
|
}
|
|
return
|
|
}
|
|
copyFrame := append([]byte(nil), frame...)
|
|
if e.closed.Load() {
|
|
return
|
|
}
|
|
e.frames <- copyFrame
|
|
}
|
|
}
|
|
|
|
func (e *ffmpegEncoder) readRawH264(stdout io.Reader) {
|
|
defer close(e.frames)
|
|
buf := make([]byte, 1024*1024)
|
|
for {
|
|
n, err := stdout.Read(buf)
|
|
if err != nil {
|
|
if !e.closed.Load() {
|
|
e.setErr(fmt.Errorf("encoder h264 read: %w", err))
|
|
}
|
|
return
|
|
}
|
|
if n > 0 {
|
|
copyFrame := append([]byte(nil), buf[:n]...)
|
|
if e.closed.Load() {
|
|
return
|
|
}
|
|
e.frames <- copyFrame
|
|
}
|
|
}
|
|
}
|
|
|
|
func (e *ffmpegEncoder) setErr(err error) {
|
|
if err == nil {
|
|
return
|
|
}
|
|
e.errMu.Lock()
|
|
defer e.errMu.Unlock()
|
|
if e.err == nil {
|
|
e.err = withStderr(err, e.stderr)
|
|
}
|
|
}
|
|
|
|
func (e *ffmpegEncoder) processErr() error {
|
|
e.errMu.Lock()
|
|
defer e.errMu.Unlock()
|
|
if e.err != nil {
|
|
return e.err
|
|
}
|
|
if e.closed.Load() {
|
|
return ErrTransportClosed
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func resolveDecoderName(spec codecSpec, hw string) string {
|
|
if hw != "nvenc" {
|
|
return strings.ToLower(strings.TrimPrefix(spec.mimeType, "video/"))
|
|
}
|
|
switch spec.mimeType {
|
|
case webrtc.MimeTypeH264:
|
|
return "h264_cuvid"
|
|
case webrtc.MimeTypeVP8:
|
|
return "vp8_cuvid"
|
|
case webrtc.MimeTypeVP9:
|
|
return "vp9_cuvid"
|
|
default:
|
|
return strings.ToLower(strings.TrimPrefix(spec.mimeType, "video/"))
|
|
}
|
|
}
|
|
|
|
func buildDecoderArgs(spec codecSpec, decoderName string, width, height int, outputPixFmt string) []string {
|
|
args := []string{"-loglevel", "error", "-threads", "1"}
|
|
if spec.mimeType == webrtc.MimeTypeH264 {
|
|
args = append(args, "-f", "h264")
|
|
} else {
|
|
args = append(args, "-f", "ivf")
|
|
}
|
|
|
|
vfFilter := fmt.Sprintf("scale=%d:%d:flags=neighbor,format=%s", width, height, outputPixFmt)
|
|
return append(args,
|
|
"-flags", "low_delay",
|
|
"-vcodec", decoderName,
|
|
"-i", "pipe:0",
|
|
"-an",
|
|
"-vf", vfFilter,
|
|
argPixFmt, outputPixFmt,
|
|
"-f", "rawvideo",
|
|
"pipe:1",
|
|
)
|
|
}
|
|
|
|
type ffmpegDecoder struct {
|
|
cmd *exec.Cmd
|
|
stdin io.WriteCloser
|
|
stderr *bytes.Buffer
|
|
frames chan []byte
|
|
pts uint64
|
|
mimeType string
|
|
frameSize int
|
|
closed atomic.Bool
|
|
closeOnce sync.Once
|
|
errMu sync.Mutex
|
|
err error
|
|
}
|
|
|
|
func newFFmpegDecoder(
|
|
ctx context.Context,
|
|
spec codecSpec,
|
|
width, height, fps int,
|
|
hw string,
|
|
) (*ffmpegDecoder, error) {
|
|
ffmpegBin := FFmpegPath
|
|
if envBin := os.Getenv("FFMPEG_BIN"); envBin != "" {
|
|
ffmpegBin = envBin
|
|
}
|
|
|
|
if ffmpegBin == "ffmpeg" {
|
|
if _, err := exec.LookPath("ffmpeg"); err != nil {
|
|
return nil, ErrFFmpegUnavailable
|
|
}
|
|
} else {
|
|
if _, err := os.Stat(ffmpegBin); err != nil {
|
|
return nil, fmt.Errorf("%w: %v", ErrFFmpegUnavailable, err)
|
|
}
|
|
}
|
|
|
|
decoderName := resolveDecoderName(spec, hw)
|
|
args := buildDecoderArgs(spec, decoderName, width, height, "gray")
|
|
|
|
cmd := exec.CommandContext(ctx, ffmpegBin, args...) //nolint:gosec
|
|
stdin, err := cmd.StdinPipe()
|
|
if err != nil {
|
|
return nil, fmt.Errorf("decoder stdin: %w", err)
|
|
}
|
|
stdout, err := cmd.StdoutPipe()
|
|
if err != nil {
|
|
return nil, fmt.Errorf("decoder stdout: %w", err)
|
|
}
|
|
stderr := &bytes.Buffer{}
|
|
cmd.Stderr = stderr
|
|
|
|
if err := cmd.Start(); err != nil {
|
|
return nil, fmt.Errorf("start decoder: %w", err)
|
|
}
|
|
|
|
dec := &ffmpegDecoder{
|
|
cmd: cmd,
|
|
stdin: stdin,
|
|
stderr: stderr,
|
|
frames: make(chan []byte, 32),
|
|
mimeType: spec.mimeType,
|
|
frameSize: width * height,
|
|
}
|
|
|
|
if spec.mimeType != webrtc.MimeTypeH264 {
|
|
if err := writeIVFHeader(stdin, spec.fourCC, width, height, fps); err != nil {
|
|
_ = dec.Close()
|
|
return nil, fmt.Errorf("decoder ivf header: %w", err)
|
|
}
|
|
}
|
|
|
|
go dec.readRawFrames(stdout)
|
|
return dec, nil
|
|
}
|
|
|
|
func (d *ffmpegDecoder) PushSample(sample []byte) error {
|
|
if err := d.processErr(); err != nil {
|
|
return err
|
|
}
|
|
if d.mimeType == webrtc.MimeTypeH264 {
|
|
if err := writeAll(d.stdin, sample); err != nil {
|
|
return fmt.Errorf("write h264 decoder frame: %w", err)
|
|
}
|
|
} else {
|
|
if err := writeIVFFrame(d.stdin, d.pts, sample); err != nil {
|
|
return fmt.Errorf("write ivf decoder frame: %w", err)
|
|
}
|
|
d.pts++
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (d *ffmpegDecoder) PopFrame() ([]byte, error) {
|
|
select {
|
|
case frame, ok := <-d.frames:
|
|
if !ok {
|
|
return nil, d.processErr()
|
|
}
|
|
return frame, nil
|
|
case <-time.After(10 * time.Second):
|
|
return nil, ErrPopFrameTimeout
|
|
}
|
|
}
|
|
|
|
func (d *ffmpegDecoder) Close() error {
|
|
d.closeOnce.Do(func() {
|
|
d.closed.Store(true)
|
|
_ = d.stdin.Close()
|
|
if d.cmd.Process != nil {
|
|
_ = d.cmd.Process.Kill()
|
|
}
|
|
_ = d.cmd.Wait()
|
|
})
|
|
return nil
|
|
}
|
|
|
|
func (d *ffmpegDecoder) readRawFrames(stdout io.Reader) {
|
|
defer close(d.frames)
|
|
buf := make([]byte, d.frameSize)
|
|
for {
|
|
if _, err := io.ReadFull(stdout, buf); err != nil {
|
|
if !d.closed.Load() {
|
|
d.setErr(fmt.Errorf("decoder raw read: %w", err))
|
|
}
|
|
return
|
|
}
|
|
copyFrame := append([]byte(nil), buf...)
|
|
if d.closed.Load() {
|
|
return
|
|
}
|
|
d.frames <- copyFrame
|
|
}
|
|
}
|
|
|
|
func (d *ffmpegDecoder) setErr(err error) {
|
|
if err == nil {
|
|
return
|
|
}
|
|
d.errMu.Lock()
|
|
defer d.errMu.Unlock()
|
|
if d.err == nil {
|
|
d.err = withStderr(err, d.stderr)
|
|
}
|
|
}
|
|
|
|
func (d *ffmpegDecoder) processErr() error {
|
|
d.errMu.Lock()
|
|
defer d.errMu.Unlock()
|
|
if d.err != nil {
|
|
return d.err
|
|
}
|
|
if d.closed.Load() {
|
|
return ErrTransportClosed
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func withStderr(err error, stderr *bytes.Buffer) error {
|
|
if err == nil {
|
|
return nil
|
|
}
|
|
msg := strings.TrimSpace(stderr.String())
|
|
if msg == "" {
|
|
return err
|
|
}
|
|
return fmt.Errorf("%w: %s", err, msg)
|
|
}
|
|
|
|
func writeIVFHeader(w io.Writer, fourCC string, width, height, frameRate int) error {
|
|
header := make([]byte, 32)
|
|
copy(header[0:4], []byte("DKIF"))
|
|
binary.LittleEndian.PutUint16(header[4:6], 0)
|
|
binary.LittleEndian.PutUint16(header[6:8], 32)
|
|
copy(header[8:12], []byte(fourCC))
|
|
binary.LittleEndian.PutUint16(header[12:14], uint16(width)) //nolint:gosec
|
|
binary.LittleEndian.PutUint16(header[14:16], uint16(height)) //nolint:gosec
|
|
binary.LittleEndian.PutUint32(header[16:20], uint32(frameRate)) //nolint:gosec
|
|
binary.LittleEndian.PutUint32(header[20:24], 1)
|
|
binary.LittleEndian.PutUint32(header[24:28], 0)
|
|
binary.LittleEndian.PutUint32(header[28:32], 0)
|
|
return writeAll(w, header)
|
|
}
|
|
|
|
func writeIVFFrame(w io.Writer, pts uint64, frame []byte) error {
|
|
header := make([]byte, 12)
|
|
binary.LittleEndian.PutUint32(header[0:4], uint32(len(frame))) //nolint:gosec
|
|
binary.LittleEndian.PutUint64(header[4:12], pts)
|
|
if err := writeAll(w, header); err != nil {
|
|
return err
|
|
}
|
|
return writeAll(w, frame)
|
|
}
|
|
|
|
func writeAll(w io.Writer, data []byte) error {
|
|
for len(data) > 0 {
|
|
n, err := w.Write(data)
|
|
if err != nil {
|
|
return fmt.Errorf("write: %w", err)
|
|
}
|
|
data = data[n:]
|
|
}
|
|
return nil
|
|
}
|