mirror of
https://github.com/Genymobile/scrcpy.git
synced 2026-04-21 01:33:36 +00:00
The new chlayout API has been introduced in FFmpeg 5.1. Use the old channel_layout API on older versions.
304 lines
9.5 KiB
C
304 lines
9.5 KiB
C
#include "audio_player.h"
|
|
|
|
#include <libavutil/opt.h>
|
|
|
|
#include "util/log.h"
|
|
|
|
#define SC_AUDIO_PLAYER_NDEBUG // comment to debug
|
|
|
|
/** Downcast frame_sink to sc_audio_player */
|
|
#define DOWNCAST(SINK) container_of(SINK, struct sc_audio_player, frame_sink)
|
|
|
|
#define SC_AV_SAMPLE_FMT AV_SAMPLE_FMT_FLT
|
|
#define SC_SDL_SAMPLE_FMT AUDIO_F32
|
|
|
|
#define SC_AUDIO_OUTPUT_BUFFER_SAMPLES 480 // 10ms at 48000Hz
|
|
|
|
// The target number of buffered samples between the producer and the consumer.
|
|
// This value is directly use for compensation.
|
|
#define SC_TARGET_BUFFERED_SAMPLES (3 * SC_AUDIO_OUTPUT_BUFFER_SAMPLES)
|
|
|
|
// If the consumer is too late, skip samples to keep at most this value
|
|
#define SC_BUFFERED_SAMPLES_THRESHOLD 2400 // 50ms at 48000Hz
|
|
|
|
// Use a ring-buffer of 1 second (at 48000Hz) between the producer and the
|
|
// consumer. It too big, but it guarantees that the producer and the consumer
|
|
// will be able to access it in parallel without locking.
|
|
#define SC_BYTEBUF_SIZE_IN_SAMPLES 48000
|
|
|
|
void
|
|
sc_audio_player_sdl_callback(void *userdata, uint8_t *stream, int len_int) {
|
|
struct sc_audio_player *ap = userdata;
|
|
|
|
// This callback is called with the lock used by SDL_AudioDeviceLock(), so
|
|
// the bytebuf is protected
|
|
|
|
assert(len_int > 0);
|
|
size_t len = len_int;
|
|
|
|
#ifndef SC_AUDIO_PLAYER_NDEBUG
|
|
LOGD("[Audio] SDL callback requests %" SC_PRIsizet " samples",
|
|
len / (ap->nb_channels * ap->out_bytes_per_sample));
|
|
#endif
|
|
|
|
size_t read = sc_bytebuf_read_remaining(&ap->buf);
|
|
size_t max_buffered_bytes = SC_BUFFERED_SAMPLES_THRESHOLD
|
|
* ap->nb_channels * ap->out_bytes_per_sample;
|
|
if (read > max_buffered_bytes + len) {
|
|
size_t skip = read - (max_buffered_bytes + len);
|
|
#ifndef SC_AUDIO_PLAYER_NDEBUG
|
|
LOGD("[Audio] Buffered samples threshold exceeded: %" SC_PRIsizet
|
|
" bytes, skipping %" SC_PRIsizet " bytes", read, skip);
|
|
#endif
|
|
// After this callback, exactly max_buffered_bytes will remain
|
|
sc_bytebuf_skip(&ap->buf, skip);
|
|
read = max_buffered_bytes + len;
|
|
}
|
|
|
|
// Number of buffered samples (may be negative on underflow)
|
|
float buffered_samples = ((float) read - len_int)
|
|
/ (ap->nb_channels * ap->out_bytes_per_sample);
|
|
sc_average_push(&ap->avg_buffered_samples, buffered_samples);
|
|
|
|
if (read) {
|
|
if (read > len) {
|
|
read = len;
|
|
}
|
|
sc_bytebuf_read(&ap->buf, stream, read);
|
|
}
|
|
|
|
if (read < len) {
|
|
// Insert silence
|
|
#ifndef SC_AUDIO_PLAYER_NDEBUG
|
|
LOGD("[Audio] Buffer underflow, inserting silence: %" SC_PRIsizet
|
|
" bytes", len - read);
|
|
#endif
|
|
memset(stream + read, 0, len - read);
|
|
}
|
|
}
|
|
|
|
static size_t
|
|
sc_audio_player_get_buf_size(struct sc_audio_player *ap, size_t samples) {
|
|
assert(ap->nb_channels);
|
|
assert(ap->out_bytes_per_sample);
|
|
return samples * ap->nb_channels * ap->out_bytes_per_sample;
|
|
}
|
|
|
|
static uint8_t *
|
|
sc_audio_player_get_swr_buf(struct sc_audio_player *ap, size_t min_samples) {
|
|
size_t min_buf_size = sc_audio_player_get_buf_size(ap, min_samples);
|
|
if (min_buf_size < ap->swr_buf_alloc_size) {
|
|
size_t new_size = min_buf_size + 4096;
|
|
uint8_t *buf = realloc(ap->swr_buf, new_size);
|
|
if (!buf) {
|
|
LOG_OOM();
|
|
// Could not realloc to the requested size
|
|
return NULL;
|
|
}
|
|
ap->swr_buf = buf;
|
|
ap->swr_buf_alloc_size = new_size;
|
|
}
|
|
|
|
return ap->swr_buf;
|
|
}
|
|
|
|
static bool
|
|
sc_audio_player_frame_sink_open(struct sc_frame_sink *sink,
|
|
const AVCodecContext *ctx) {
|
|
struct sc_audio_player *ap = DOWNCAST(sink);
|
|
#ifdef SCRCPY_LAVU_HAS_CHLAYOUT
|
|
assert(ctx->ch_layout.nb_channels > 0);
|
|
unsigned nb_channels = ctx->ch_layout.nb_channels;
|
|
#else
|
|
int tmp = av_get_channel_layout_nb_channels(ctx->channel_layout);
|
|
assert(tmp > 0);
|
|
unsigned nb_channels = tmp;
|
|
#endif
|
|
|
|
SDL_AudioSpec desired = {
|
|
.freq = ctx->sample_rate,
|
|
.format = SC_SDL_SAMPLE_FMT,
|
|
.channels = nb_channels,
|
|
.samples = SC_AUDIO_OUTPUT_BUFFER_SAMPLES,
|
|
.callback = sc_audio_player_sdl_callback,
|
|
.userdata = ap,
|
|
};
|
|
SDL_AudioSpec obtained;
|
|
|
|
ap->device = SDL_OpenAudioDevice(NULL, 0, &desired, &obtained, 0);
|
|
if (!ap->device) {
|
|
LOGE("Could not open audio device: %s", SDL_GetError());
|
|
return false;
|
|
}
|
|
|
|
SwrContext *swr_ctx = swr_alloc();
|
|
if (!swr_ctx) {
|
|
LOG_OOM();
|
|
goto error_close_audio_device;
|
|
}
|
|
ap->swr_ctx = swr_ctx;
|
|
|
|
assert(ctx->sample_rate > 0);
|
|
assert(!av_sample_fmt_is_planar(SC_AV_SAMPLE_FMT));
|
|
|
|
int out_bytes_per_sample = av_get_bytes_per_sample(SC_AV_SAMPLE_FMT);
|
|
assert(out_bytes_per_sample > 0);
|
|
|
|
#ifdef SCRCPY_LAVU_HAS_CHLAYOUT
|
|
av_opt_set_chlayout(swr_ctx, "in_chlayout", &ctx->ch_layout, 0);
|
|
av_opt_set_chlayout(swr_ctx, "out_chlayout", &ctx->ch_layout, 0);
|
|
#else
|
|
av_opt_set_channel_layout(swr_ctx, "in_channel_layout",
|
|
ctx->channel_layout, 0);
|
|
av_opt_set_channel_layout(swr_ctx, "out_channel_layout",
|
|
ctx->channel_layout, 0);
|
|
#endif
|
|
|
|
av_opt_set_int(swr_ctx, "in_sample_rate", ctx->sample_rate, 0);
|
|
av_opt_set_int(swr_ctx, "out_sample_rate", ctx->sample_rate, 0);
|
|
|
|
av_opt_set_sample_fmt(swr_ctx, "in_sample_fmt", ctx->sample_fmt, 0);
|
|
av_opt_set_sample_fmt(swr_ctx, "out_sample_fmt", SC_AV_SAMPLE_FMT, 0);
|
|
|
|
int ret = swr_init(swr_ctx);
|
|
if (ret) {
|
|
LOGE("Failed to initialize the resampling context");
|
|
goto error_free_swr_ctx;
|
|
}
|
|
|
|
ap->sample_rate = ctx->sample_rate;
|
|
ap->nb_channels = nb_channels;
|
|
ap->out_bytes_per_sample = out_bytes_per_sample;
|
|
|
|
size_t bytebuf_size =
|
|
sc_audio_player_get_buf_size(ap, SC_BYTEBUF_SIZE_IN_SAMPLES);
|
|
|
|
bool ok = sc_bytebuf_init(&ap->buf, bytebuf_size);
|
|
if (!ok) {
|
|
goto error_free_swr_ctx;
|
|
}
|
|
|
|
ap->safe_empty_buffer = sc_bytebuf_write_remaining(&ap->buf);
|
|
|
|
size_t initial_swr_buf_size = sc_audio_player_get_buf_size(ap, 4096);
|
|
ap->swr_buf = malloc(initial_swr_buf_size);
|
|
if (!ap->swr_buf) {
|
|
LOG_OOM();
|
|
goto error_destroy_bytebuf;
|
|
}
|
|
ap->swr_buf_alloc_size = initial_swr_buf_size;
|
|
|
|
sc_average_init(&ap->avg_buffered_samples, 32);
|
|
ap->samples_since_resync = 0;
|
|
|
|
SDL_PauseAudioDevice(ap->device, 0);
|
|
|
|
return true;
|
|
|
|
error_destroy_bytebuf:
|
|
sc_bytebuf_destroy(&ap->buf);
|
|
error_free_swr_ctx:
|
|
swr_free(&ap->swr_ctx);
|
|
error_close_audio_device:
|
|
SDL_CloseAudioDevice(ap->device);
|
|
|
|
return false;
|
|
}
|
|
|
|
static void
|
|
sc_audio_player_frame_sink_close(struct sc_frame_sink *sink) {
|
|
struct sc_audio_player *ap = DOWNCAST(sink);
|
|
|
|
assert(ap->device);
|
|
SDL_PauseAudioDevice(ap->device, 1);
|
|
SDL_CloseAudioDevice(ap->device);
|
|
|
|
free(ap->swr_buf);
|
|
sc_bytebuf_destroy(&ap->buf);
|
|
swr_free(&ap->swr_ctx);
|
|
}
|
|
|
|
static bool
|
|
sc_audio_player_frame_sink_push(struct sc_frame_sink *sink, const AVFrame *frame) {
|
|
struct sc_audio_player *ap = DOWNCAST(sink);
|
|
|
|
SwrContext *swr_ctx = ap->swr_ctx;
|
|
|
|
int64_t delay = swr_get_delay(swr_ctx, ap->sample_rate);
|
|
// No need to av_rescale_rnd(), input and output sample rates are the same
|
|
int dst_nb_samples = delay + frame->nb_samples;
|
|
|
|
uint8_t *swr_buf = sc_audio_player_get_swr_buf(ap, frame->nb_samples);
|
|
if (!swr_buf) {
|
|
return false;
|
|
}
|
|
|
|
int ret = swr_convert(swr_ctx, &swr_buf, dst_nb_samples,
|
|
(const uint8_t **) frame->data, frame->nb_samples);
|
|
if (ret < 0) {
|
|
LOGE("Resampling failed: %d", ret);
|
|
return false;
|
|
}
|
|
|
|
size_t samples_written = ret;
|
|
size_t swr_buf_size = sc_audio_player_get_buf_size(ap, samples_written);
|
|
#ifndef SC_AUDIO_PLAYER_NDEBUG
|
|
LOGI("[Audio] %" SC_PRIsizet " samples written to buffer", samples_written);
|
|
#endif
|
|
|
|
// It should almost always be possible to write without lock
|
|
bool can_write_without_lock = swr_buf_size <= ap->safe_empty_buffer;
|
|
if (can_write_without_lock) {
|
|
sc_bytebuf_prepare_write(&ap->buf, swr_buf, swr_buf_size);
|
|
}
|
|
|
|
SDL_LockAudioDevice(ap->device);
|
|
if (can_write_without_lock) {
|
|
sc_bytebuf_commit_write(&ap->buf, swr_buf_size);
|
|
} else {
|
|
sc_bytebuf_write(&ap->buf, swr_buf, swr_buf_size);
|
|
}
|
|
|
|
// The next time, it will remain at least the current empty space
|
|
ap->safe_empty_buffer = sc_bytebuf_write_remaining(&ap->buf);
|
|
|
|
// Read the value written by the SDL thread under lock
|
|
float avg;
|
|
bool has_avg = sc_average_get(&ap->avg_buffered_samples, &avg);
|
|
|
|
SDL_UnlockAudioDevice(ap->device);
|
|
|
|
if (has_avg) {
|
|
ap->samples_since_resync += samples_written;
|
|
if (ap->samples_since_resync >= ap->sample_rate) {
|
|
// Resync every second
|
|
ap->samples_since_resync = 0;
|
|
|
|
int diff = SC_TARGET_BUFFERED_SAMPLES - avg;
|
|
#ifndef SC_AUDIO_PLAYER_NDEBUG
|
|
LOGI("[Audio] Average buffered samples = %f, compensation %d",
|
|
avg, diff);
|
|
#endif
|
|
// Compensate the diff over 3 seconds (but will be recomputed after
|
|
// 1 second)
|
|
int ret = swr_set_compensation(swr_ctx, diff, 3 * ap->sample_rate);
|
|
if (ret < 0) {
|
|
LOGW("Resampling compensation failed: %d", ret);
|
|
// not fatal
|
|
}
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
void
|
|
sc_audio_player_init(struct sc_audio_player *ap) {
|
|
static const struct sc_frame_sink_ops ops = {
|
|
.open = sc_audio_player_frame_sink_open,
|
|
.close = sc_audio_player_frame_sink_close,
|
|
.push = sc_audio_player_frame_sink_push,
|
|
};
|
|
|
|
ap->frame_sink.ops = &ops;
|
|
}
|