/* Copyright (c) 2012 The Chromium OS Authors. All rights reserved. * Use of this source code is governed by a BSD-style license that can be * found in the LICENSE file. */ /* For now just use speex, can add more resamplers later. */ #include <speex/speex_resampler.h> #include <sys/param.h> #include <syslog.h> #include "cras_fmt_conv.h" #include "cras_audio_format.h" #include "cras_util.h" #include "linear_resampler.h" /* The quality level is a value between 0 and 10. This is a tradeoff between * performance, latency, and quality. */ #define SPEEX_QUALITY_LEVEL 4 /* Max number of converters, src, down/up mix, 2xformat, and linear resample. */ #define MAX_NUM_CONVERTERS 5 /* Channel index for stereo. */ #define STEREO_L 0 #define STEREO_R 1 typedef void (*sample_format_converter_t)(const uint8_t *in, size_t in_samples, uint8_t *out); typedef size_t (*channel_converter_t)(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out); /* Member data for the resampler. */ struct cras_fmt_conv { SpeexResamplerState *speex_state; channel_converter_t channel_converter; float **ch_conv_mtx; /* Coefficient matrix for mixing channels. */ sample_format_converter_t in_format_converter; sample_format_converter_t out_format_converter; struct linear_resampler *resampler; struct cras_audio_format in_fmt; struct cras_audio_format out_fmt; uint8_t *tmp_bufs[MAX_NUM_CONVERTERS - 1]; size_t tmp_buf_frames; size_t pre_linear_resample; size_t num_converters; /* Incremented once for SRC, channel, format. */ }; /* Add and clip two s16 samples. */ static int16_t s16_add_and_clip(int16_t a, int16_t b) { int32_t sum; sum = a + b; sum = MAX(sum, -0x8000); sum = MIN(sum, 0x7fff); return (int16_t)sum; } /* * Convert between different sample formats. */ /* Converts from U8 to S16. */ static void convert_u8_to_s16le(const uint8_t *in, size_t in_samples, uint8_t *out) { size_t i; uint16_t *_out = (uint16_t *)out; for (i = 0; i < in_samples; i++, in++, _out++) *_out = (uint16_t)((int16_t)*in - 0x80) << 8; } /* Converts from S24 to S16. */ static void convert_s24le_to_s16le(const uint8_t *in, size_t in_samples, uint8_t *out) { size_t i; int32_t *_in = (int32_t *)in; uint16_t *_out = (uint16_t *)out; for (i = 0; i < in_samples; i++, _in++, _out++) *_out = (int16_t)((*_in & 0x00ffffff) >> 8); } /* Converts from S32 to S16. */ static void convert_s32le_to_s16le(const uint8_t *in, size_t in_samples, uint8_t *out) { size_t i; int32_t *_in = (int32_t *)in; uint16_t *_out = (uint16_t *)out; for (i = 0; i < in_samples; i++, _in++, _out++) *_out = (int16_t)(*_in >> 16); } /* Converts from S24_3LE to S16. */ static void convert_s243le_to_s16le(const uint8_t *in, size_t in_samples, uint8_t *out) { /* find how to calculate in and out size, implement the conversion * between S24_3LE and S16 */ size_t i; int8_t *_in = (int8_t *)in; uint16_t *_out = (uint16_t *)out; for (i = 0; i < in_samples; i++, _in += 3, _out++) memcpy(_out, _in + 1, 2); } /* Converts from S16 to U8. */ static void convert_s16le_to_u8(const uint8_t *in, size_t in_samples, uint8_t *out) { size_t i; int16_t *_in = (int16_t *)in; for (i = 0; i < in_samples; i++, _in++, out++) *out = (uint8_t)(*_in >> 8) + 128; } /* Converts from S16 to S24. */ static void convert_s16le_to_s24le(const uint8_t *in, size_t in_samples, uint8_t *out) { size_t i; int16_t *_in = (int16_t *)in; uint32_t *_out = (uint32_t *)out; for (i = 0; i < in_samples; i++, _in++, _out++) *_out = ((uint32_t)(int32_t)*_in << 8); } /* Converts from S16 to S32. */ static void convert_s16le_to_s32le(const uint8_t *in, size_t in_samples, uint8_t *out) { size_t i; int16_t *_in = (int16_t *)in; uint32_t *_out = (uint32_t *)out; for (i = 0; i < in_samples; i++, _in++, _out++) *_out = ((uint32_t)(int32_t)*_in << 16); } /* Converts from S16 to S24_3LE. */ static void convert_s16le_to_s243le(const uint8_t *in, size_t in_samples, uint8_t *out) { size_t i; int16_t *_in = (int16_t *)in; uint8_t *_out = (uint8_t *)out; for (i = 0; i < in_samples; i++, _in++, _out += 3) { *_out = 0; memcpy(_out + 1, _in, 2); } } /* * Convert between different channel numbers. */ /* Converts S16 mono to S16 stereo. The out buffer must be double the size of * the input buffer. */ static size_t s16_mono_to_stereo(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { size_t i; for (i = 0; i < in_frames; i++) { out[2 * i] = in[i]; out[2 * i + 1] = in[i]; } return in_frames; } /* Converts S16 Stereo to S16 mono. The output buffer only need be big enough * for mono samples. */ static size_t s16_stereo_to_mono(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { size_t i; for (i = 0; i < in_frames; i++) out[i] = s16_add_and_clip(in[2 * i], in[2 * i + 1]); return in_frames; } /* Converts S16 mono to 5.1 surround. Fit mono to front center of the * output, or split to front left/right if front center is missing * from the output channel layout. */ static size_t s16_mono_to_51(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { size_t i, left, right, center; memset(out, 0, sizeof(*out) * 6 * in_frames); left = conv->out_fmt.channel_layout[CRAS_CH_FL]; right = conv->out_fmt.channel_layout[CRAS_CH_FR]; center = conv->out_fmt.channel_layout[CRAS_CH_FC]; if (center != -1) for (i = 0; i < in_frames; i++) out[6 * i + center] = in[i]; else if (left != -1 && right != -1) for (i = 0; i < in_frames; i++) { out[6 * i + right] = in[i] / 2; out[6 * 1 + left] = in[i] / 2; } else /* Select the first channel to convert to as the * default behavior. */ for (i = 0; i < in_frames; i++) out[6 * i] = in[i]; return in_frames; } /* Converts S16 stereo to 5.1 surround. Fit the left/right of input * to the front left/right of output respectively and fill others * with zero. If any of the front left/right is missed from the output * channel layout, mix to front center. */ static size_t s16_stereo_to_51(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { size_t i, left, right, center; memset(out, 0, sizeof(*out) * 6 * in_frames); left = conv->out_fmt.channel_layout[CRAS_CH_FL]; right = conv->out_fmt.channel_layout[CRAS_CH_FR]; center = conv->out_fmt.channel_layout[CRAS_CH_FC]; if (left != -1 && right != -1) for (i = 0; i < in_frames; i++) { out[6 * i + left] = in[2 * i]; out[6 * i + right] = in[2 * i + 1]; } else if (center != -1) for (i = 0; i < in_frames; i++) out[6 * i + center] = s16_add_and_clip( in[2 * i], in[2 * i + 1]); else /* Select the first two channels to convert to as the * default behavior. */ for (i = 0; i < in_frames; i++) { out[6 * i] = in[2 * i]; out[6 * i + 1] = in[2 * i + 1]; } return in_frames; } /* Converts S16 5.1 to S16 stereo. The out buffer can have room for just * stereo samples. This convert function is used as the default behavior * when channel layout is not set from the client side. */ static size_t s16_51_to_stereo(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { static const unsigned int left_idx = 0; static const unsigned int right_idx = 1; /* static const unsigned int left_surround_idx = 2; */ /* static const unsigned int right_surround_idx = 3; */ static const unsigned int center_idx = 4; /* static const unsigned int lfe_idx = 5; */ size_t i; for (i = 0; i < in_frames; i++) { unsigned int half_center; half_center = in[6 * i + center_idx] / 2; out[2 * i + left_idx] = s16_add_and_clip(in[6 * i + left_idx], half_center); out[2 * i + right_idx] = s16_add_and_clip(in[6 * i + right_idx], half_center); } return in_frames; } /* Converts S16 stereo to quad (front L/R, rear L/R). Fit left/right of input * to the front left/right of output respectively and fill others * with zero. */ static size_t s16_stereo_to_quad(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { size_t i, front_left, front_right, rear_left, rear_right; front_left = conv->out_fmt.channel_layout[CRAS_CH_FL]; front_right = conv->out_fmt.channel_layout[CRAS_CH_FR]; rear_left = conv->out_fmt.channel_layout[CRAS_CH_RL]; rear_right = conv->out_fmt.channel_layout[CRAS_CH_RR]; if (front_left != -1 && front_right != -1 && rear_left != -1 && rear_right != -1) for (i = 0; i < in_frames; i++) { out[4 * i + front_left] = in[2 * i]; out[4 * i + front_right] = in[2 * i + 1]; out[4 * i + rear_left] = in[2 * i]; out[4 * i + rear_right] = in[2 * i + 1]; } else /* Select the first four channels to convert to as the * default behavior. */ for (i = 0; i < in_frames; i++) { out[4 * i] = in[2 * i]; out[4 * i + 1] = in[2 * i + 1]; out[4 * i + 2] = in[2 * i]; out[4 * i + 3] = in[2 * i + 1]; } return in_frames; } /* Converts S16 quad (front L/R, rear L/R) to S16 stereo. The out buffer * can have room for just stereo samples. */ static size_t s16_quad_to_stereo(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { size_t i; unsigned int left_idx = conv->in_fmt.channel_layout[CRAS_CH_FL]; unsigned int right_idx = conv->in_fmt.channel_layout[CRAS_CH_FR]; unsigned int left_rear_idx = conv->in_fmt.channel_layout[CRAS_CH_RL]; unsigned int right_rear_idx = conv->in_fmt.channel_layout[CRAS_CH_RR]; if (left_idx == -1 || right_idx == -1 || left_rear_idx == -1 || right_rear_idx == -1) { left_idx = 0; right_idx = 1; left_rear_idx = 2; right_rear_idx = 3; } for (i = 0; i < in_frames; i++) { out[2 * i] = s16_add_and_clip( in[4 * i + left_idx], in[4 * i + left_rear_idx] / 4); out[2 * i + 1] = s16_add_and_clip( in[4 * i + right_idx], in[4 * i + right_rear_idx] / 4); } return in_frames; } /* Converts S16 N channels to S16 M channels. The out buffer must have room for * M channel. This convert function is used as the default behavior when channel * layout is not set from the client side. */ static size_t s16_default_all_to_all(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { unsigned int num_in_ch = conv->in_fmt.num_channels; unsigned int num_out_ch = conv->out_fmt.num_channels; unsigned int in_ch, out_ch, i; memset(out, 0, in_frames * cras_get_format_bytes(&conv->out_fmt)); for (out_ch = 0; out_ch < num_out_ch; out_ch++) { for (in_ch = 0; in_ch < num_in_ch; in_ch++) { for (i = 0; i < in_frames; i++) { out[out_ch + i * num_out_ch] += in[in_ch + i * num_in_ch] / num_in_ch; } } } return in_frames; } static int is_channel_layout_equal(const struct cras_audio_format *a, const struct cras_audio_format *b) { int ch; for (ch = 0; ch < CRAS_CH_MAX; ch++) if (a->channel_layout[ch] != b->channel_layout[ch]) return 0; return 1; } /* Multiplies buffer vector with coefficient vector. */ static int16_t multiply_buf_with_coef(float *coef, const int16_t *buf, size_t size) { int32_t sum = 0; int i; for (i = 0; i < size; i++) sum += coef[i] * buf[i]; sum = MAX(sum, -0x8000); sum = MIN(sum, 0x7fff); return (int16_t)sum; } static void normalize_buf(float *buf, size_t size) { int i; float squre_sum = 0.0; for (i = 0; i < size; i++) squre_sum += buf[i] * buf[i]; for (i = 0; i < size; i ++) buf[i] /= squre_sum; } /* Converts channels based on the channel conversion * coefficient matrix. */ static size_t convert_channels(struct cras_fmt_conv *conv, const int16_t *in, size_t in_frames, int16_t *out) { unsigned i, fr; unsigned in_idx = 0; unsigned out_idx = 0; for (fr = 0; fr < in_frames; fr++) { for (i = 0; i < conv->out_fmt.num_channels; i++) out[out_idx + i] = multiply_buf_with_coef( conv->ch_conv_mtx[i], &in[in_idx], conv->in_fmt.num_channels); in_idx += conv->in_fmt.num_channels; out_idx += conv->out_fmt.num_channels; } return in_frames; } /* Populates the down mix matrix by rules: * 1. Front/side left(right) channel will mix to left(right) of * full scale. * 2. Center and LFE will be split equally to left and right. * Rear * 3. Rear left/right will split 1/4 of the power to opposite * channel. */ static void surround51_to_stereo_downmix_mtx(float **mtx, int8_t layout[CRAS_CH_MAX]) { if (layout[CRAS_CH_FC] != -1) { mtx[STEREO_L][layout[CRAS_CH_FC]] = 0.707; mtx[STEREO_R][layout[CRAS_CH_FC]] = 0.707; } if (layout[CRAS_CH_FL] != -1 && layout[CRAS_CH_FR] != -1) { mtx[STEREO_L][layout[CRAS_CH_FL]] = 1.0; mtx[STEREO_R][layout[CRAS_CH_FR]] = 1.0; } if (layout[CRAS_CH_SL] != -1 && layout[CRAS_CH_SR] != -1) { mtx[STEREO_L][layout[CRAS_CH_SL]] = 1.0; mtx[STEREO_R][layout[CRAS_CH_SR]] = 1.0; } if (layout[CRAS_CH_RL] != -1 && layout[CRAS_CH_RR] != -1) { /* Split 1/4 power to the other side */ mtx[STEREO_L][layout[CRAS_CH_RL]] = 0.866; mtx[STEREO_R][layout[CRAS_CH_RL]] = 0.5; mtx[STEREO_R][layout[CRAS_CH_RR]] = 0.866; mtx[STEREO_L][layout[CRAS_CH_RR]] = 0.5; } if (layout[CRAS_CH_LFE] != -1) { mtx[STEREO_L][layout[CRAS_CH_LFE]] = 0.707; mtx[STEREO_R][layout[CRAS_CH_LFE]] = 0.707; } normalize_buf(mtx[STEREO_L], 6); normalize_buf(mtx[STEREO_R], 6); } /* * Exported interface */ struct cras_fmt_conv *cras_fmt_conv_create(const struct cras_audio_format *in, const struct cras_audio_format *out, size_t max_frames, size_t pre_linear_resample) { struct cras_fmt_conv *conv; int rc; unsigned i; conv = calloc(1, sizeof(*conv)); if (conv == NULL) return NULL; conv->in_fmt = *in; conv->out_fmt = *out; conv->tmp_buf_frames = max_frames; conv->pre_linear_resample = pre_linear_resample; /* Set up sample format conversion. */ /* TODO(dgreid) - modify channel and sample rate conversion so * converting to s16 isnt necessary. */ if (in->format != SND_PCM_FORMAT_S16_LE) { conv->num_converters++; syslog(LOG_DEBUG, "Convert from format %d to %d.", in->format, out->format); switch(in->format) { case SND_PCM_FORMAT_U8: conv->in_format_converter = convert_u8_to_s16le; break; case SND_PCM_FORMAT_S24_LE: conv->in_format_converter = convert_s24le_to_s16le; break; case SND_PCM_FORMAT_S32_LE: conv->in_format_converter = convert_s32le_to_s16le; break; case SND_PCM_FORMAT_S24_3LE: conv->in_format_converter = convert_s243le_to_s16le; break; default: syslog(LOG_WARNING, "Invalid format %d", in->format); cras_fmt_conv_destroy(&conv); return NULL; } } if (out->format != SND_PCM_FORMAT_S16_LE) { conv->num_converters++; syslog(LOG_DEBUG, "Convert from format %d to %d.", in->format, out->format); switch (out->format) { case SND_PCM_FORMAT_U8: conv->out_format_converter = convert_s16le_to_u8; break; case SND_PCM_FORMAT_S24_LE: conv->out_format_converter = convert_s16le_to_s24le; break; case SND_PCM_FORMAT_S32_LE: conv->out_format_converter = convert_s16le_to_s32le; break; case SND_PCM_FORMAT_S24_3LE: conv->out_format_converter = convert_s16le_to_s243le; break; default: syslog(LOG_WARNING, "Invalid format %d", out->format); cras_fmt_conv_destroy(&conv); return NULL; } } /* Set up channel number conversion. */ if (in->num_channels != out->num_channels) { conv->num_converters++; syslog(LOG_DEBUG, "Convert from %zu to %zu channels.", in->num_channels, out->num_channels); /* Populate the conversion matrix base on in/out channel count * and layout. */ if (in->num_channels == 1 && out->num_channels == 2) { conv->channel_converter = s16_mono_to_stereo; } else if (in->num_channels == 1 && out->num_channels == 6) { conv->channel_converter = s16_mono_to_51; } else if (in->num_channels == 2 && out->num_channels == 1) { conv->channel_converter = s16_stereo_to_mono; } else if (in->num_channels == 2 && out->num_channels == 4) { conv->channel_converter = s16_stereo_to_quad; } else if (in->num_channels == 4 && out->num_channels == 2) { conv->channel_converter = s16_quad_to_stereo; } else if (in->num_channels == 2 && out->num_channels == 6) { conv->channel_converter = s16_stereo_to_51; } else if (in->num_channels == 6 && out->num_channels == 2) { int in_channel_layout_set = 0; /* Checks if channel_layout is set in the incoming format */ for (i = 0; i < CRAS_CH_MAX; i++) if (in->channel_layout[i] != -1) in_channel_layout_set = 1; /* Use the conversion matrix based converter when a * channel layout is set, or default to use existing * converter to downmix to stereo */ if (in_channel_layout_set) { conv->ch_conv_mtx = cras_channel_conv_matrix_alloc( in->num_channels, out->num_channels); if (conv->ch_conv_mtx == NULL) { cras_fmt_conv_destroy(&conv); return NULL; } conv->channel_converter = convert_channels; surround51_to_stereo_downmix_mtx( conv->ch_conv_mtx, conv->in_fmt.channel_layout); } else { conv->channel_converter = s16_51_to_stereo; } } else { syslog(LOG_WARNING, "Using default channel map for %zu to %zu", in->num_channels, out->num_channels); conv->channel_converter = s16_default_all_to_all; } } else if (in->num_channels > 2 && !is_channel_layout_equal(in, out)){ conv->num_converters++; conv->ch_conv_mtx = cras_channel_conv_matrix_create(in, out); if (conv->ch_conv_mtx == NULL) { syslog(LOG_ERR, "Failed to create channel conversion matrix"); cras_fmt_conv_destroy(&conv); return NULL; } conv->channel_converter = convert_channels; } /* Set up sample rate conversion. */ if (in->frame_rate != out->frame_rate) { conv->num_converters++; syslog(LOG_DEBUG, "Convert from %zu to %zu Hz.", in->frame_rate, out->frame_rate); conv->speex_state = speex_resampler_init(out->num_channels, in->frame_rate, out->frame_rate, SPEEX_QUALITY_LEVEL, &rc); if (conv->speex_state == NULL) { syslog(LOG_ERR, "Fail to create speex:%zu %zu %zu %d", out->num_channels, in->frame_rate, out->frame_rate, rc); cras_fmt_conv_destroy(&conv); return NULL; } } /* Set up linear resampler. */ conv->num_converters++; conv->resampler = linear_resampler_create( out->num_channels, cras_get_format_bytes(out), out->frame_rate, out->frame_rate); if (conv->resampler == NULL) { syslog(LOG_ERR, "Fail to create linear resampler"); cras_fmt_conv_destroy(&conv); return NULL; } /* Need num_converters-1 temp buffers, the final converter renders * directly into the output. */ for (i = 0; i < conv->num_converters - 1; i++) { conv->tmp_bufs[i] = malloc( max_frames * 4 * /* width in bytes largest format. */ MAX(in->num_channels, out->num_channels)); if (conv->tmp_bufs[i] == NULL) { cras_fmt_conv_destroy(&conv); return NULL; } } assert(conv->num_converters <= MAX_NUM_CONVERTERS); return conv; } void cras_fmt_conv_destroy(struct cras_fmt_conv **convp) { unsigned i; struct cras_fmt_conv *conv = *convp; if (conv->ch_conv_mtx) cras_channel_conv_matrix_destroy(conv->ch_conv_mtx, conv->out_fmt.num_channels); if (conv->speex_state) speex_resampler_destroy(conv->speex_state); if (conv->resampler) linear_resampler_destroy(conv->resampler); for (i = 0; i < MAX_NUM_CONVERTERS - 1; i++) free(conv->tmp_bufs[i]); free(conv); *convp = NULL; } struct cras_fmt_conv *cras_channel_remix_conv_create( unsigned int num_channels, const float *coefficient) { struct cras_fmt_conv *conv; unsigned out_ch, in_ch; conv = calloc(1, sizeof(*conv)); if (conv == NULL) return NULL; conv->in_fmt.num_channels = num_channels; conv->out_fmt.num_channels = num_channels; conv->ch_conv_mtx = cras_channel_conv_matrix_alloc(num_channels, num_channels); /* Convert the coeffiencnt array to conversion matrix. */ for (out_ch = 0; out_ch < num_channels; out_ch++) for (in_ch = 0; in_ch < num_channels; in_ch++) conv->ch_conv_mtx[out_ch][in_ch] = coefficient[in_ch + out_ch * num_channels]; conv->num_converters = 1; conv->tmp_bufs[0] = malloc(4 * /* width in bytes largest format. */ num_channels); return conv; } void cras_channel_remix_convert(struct cras_fmt_conv *conv, const struct cras_audio_format *fmt, uint8_t *in_buf, size_t nframes) { unsigned ch, fr; int16_t *tmp = (int16_t *)conv->tmp_bufs[0]; int16_t *buf = (int16_t *)in_buf; /* Do remix only when input buffer has the same number of channels. */ if (fmt->num_channels != conv->in_fmt.num_channels) return; for (fr = 0; fr < nframes; fr++) { for (ch = 0; ch < conv->in_fmt.num_channels; ch++) tmp[ch] = multiply_buf_with_coef( conv->ch_conv_mtx[ch], buf, conv->in_fmt.num_channels); for (ch = 0; ch < conv->in_fmt.num_channels; ch++) buf[ch] = tmp[ch]; buf += conv->in_fmt.num_channels; } } const struct cras_audio_format *cras_fmt_conv_in_format( const struct cras_fmt_conv *conv) { return &conv->in_fmt; } const struct cras_audio_format *cras_fmt_conv_out_format( const struct cras_fmt_conv *conv) { return &conv->out_fmt; } size_t cras_fmt_conv_in_frames_to_out(struct cras_fmt_conv *conv, size_t in_frames) { if (!conv) return in_frames; if (conv->pre_linear_resample) in_frames = linear_resampler_in_frames_to_out( conv->resampler, in_frames); in_frames = cras_frames_at_rate(conv->in_fmt.frame_rate, in_frames, conv->out_fmt.frame_rate); if (!conv->pre_linear_resample) in_frames = linear_resampler_in_frames_to_out( conv->resampler, in_frames); return in_frames; } size_t cras_fmt_conv_out_frames_to_in(struct cras_fmt_conv *conv, size_t out_frames) { if (!conv) return out_frames; if (!conv->pre_linear_resample) out_frames = linear_resampler_out_frames_to_in( conv->resampler, out_frames); out_frames = cras_frames_at_rate(conv->out_fmt.frame_rate, out_frames, conv->in_fmt.frame_rate); if (conv->pre_linear_resample) out_frames = linear_resampler_out_frames_to_in( conv->resampler, out_frames); return out_frames; } void cras_fmt_conv_set_linear_resample_rates(struct cras_fmt_conv *conv, float from, float to) { linear_resampler_set_rates(conv->resampler, from, to); } size_t cras_fmt_conv_convert_frames(struct cras_fmt_conv *conv, const uint8_t *in_buf, uint8_t *out_buf, unsigned int *in_frames, size_t out_frames) { uint32_t fr_in, fr_out; uint8_t *buffers[MAX_NUM_CONVERTERS + 1]; /* converters + out buffer. */ size_t buf_idx = 0; static int logged_frames_dont_fit; unsigned int used_converters = conv->num_converters; unsigned int post_linear_resample = 0; unsigned int pre_linear_resample = 0; unsigned int linear_resample_fr = 0; assert(conv); assert(*in_frames <= conv->tmp_buf_frames); if (linear_resampler_needed(conv->resampler)) { post_linear_resample = !conv->pre_linear_resample; pre_linear_resample = conv->pre_linear_resample; } /* If no SRC, then in_frames should = out_frames. */ if (conv->speex_state == NULL) { fr_in = MIN(*in_frames, out_frames); if (out_frames < *in_frames && !logged_frames_dont_fit) { syslog(LOG_INFO, "fmt_conv: %u to %zu no SRC.", *in_frames, out_frames); logged_frames_dont_fit = 1; } } else { fr_in = *in_frames; } fr_out = fr_in; /* Set up a chain of buffers. The output buffer of the first conversion * is used as input to the second and so forth, ending in the output * buffer. */ if (!linear_resampler_needed(conv->resampler)) used_converters--; buffers[4] = (uint8_t *)conv->tmp_bufs[3]; buffers[3] = (uint8_t *)conv->tmp_bufs[2]; buffers[2] = (uint8_t *)conv->tmp_bufs[1]; buffers[1] = (uint8_t *)conv->tmp_bufs[0]; buffers[0] = (uint8_t *)in_buf; buffers[used_converters] = out_buf; if (pre_linear_resample) { linear_resample_fr = fr_in; unsigned resample_limit = out_frames; /* If there is a 2nd fmt conversion we should convert the * resample limit and round it to the lower bound in order * not to convert too many frames in the pre linear resampler. */ if (conv->speex_state != NULL) { resample_limit = resample_limit * conv->in_fmt.frame_rate / conv->out_fmt.frame_rate; /* * However if the limit frames count is less than * |out_rate / in_rate|, the final limit value could be * rounded to zero so it confuses linear resampler to * do nothing. Make sure it's non-zero in that case. */ if (resample_limit == 0) resample_limit = 1; } resample_limit = MIN(resample_limit, conv->tmp_buf_frames); fr_in = linear_resampler_resample( conv->resampler, buffers[buf_idx], &linear_resample_fr, buffers[buf_idx + 1], resample_limit); buf_idx++; } /* If the input format isn't S16_LE convert to it. */ if (conv->in_fmt.format != SND_PCM_FORMAT_S16_LE) { conv->in_format_converter(buffers[buf_idx], fr_in * conv->in_fmt.num_channels, (uint8_t *)buffers[buf_idx + 1]); buf_idx++; } /* Then channel conversion. */ if (conv->channel_converter != NULL) { conv->channel_converter(conv, (int16_t *)buffers[buf_idx], fr_in, (int16_t *)buffers[buf_idx + 1]); buf_idx++; } /* Then SRC. */ if (conv->speex_state != NULL) { unsigned int out_limit = out_frames; if (post_linear_resample) out_limit = linear_resampler_out_frames_to_in( conv->resampler, out_limit); fr_out = cras_frames_at_rate(conv->in_fmt.frame_rate, fr_in, conv->out_fmt.frame_rate); if (fr_out > out_frames + 1 && !logged_frames_dont_fit) { syslog(LOG_INFO, "fmt_conv: put %u frames in %zu sized buffer", fr_out, out_frames); logged_frames_dont_fit = 1; } /* limit frames to the output size. */ fr_out = MIN(fr_out, out_limit); speex_resampler_process_interleaved_int( conv->speex_state, (int16_t *)buffers[buf_idx], &fr_in, (int16_t *)buffers[buf_idx + 1], &fr_out); buf_idx++; } if (post_linear_resample) { linear_resample_fr = fr_out; unsigned resample_limit = MIN(conv->tmp_buf_frames, out_frames); fr_out = linear_resampler_resample( conv->resampler, buffers[buf_idx], &linear_resample_fr, buffers[buf_idx + 1], resample_limit); buf_idx++; } /* If the output format isn't S16_LE convert to it. */ if (conv->out_fmt.format != SND_PCM_FORMAT_S16_LE) { conv->out_format_converter(buffers[buf_idx], fr_out * conv->out_fmt.num_channels, (uint8_t *)buffers[buf_idx + 1]); buf_idx++; } if (pre_linear_resample) { *in_frames = linear_resample_fr; /* When buffer sizes are small, there's a corner case that * speex library resamples 0 frame to N-1 frames, where N * is the integer ratio of output and input rate. For example, * 16KHz to 48KHz. In this case fmt_conv should claim zero * frames processed, instead of using the linear resampler * processed frames count. Otherwise there will be a frame * leak and, if accumulated, causes delay in multiple devices * use case. */ if (conv->speex_state && (fr_in == 0)) *in_frames = 0; } else { *in_frames = fr_in; } return fr_out; } int cras_fmt_conversion_needed(const struct cras_fmt_conv *conv) { return linear_resampler_needed(conv->resampler) || (conv->num_converters > 1); } /* If the server cannot provide the requested format, configures an audio format * converter that handles transforming the input format to the format used by * the server. */ int config_format_converter(struct cras_fmt_conv **conv, enum CRAS_STREAM_DIRECTION dir, const struct cras_audio_format *from, const struct cras_audio_format *to, unsigned int frames) { struct cras_audio_format target; /* For input, preserve the channel count and layout of * from format */ if (dir == CRAS_STREAM_INPUT) { target = *from; target.format = to->format; target.frame_rate = to->frame_rate; } else { target = *to; } syslog(LOG_DEBUG, "format convert: from:%d %zu %zu target: %d %zu %zu " "frames = %u", from->format, from->frame_rate, from->num_channels, target.format, target.frame_rate, target.num_channels, frames); *conv = cras_fmt_conv_create(from, &target, frames, (dir == CRAS_STREAM_INPUT)); if (!*conv) { syslog(LOG_ERR, "Failed to create format converter"); return -ENOMEM; } return 0; }