#include "audioconverter.h" #include "logcategories.h" #include "ulaw.h" audioConverter::audioConverter(QObject* parent) : QObject(parent) { } bool audioConverter::init(QAudioFormat inFormat, QAudioFormat outFormat, quint8 opusComplexity, quint8 resampleQuality) { this->inFormat = inFormat; this->outFormat = outFormat; this->opusComplexity = opusComplexity; this->resampleQuality = resampleQuality; qInfo(logAudioConverter) << "Starting audioConverter() Input:" << inFormat.channelCount() << "Channels of" << inFormat.codec() << inFormat.sampleRate() << inFormat.sampleType() << inFormat.sampleSize() << "Output:" << outFormat.channelCount() << "Channels of" << outFormat.codec() << outFormat.sampleRate() << outFormat.sampleType() << outFormat.sampleSize(); if (inFormat.byteOrder() != outFormat.byteOrder()) { qInfo(logAudioConverter) << "Byteorder mismatch in:" << inFormat.byteOrder() << "out:" << outFormat.byteOrder(); } if (inFormat.codec() == "audio/opus") { // Create instance of opus decoder int opus_err = 0; opusDecoder = opus_decoder_create(inFormat.sampleRate(), inFormat.channelCount(), &opus_err); qInfo(logAudioConverter()) << "Creating opus decoder: " << opus_strerror(opus_err); } if (outFormat.codec() == "audio/opus") { // Create instance of opus encoder int opus_err = 0; opusEncoder = opus_encoder_create(outFormat.sampleRate(), outFormat.channelCount(), OPUS_APPLICATION_AUDIO, &opus_err); //opus_encoder_ctl(opusEncoder, OPUS_SET_LSB_DEPTH(16)); //opus_encoder_ctl(opusEncoder, OPUS_SET_INBAND_FEC(1)); //opus_encoder_ctl(opusEncoder, OPUS_SET_DTX(1)); //opus_encoder_ctl(opusEncoder, OPUS_SET_PACKET_LOSS_PERC(5)); opus_encoder_ctl(opusEncoder, OPUS_SET_COMPLEXITY(opusComplexity)); // Reduce complexity to maybe lower CPU? qInfo(logAudioConverter()) << "Creating opus encoder: " << opus_strerror(opus_err); } if (inFormat.sampleRate() != outFormat.sampleRate()) { int resampleError = 0; unsigned int ratioNum; unsigned int ratioDen; // Sample rate conversion required. resampler = wf_resampler_init(outFormat.channelCount(), inFormat.sampleRate(), outFormat.sampleRate(), resampleQuality, &resampleError); wf_resampler_get_ratio(resampler, &ratioNum, &ratioDen); resampleRatio = static_cast(ratioDen) / ratioNum; qInfo(logAudioConverter()) << "wf_resampler_init() returned: " << resampleError << " resampleRatio: " << resampleRatio; } return true; } audioConverter::~audioConverter() { qInfo(logAudioConverter) << "Closing audioConverter() Input:" << inFormat.channelCount() << "Channels of" << inFormat.codec() << inFormat.sampleRate() << inFormat.sampleType() << inFormat.sampleSize() << "Output:" << outFormat.channelCount() << "Channels of" << outFormat.codec() << outFormat.sampleRate() << outFormat.sampleType() << outFormat.sampleSize(); if (opusEncoder != Q_NULLPTR) { qInfo(logAudioConverter()) << "Destroying opus encoder"; opus_encoder_destroy(opusEncoder); } if (opusDecoder != Q_NULLPTR) { qInfo(logAudioConverter()) << "Destroying opus decoder"; opus_decoder_destroy(opusDecoder); } if (resampler != Q_NULLPTR) { speex_resampler_destroy(resampler); qDebug(logAudioConverter()) << "Resampler closed"; } } bool audioConverter::convert(audioPacket audio) { // If inFormat and outFormat are identical, just emit the data back (removed as it doesn't then process amplitude) if (audio.data.size() > 0) { if (inFormat.codec() == "audio/opus") { unsigned char* in = (unsigned char*)audio.data.data(); //Decode the frame. int nSamples = opus_packet_get_nb_samples(in, audio.data.size(), inFormat.sampleRate()); if (nSamples == -1) { // No opus data yet? return false; } QByteArray outPacket(nSamples * sizeof(float) * inFormat.channelCount(), (char)0xff); // Preset the output buffer size. float* out = (float*)outPacket.data(); //if (audio.seq > lastAudioSequence + 1) { // nSamples = opus_decode_float(opusDecoder, Q_NULLPTR, 0, out, nSamples, 1); //} //else { nSamples = opus_decode_float(opusDecoder, in, audio.data.size(), out, nSamples, 0); //} //lastAudioSequence = audio.seq; audio.data.clear(); audio.data = outPacket; // Replace incoming data with converted. } else if (inFormat.codec() == "audio/PCMU") { // Current packet is "technically" 8bit so need to create a new buffer that is 16bit QByteArray outPacket((int)audio.data.length() * 2, (char)0xff); qint16* out = (qint16*)outPacket.data(); for (int f = 0; f < audio.data.length(); f++) { *out++ = ulaw_decode[(quint8)audio.data[f]]; } audio.data.clear(); audio.data = outPacket; // Replace incoming data with converted. // Make sure that sample size/type is set correctly } Eigen::VectorXf samplesF; if (inFormat.sampleType() == QAudioFormat::SignedInt && inFormat.sampleSize() == 32) { Eigen::Ref samplesI = Eigen::Map(reinterpret_cast(audio.data.data()), audio.data.size() / int(sizeof(qint32))); samplesF = samplesI.cast() / float(std::numeric_limits::max()); } else if (inFormat.sampleType() == QAudioFormat::SignedInt && inFormat.sampleSize() == 16) { Eigen::Ref samplesI = Eigen::Map(reinterpret_cast(audio.data.data()), audio.data.size() / int(sizeof(qint16))); samplesF = samplesI.cast() / float(std::numeric_limits::max()); } else if (inFormat.sampleType() == QAudioFormat::SignedInt && inFormat.sampleSize() == 8) { Eigen::Ref samplesI = Eigen::Map(reinterpret_cast(audio.data.data()), audio.data.size() / int(sizeof(qint8))); samplesF = samplesI.cast() / float(std::numeric_limits::max());; } else if (inFormat.sampleType() == QAudioFormat::UnSignedInt && inFormat.sampleSize() == 8) { Eigen::Ref samplesI = Eigen::Map(reinterpret_cast(audio.data.data()), audio.data.size() / int(sizeof(quint8))); samplesF = samplesI.cast() / float(std::numeric_limits::max());; } else if (inFormat.sampleType() == QAudioFormat::Float) { samplesF = Eigen::Map(reinterpret_cast(audio.data.data()), audio.data.size() / int(sizeof(float))); } else { qInfo(logAudio()) << "Unsupported Input Sample Type:" << inFormat.sampleType() << "Size:" << inFormat.sampleSize(); } if (samplesF.size() > 0) { audio.amplitudePeak = samplesF.array().abs().maxCoeff(); audio.amplitudeRMS = samplesF.squaredNorm(); // Set the volume samplesF *= audio.volume; /* samplesF is now an Eigen Vector of the current samples in float format The next step is to convert to the correct number of channels in outFormat.channelCount() */ if (inFormat.channelCount() == 2 && outFormat.channelCount() == 1) { // If we need to drop one of the audio channels, do it now Eigen::VectorXf samplesTemp(samplesF.size() / 2); samplesTemp = Eigen::Map >(samplesF.data(), samplesF.size() / 2); samplesF = samplesTemp; } else if (inFormat.channelCount() == 1 && outFormat.channelCount() == 2) { // Convert mono to stereo if required Eigen::VectorXf samplesTemp(samplesF.size() * 2); Eigen::Map >(samplesTemp.data(), samplesF.size()) = samplesF; Eigen::Map >(samplesTemp.data() + 1, samplesF.size()) = samplesF; samplesF = samplesTemp; } /* Next step is to resample (if needed) */ if (resampler != Q_NULLPTR && resampleRatio != 1.0) { quint32 outFrames = ((samplesF.size() / outFormat.channelCount()) * resampleRatio); quint32 inFrames = (samplesF.size() / outFormat.channelCount()); QByteArray outPacket(outFrames * outFormat.channelCount() * sizeof(float), (char)0xff); // Preset the output buffer size. const float* in = (float*)samplesF.data(); float* out = (float*)outPacket.data(); int err = 0; if (outFormat.channelCount() == 1) { err = wf_resampler_process_float(resampler, 0, in, &inFrames, out, &outFrames); } else { err = wf_resampler_process_interleaved_float(resampler, in, &inFrames, out, &outFrames); } if (err) { qInfo(logAudioConverter()) << "Resampler error " << err << " inFrames:" << inFrames << " outFrames:" << outFrames; } samplesF = Eigen::Map(reinterpret_cast(outPacket.data()), outPacket.size() / int(sizeof(float))); } /* If output is Opus so encode it now, don't do any more conversion on the output of Opus. */ if (outFormat.codec() == "audio/opus") { float* in = (float*)samplesF.data(); QByteArray outPacket(1275, (char)0xff); // Preset the output buffer size to MAXIMUM possible Opus frame size unsigned char* out = (unsigned char*)outPacket.data(); int nbBytes = opus_encode_float(opusEncoder, in, (samplesF.size() / outFormat.channelCount()), out, outPacket.length()); if (nbBytes < 0) { qInfo(logAudioConverter()) << "Opus encode failed:" << opus_strerror(nbBytes) << "Num Samples:" << samplesF.size(); return false; } else { outPacket.resize(nbBytes); audio.data.clear(); audio.data = outPacket; // Copy output packet back to input buffer. //samplesF = Eigen::Map(reinterpret_cast(outPacket.data()), outPacket.size() / int(sizeof(float))); } } else { /* Now convert back into the output format required */ audio.data.clear(); if (outFormat.sampleType() == QAudioFormat::UnSignedInt && outFormat.sampleSize() == 8) { Eigen::VectorXf samplesITemp = samplesF * float(std::numeric_limits::max()); samplesITemp.array() += 127; VectorXuint8 samplesI = samplesITemp.cast(); audio.data = QByteArray(reinterpret_cast(samplesI.data()), int(samplesI.size()) * int(sizeof(quint8))); } else if (outFormat.sampleType() == QAudioFormat::SignedInt && outFormat.sampleSize() == 8) { Eigen::VectorXf samplesITemp = samplesF * float(std::numeric_limits::max()); VectorXint8 samplesI = samplesITemp.cast(); audio.data = QByteArray(reinterpret_cast(samplesI.data()), int(samplesI.size()) * int(sizeof(qint8))); } else if (outFormat.sampleType() == QAudioFormat::SignedInt && outFormat.sampleSize() == 16) { Eigen::VectorXf samplesITemp = samplesF * float(std::numeric_limits::max()); VectorXint16 samplesI = samplesITemp.cast(); audio.data = QByteArray(reinterpret_cast(samplesI.data()), int(samplesI.size()) * int(sizeof(qint16))); } else if (outFormat.sampleType() == QAudioFormat::SignedInt && outFormat.sampleSize() == 32) { Eigen::VectorXf samplesITemp = samplesF * float(std::numeric_limits::max()); VectorXint32 samplesI = samplesITemp.cast(); audio.data = QByteArray(reinterpret_cast(samplesI.data()), int(samplesI.size()) * int(sizeof(qint32))); } else if (outFormat.sampleType() == QAudioFormat::Float) { audio.data = QByteArray(reinterpret_cast(samplesF.data()), int(samplesF.size()) * int(sizeof(float))); } else { qInfo(logAudio()) << "Unsupported Output Sample Type:" << outFormat.sampleType() << "Size:" << outFormat.sampleSize(); } /* As we currently don't have a float based uLaw encoder, this must be done after all other conversion has taken place. */ if (outFormat.codec() == "audio/PCMU") { QByteArray outPacket((int)audio.data.length() / 2, (char)0xff); qint16* in = (qint16*)audio.data.data(); for (int f = 0; f < outPacket.length(); f++) { qint16 sample = *in++; int sign = (sample >> 8) & 0x80; if (sign) sample = (short)-sample; if (sample > cClip) sample = cClip; sample = (short)(sample + cBias); int exponent = (int)MuLawCompressTable[(sample >> 7) & 0xFF]; int mantissa = (sample >> (exponent + 3)) & 0x0F; int compressedByte = ~(sign | (exponent << 4) | mantissa); outPacket[f] = (quint8)compressedByte; } audio.data.clear(); audio.data = outPacket; // Copy output packet back to input buffer. } } } else { qDebug(logAudioConverter) << "Detected empty packet"; } } emit converted(audio); return true; }