mirror of
https://github.com/HifiExperiments/overte.git
synced 2025-06-19 23:49:24 +02:00
447 lines
17 KiB
C++
447 lines
17 KiB
C++
//
|
|
// Audio.cpp
|
|
// interface
|
|
//
|
|
// Created by Stephen Birarda on 1/22/13.
|
|
// Copyright (c) 2013 High Fidelity, Inc. All rights reserved.
|
|
//
|
|
|
|
#include <iostream>
|
|
#include <fstream>
|
|
#include <pthread.h>
|
|
#include <sys/time.h>
|
|
#include <sys/stat.h>
|
|
#include <cstring>
|
|
#include "Audio.h"
|
|
#include "Util.h"
|
|
#include "UDPSocket.h"
|
|
|
|
Oscilloscope * scope;
|
|
|
|
const short BUFFER_LENGTH_BYTES = 1024;
|
|
const short BUFFER_LENGTH_SAMPLES = BUFFER_LENGTH_BYTES / sizeof(int16_t);
|
|
|
|
const short PACKET_LENGTH_BYTES = 1024;
|
|
const short PACKET_LENGTH_SAMPLES = PACKET_LENGTH_BYTES / sizeof(int16_t);
|
|
|
|
const int PHASE_DELAY_AT_90 = 20;
|
|
const float AMPLITUDE_RATIO_AT_90 = 0.5;
|
|
|
|
const short RING_BUFFER_FRAMES = 10;
|
|
const short RING_BUFFER_SIZE_SAMPLES = RING_BUFFER_FRAMES * BUFFER_LENGTH_SAMPLES;
|
|
|
|
const int SAMPLE_RATE = 22050;
|
|
const float JITTER_BUFFER_LENGTH_MSECS = 30.0;
|
|
const short JITTER_BUFFER_SAMPLES = JITTER_BUFFER_LENGTH_MSECS * (SAMPLE_RATE / 1000.0);
|
|
|
|
const short NUM_AUDIO_SOURCES = 2;
|
|
const short ECHO_SERVER_TEST = 1;
|
|
|
|
const char LOCALHOST_MIXER[] = "0.0.0.0";
|
|
const char WORKCLUB_MIXER[] = "192.168.1.19";
|
|
const char EC2_WEST_MIXER[] = "54.241.92.53";
|
|
|
|
const int AUDIO_UDP_LISTEN_PORT = 55444;
|
|
|
|
int starve_counter = 0;
|
|
bool stopAudioReceiveThread = false;
|
|
|
|
StDev stdev;
|
|
|
|
#define LOG_SAMPLE_DELAY 1
|
|
|
|
std::ofstream logFile;
|
|
|
|
/**
|
|
* Audio callback used by portaudio.
|
|
* Communicates with Audio via a shared pointer to Audio::data.
|
|
* Writes input audio channels (if they exist) into Audio::data->buffer,
|
|
multiplied by Audio::data->inputGain.
|
|
* Then writes Audio::data->buffer into output audio channels, and clears
|
|
the portion of Audio::data->buffer that has been read from for reuse.
|
|
*
|
|
* @param[in] inputBuffer A pointer to an internal portaudio data buffer containing data read by portaudio.
|
|
* @param[out] outputBuffer A pointer to an internal portaudio data buffer to be read by the configured output device.
|
|
* @param[in] frames Number of frames that portaudio requests to be read/written.
|
|
(Valid size of input/output buffers = frames * number of channels (2) * sizeof data type (float)).
|
|
* @param[in] timeInfo Portaudio time info. Currently unused.
|
|
* @param[in] statusFlags Portaudio status flags. Currently unused.
|
|
* @param[in] userData Pointer to supplied user data (in this case, a pointer to Audio::data).
|
|
Used to communicate with external code (since portaudio calls this function from another thread).
|
|
* @return Should be of type PaStreamCallbackResult. Return paComplete to end the stream, or paContinue to continue (default).
|
|
Can be used to end the stream from within the callback.
|
|
*/
|
|
|
|
int audioCallback (const void *inputBuffer,
|
|
void *outputBuffer,
|
|
unsigned long frames,
|
|
const PaStreamCallbackTimeInfo *timeInfo,
|
|
PaStreamCallbackFlags statusFlags,
|
|
void *userData)
|
|
{
|
|
AudioData *data = (AudioData *) userData;
|
|
|
|
int16_t *inputLeft = ((int16_t **) inputBuffer)[0];
|
|
// int16_t *inputRight = ((int16_t **) inputBuffer)[1];
|
|
|
|
if (inputLeft != NULL) {
|
|
|
|
if (data->mixerAddress != 0) {
|
|
sockaddr_in audioMixerSocket;
|
|
audioMixerSocket.sin_family = AF_INET;
|
|
audioMixerSocket.sin_addr.s_addr = data->mixerAddress;
|
|
audioMixerSocket.sin_port = data->mixerPort;
|
|
data->audioSocket->send((sockaddr *)&audioMixerSocket, (void *)inputLeft, BUFFER_LENGTH_BYTES);
|
|
}
|
|
|
|
//
|
|
// Measure the loudness of the signal from the microphone and store in audio object
|
|
//
|
|
float loudness = 0;
|
|
for (int i = 0; i < BUFFER_LENGTH_SAMPLES; i++) {
|
|
loudness += abs(inputLeft[i]);
|
|
}
|
|
loudness /= BUFFER_LENGTH_SAMPLES;
|
|
data->lastInputLoudness = loudness;
|
|
data->averagedInputLoudness = 0.66*data->averagedInputLoudness + 0.33*loudness;
|
|
//
|
|
// If scope is turned on, copy input buffer to scope
|
|
//
|
|
if (scope->getState()) {
|
|
for (int i = 0; i < BUFFER_LENGTH_SAMPLES; i++) {
|
|
scope->addData((float)inputLeft[i]/32767.0, 1, i);
|
|
}
|
|
}
|
|
}
|
|
|
|
int16_t *outputLeft = ((int16_t **) outputBuffer)[0];
|
|
int16_t *outputRight = ((int16_t **) outputBuffer)[1];
|
|
|
|
memset(outputLeft, 0, BUFFER_LENGTH_BYTES);
|
|
memset(outputRight, 0, BUFFER_LENGTH_BYTES);
|
|
|
|
// Copy output data to oscilloscope
|
|
if (scope->getState()) {
|
|
for (int i = 0; i < BUFFER_LENGTH_SAMPLES; i++) {
|
|
scope->addData((float)outputRight[i]/32767.0, 2, i);
|
|
}
|
|
}
|
|
|
|
AudioRingBuffer *ringBuffer = data->ringBuffer;
|
|
|
|
int16_t *queueBuffer = data->samplesToQueue;
|
|
memset(queueBuffer, 0, BUFFER_LENGTH_BYTES);
|
|
|
|
// if we've been reset, and there isn't any new packets yet
|
|
// just play some silence
|
|
|
|
if (ringBuffer->endOfLastWrite != NULL) {
|
|
|
|
if (!ringBuffer->started && ringBuffer->diffLastWriteNextOutput() <= PACKET_LENGTH_SAMPLES + JITTER_BUFFER_SAMPLES) {
|
|
printf("Held back\n");
|
|
} else if (ringBuffer->diffLastWriteNextOutput() < PACKET_LENGTH_SAMPLES) {
|
|
ringBuffer->started = false;
|
|
|
|
starve_counter++;
|
|
printf("Starved #%d\n", starve_counter);
|
|
data->wasStarved = 10; // Frames to render the indication that the system was starved.
|
|
} else {
|
|
ringBuffer->started = true;
|
|
// play whatever we have in the audio buffer
|
|
|
|
// no sample overlap, either a direct copy of the audio data, or a copy with some appended silence
|
|
memcpy(queueBuffer, ringBuffer->nextOutput, BUFFER_LENGTH_BYTES);
|
|
|
|
ringBuffer->nextOutput += BUFFER_LENGTH_SAMPLES;
|
|
|
|
if (ringBuffer->nextOutput == ringBuffer->buffer + RING_BUFFER_SIZE_SAMPLES) {
|
|
ringBuffer->nextOutput = ringBuffer->buffer;
|
|
}
|
|
}
|
|
}
|
|
|
|
// copy whatever is in the queueBuffer to the outputLeft and outputRight buffers
|
|
memcpy(outputLeft, queueBuffer, BUFFER_LENGTH_BYTES);
|
|
memcpy(outputRight, queueBuffer, BUFFER_LENGTH_BYTES);
|
|
|
|
gettimeofday(&data->lastCallback, NULL);
|
|
return paContinue;
|
|
}
|
|
|
|
void Audio::updateMixerParams(in_addr_t newMixerAddress, in_port_t newMixerPort) {
|
|
audioData->mixerAddress = newMixerAddress;
|
|
audioData->mixerPort = newMixerPort;
|
|
}
|
|
|
|
struct AudioRecThreadStruct {
|
|
AudioData *sharedAudioData;
|
|
};
|
|
|
|
void *receiveAudioViaUDP(void *args) {
|
|
AudioRecThreadStruct *threadArgs = (AudioRecThreadStruct *) args;
|
|
AudioData *sharedAudioData = threadArgs->sharedAudioData;
|
|
|
|
int16_t *receivedData = new int16_t[BUFFER_LENGTH_SAMPLES];
|
|
ssize_t receivedBytes;
|
|
|
|
timeval previousReceiveTime, currentReceiveTime = {};
|
|
|
|
if (LOG_SAMPLE_DELAY) {
|
|
gettimeofday(&previousReceiveTime, NULL);
|
|
|
|
char *directory = new char[50];
|
|
char *filename = new char[50];
|
|
|
|
sprintf(directory, "%s/Desktop/echo_tests", getenv("HOME"));
|
|
|
|
mkdir(directory, S_IRWXU | S_IRWXG | S_IRWXO);
|
|
sprintf(filename, "%s/%ld.csv", directory, previousReceiveTime.tv_sec);
|
|
|
|
logFile.open(filename, std::ios::out);
|
|
|
|
delete[] directory;
|
|
delete[] filename;
|
|
}
|
|
|
|
while (!stopAudioReceiveThread) {
|
|
if (sharedAudioData->audioSocket->receive((void *)receivedData, &receivedBytes)) {
|
|
|
|
bool firstSample = (currentReceiveTime.tv_sec == 0);
|
|
|
|
gettimeofday(¤tReceiveTime, NULL);
|
|
|
|
if (LOG_SAMPLE_DELAY) {
|
|
if (!firstSample) {
|
|
// write time difference (in microseconds) between packet receipts to file
|
|
double timeDiff = diffclock(&previousReceiveTime, ¤tReceiveTime);
|
|
logFile << timeDiff << std::endl;
|
|
}
|
|
}
|
|
|
|
// Compute and report standard deviation for jitter calculation
|
|
if (firstSample) {
|
|
stdev.reset();
|
|
} else {
|
|
double tDiff = diffclock(&previousReceiveTime, ¤tReceiveTime);
|
|
//printf(\n";
|
|
stdev.addValue(tDiff);
|
|
if (stdev.getSamples() > 500) {
|
|
sharedAudioData->measuredJitter = stdev.getStDev();
|
|
printf("Avg: %4.2f, Stdev: %4.2f\n", stdev.getAverage(), sharedAudioData->measuredJitter);
|
|
stdev.reset();
|
|
}
|
|
}
|
|
|
|
AudioRingBuffer *ringBuffer = sharedAudioData->ringBuffer;
|
|
|
|
if (ringBuffer->endOfLastWrite == NULL) {
|
|
ringBuffer->endOfLastWrite = ringBuffer->buffer;
|
|
} else if (ringBuffer->diffLastWriteNextOutput() > RING_BUFFER_SIZE_SAMPLES - PACKET_LENGTH_SAMPLES) {
|
|
std::cout << "NAB: " << ringBuffer->nextOutput - ringBuffer->buffer << "\n";
|
|
std::cout << "LAW: " << ringBuffer->endOfLastWrite - ringBuffer->buffer << "\n";
|
|
std::cout << "D: " << ringBuffer->diffLastWriteNextOutput() << "\n";
|
|
std::cout << "Full\n";
|
|
|
|
// reset us to started state
|
|
ringBuffer->endOfLastWrite = ringBuffer->buffer;
|
|
ringBuffer->nextOutput = ringBuffer->buffer;
|
|
ringBuffer->started = false;
|
|
}
|
|
|
|
int16_t *copyToPointer = ringBuffer->endOfLastWrite;
|
|
|
|
// just copy the recieved data to the right spot and then add packet length to previous pointer
|
|
memcpy(copyToPointer, receivedData, PACKET_LENGTH_BYTES);
|
|
ringBuffer->endOfLastWrite += PACKET_LENGTH_SAMPLES;
|
|
|
|
if (ringBuffer->endOfLastWrite == ringBuffer->buffer + RING_BUFFER_SIZE_SAMPLES) {
|
|
ringBuffer->endOfLastWrite = ringBuffer->buffer;
|
|
}
|
|
|
|
if (LOG_SAMPLE_DELAY) {
|
|
gettimeofday(&previousReceiveTime, NULL);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Initialize portaudio and start an audio stream.
|
|
* Should be called at the beginning of program exection.
|
|
* @seealso Audio::terminate
|
|
* @return Returns true if successful or false if an error occurred.
|
|
Use Audio::getError() to retrieve the error code.
|
|
*/
|
|
Audio::Audio(Oscilloscope * s)
|
|
{
|
|
paError = Pa_Initialize();
|
|
if (paError != paNoError) goto error;
|
|
|
|
scope = s;
|
|
|
|
audioData = new AudioData(BUFFER_LENGTH_BYTES);
|
|
|
|
// setup a UDPSocket
|
|
audioData->audioSocket = new UDPSocket(AUDIO_UDP_LISTEN_PORT);
|
|
audioData->ringBuffer = new AudioRingBuffer(RING_BUFFER_SIZE_SAMPLES);
|
|
|
|
AudioRecThreadStruct threadArgs;
|
|
threadArgs.sharedAudioData = audioData;
|
|
|
|
pthread_create(&audioReceiveThread, NULL, receiveAudioViaUDP, (void *) &threadArgs);
|
|
|
|
paError = Pa_OpenDefaultStream(&stream,
|
|
2, // input channels
|
|
2, // output channels
|
|
(paInt16 | paNonInterleaved), // sample format
|
|
22050, // sample rate (hz)
|
|
512, // frames per buffer
|
|
audioCallback, // callback function
|
|
(void *) audioData); // user data to be passed to callback
|
|
if (paError != paNoError) goto error;
|
|
|
|
initialized = true;
|
|
|
|
// start the stream now that sources are good to go
|
|
Pa_StartStream(stream);
|
|
if (paError != paNoError) goto error;
|
|
|
|
return;
|
|
|
|
error:
|
|
fprintf(stderr, "-- Failed to initialize portaudio --\n");
|
|
fprintf(stderr, "PortAudio error (%d): %s\n", paError, Pa_GetErrorText(paError));
|
|
initialized = false;
|
|
delete[] audioData;
|
|
}
|
|
|
|
|
|
void Audio::getInputLoudness(float * lastLoudness, float * averageLoudness) {
|
|
*lastLoudness = audioData->lastInputLoudness;
|
|
*averageLoudness = audioData->averagedInputLoudness;
|
|
}
|
|
|
|
void Audio::render(int screenWidth, int screenHeight)
|
|
{
|
|
if (initialized && ECHO_SERVER_TEST) {
|
|
glBegin(GL_LINES);
|
|
glColor3f(1,1,1);
|
|
|
|
int startX = 50.0;
|
|
int currentX = startX;
|
|
int topY = screenHeight - 90;
|
|
int bottomY = screenHeight - 50;
|
|
float frameWidth = 50.0;
|
|
float halfY = topY + ((bottomY - topY) / 2.0);
|
|
|
|
// draw the lines for the base of the ring buffer
|
|
|
|
glVertex2f(currentX, topY);
|
|
glVertex2f(currentX, bottomY);
|
|
|
|
for (int i = 0; i < RING_BUFFER_FRAMES; i++) {
|
|
glVertex2f(currentX, halfY);
|
|
glVertex2f(currentX + frameWidth, halfY);
|
|
currentX += frameWidth;
|
|
|
|
glVertex2f(currentX, topY);
|
|
glVertex2f(currentX, bottomY);
|
|
}
|
|
glEnd();
|
|
|
|
|
|
// Show a bar with the amount of audio remaining in ring buffer beyond current playback
|
|
float remainingBuffer = 0;
|
|
timeval currentTime;
|
|
gettimeofday(¤tTime, NULL);
|
|
float timeLeftInCurrentBuffer = 0;
|
|
if (audioData->lastCallback.tv_usec > 0) timeLeftInCurrentBuffer = diffclock(&audioData->lastCallback, ¤tTime)/(1000.0*(float)BUFFER_LENGTH_SAMPLES/(float)SAMPLE_RATE) * frameWidth;
|
|
|
|
if (audioData->ringBuffer->endOfLastWrite != NULL)
|
|
remainingBuffer = audioData->ringBuffer->diffLastWriteNextOutput() / BUFFER_LENGTH_SAMPLES * frameWidth;
|
|
|
|
if (audioData->wasStarved == 0) glColor3f(0, 1, 0);
|
|
else {
|
|
glColor3f(0.5 + (float)audioData->wasStarved/20.0, 0, 0);
|
|
audioData->wasStarved--;
|
|
}
|
|
|
|
glBegin(GL_QUADS);
|
|
glVertex2f(startX, topY + 5);
|
|
glVertex2f(startX + remainingBuffer + timeLeftInCurrentBuffer, topY + 5);
|
|
glVertex2f(startX + remainingBuffer + timeLeftInCurrentBuffer, bottomY - 5);
|
|
glVertex2f(startX, bottomY - 5);
|
|
glEnd();
|
|
|
|
if (audioData->averagedLatency == 0.0) audioData->averagedLatency = remainingBuffer + timeLeftInCurrentBuffer;
|
|
else audioData->averagedLatency = 0.99*audioData->averagedLatency + 0.01*((float)remainingBuffer + (float)timeLeftInCurrentBuffer);
|
|
|
|
// Show a yellow bar with the averaged msecs latency you are hearing (from time of packet receipt)
|
|
glColor3f(1,1,0);
|
|
glBegin(GL_QUADS);
|
|
glVertex2f(startX + audioData->averagedLatency - 2, topY - 2);
|
|
glVertex2f(startX + audioData->averagedLatency + 2, topY - 2);
|
|
glVertex2f(startX + audioData->averagedLatency + 2, bottomY + 2);
|
|
glVertex2f(startX + audioData->averagedLatency - 2, bottomY + 2);
|
|
glEnd();
|
|
|
|
char out[20];
|
|
sprintf(out, "%3.0f\n", audioData->averagedLatency/(float)frameWidth*(1000.0*(float)BUFFER_LENGTH_SAMPLES/(float)SAMPLE_RATE));
|
|
drawtext(startX + audioData->averagedLatency - 10, topY-10, 0.08, 0, 1, 0, out, 1,1,0);
|
|
|
|
// Show a Cyan bar with the most recently measured jitter stdev
|
|
|
|
int jitterPels = (float) audioData->measuredJitter/ ((1000.0*(float)BUFFER_LENGTH_SAMPLES/(float)SAMPLE_RATE)) * (float)frameWidth;
|
|
|
|
glColor3f(0,1,1);
|
|
glBegin(GL_QUADS);
|
|
glVertex2f(startX + jitterPels - 2, topY - 2);
|
|
glVertex2f(startX + jitterPels + 2, topY - 2);
|
|
glVertex2f(startX + jitterPels + 2, bottomY + 2);
|
|
glVertex2f(startX + jitterPels - 2, bottomY + 2);
|
|
glEnd();
|
|
|
|
sprintf(out,"%3.1f\n", audioData->measuredJitter);
|
|
drawtext(startX + jitterPels - 5, topY-10, 0.08, 0, 1, 0, out, 0,1,1);
|
|
|
|
sprintf(out, "%3.1fms\n", JITTER_BUFFER_LENGTH_MSECS);
|
|
drawtext(startX - 10, bottomY + 20, 0.1, 0, 1, 0, out, 1, 0, 0);
|
|
|
|
sprintf(out, "%hd samples\n", JITTER_BUFFER_SAMPLES);
|
|
drawtext(startX - 10, bottomY + 35, 0.1, 0, 1, 0, out, 1, 0, 0);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Close the running audio stream, and deinitialize portaudio.
|
|
* Should be called at the end of program execution.
|
|
* @return Returns true if the initialization was successful, or false if an error occured.
|
|
The error code may be retrieved by Audio::getError().
|
|
*/
|
|
bool Audio::terminate ()
|
|
{
|
|
if (initialized) {
|
|
initialized = false;
|
|
|
|
paError = Pa_CloseStream(stream);
|
|
if (paError != paNoError) goto error;
|
|
|
|
paError = Pa_Terminate();
|
|
if (paError != paNoError) goto error;
|
|
|
|
delete audioData;
|
|
|
|
logFile.close();
|
|
}
|
|
|
|
stopAudioReceiveThread = true;
|
|
pthread_join(audioReceiveThread, NULL);
|
|
|
|
return true;
|
|
|
|
error:
|
|
fprintf(stderr, "-- portaudio termination error --\n");
|
|
fprintf(stderr, "PortAudio error (%d): %s\n", paError, Pa_GetErrorText(paError));
|
|
return false;
|
|
}
|
|
|