PortAudioからwebrtc :: AudioProcessingへの入力ストリームの入力

私はwebrtcのAudioProcessingクラスの実装にlibwebrtc-audio-processing-devel-0.3-1というcygwinパッケージを使用しています。PortAudioからwebrtc :: AudioProcessingへの入力ストリームの入力

PortAudioを使用してマイクから入力を読み取っていて、これをVADチェックのためにwebrtcに渡したいのですが、データをProcessStreamメソッドに渡す方法がわかりません。ここで

#define SAMPLE_RATE  (32000) 
#define FRAMES_PER_BUFFER (320) 
#define PA_SAMPLE_TYPE paFloat32 
#define SAMPLE_SIZE (4) 

... 

err = Pa_ReadStream(stream, sampleBlock, FRAMES_PER_BUFFER); 

// sampleBlock should now point to 320 32 bit floats 

.... 
apm->ProcessStream(<What goes here?>)

私はそうのような第一の方法についてAudioFrameをインスタンス化しようとするとProcessStream definitions

です：

AudioFrame frame;

は、私は次のエラーを取得する：

main.cpp:161:22: error: aggregate ‘webrtc::AudioFrame frame’ has incomplete type and cannot be defined 
    webrtc::AudioFrame frame;

2番目と3番目のメソッドは、データが "const float * const * s rc "とする。定数フロートポインタへの定数ポインタが必要なのですか？これは少し混乱しています。

次の完全な例もavailable on Pastebinで、デフォルトの入力デバイスから入力を取得し、ProcessStreamコール用にwebrtcを準備します。コールでの私の試行は、セグメンテーションの結果として含まれ、コメントアウトされています。

コードにはPortAudioとlibwebrtc-audio-processing-devel-0.3.1が必要です。は、私は、以下のものを使用してcygwinの上でコンパイル：

g++ main_example.cpp -o main -L./ -lcygportaudio-2 -lrt -lm -pthread -I/usr/include/webrtc_audio_processing/ -DWEBRTC_WIN -std=gnu++11 -L/bin/ -lcygwebrtc_audio_processing-1

#include <stdio.h> 
#include <stdlib.h> 
#include <string.h> 
#include "portaudio.h" 
#include <sys/time.h> 
#include <windows.h> 
#include <windowsx.h> 
#include <unistd.h> 

#include "webrtc/modules/audio_processing/include/audio_processing.h" 
using webrtc::AudioProcessing; 
using webrtc::AudioFrame; 
using webrtc::GainControl; 
using webrtc::NoiseSuppression; 
using webrtc::EchoCancellation; 
using webrtc::VoiceDetection; 


#define SAMPLE_RATE  (32000) 
#define FRAMES_PER_BUFFER (320) 
#define DITHER_FLAG   (0) 

#define PA_SAMPLE_TYPE paFloat32 
#define SAMPLE_SIZE (4) 
#define SAMPLE_SILENCE (0) 
#define PRINTF_S_FORMAT "%8f" 

/*******************************************************************/ 
int main(int argc, char **argv); 
/* error handling */ 
int xrun(PaStream *stream, int err, char* sampleBlock); 
void error1(PaStream *stream, char* sampleBlock); 
void error2(PaStream *stream, int err); 
int main (int argc, char **argv) 
{ 

    PaStreamParameters inputParameters; 
    PaStream *stream = NULL; 
    PaError err; 
    const PaDeviceInfo* inputInfo; 
    char *sampleBlock = NULL; 
    int i; 
    int numBytes; 
    int numChannels; 

    err = Pa_Initialize(); 
    if(err != paNoError) error2(stream, err); 

    inputParameters.device = Pa_GetDefaultInputDevice(); /* default input device */ 
    inputInfo = Pa_GetDeviceInfo(inputParameters.device); 
    numChannels = inputInfo->maxInputChannels; 
    inputParameters.channelCount = 1;// numChannels; 
    inputParameters.sampleFormat = PA_SAMPLE_TYPE; 
    inputParameters.suggestedLatency = inputInfo->defaultHighInputLatency ; 
    inputParameters.hostApiSpecificStreamInfo = NULL; 
    printf("Input device # %d.\n", inputParameters.device); 
    printf(" Name: %s\n", inputInfo->name); 

    /* -- setup -- */ 

    err = Pa_OpenStream(
       &stream, 
       &inputParameters, 
       NULL, 
       SAMPLE_RATE, 
       FRAMES_PER_BUFFER, 
       paClipOff,  /* we won't output out of range samples so don't bother clipping them */ 
       NULL, /* no callback, use blocking API */ 
       NULL); /* no callback, so no callback userData */ 
    if(err != paNoError) error2(stream, err); 

    numBytes = FRAMES_PER_BUFFER * numChannels * SAMPLE_SIZE ; 
    sampleBlock = (char *) malloc(numBytes); 
    if(sampleBlock == NULL) 
    { 
     printf("Could not allocate record array.\n"); 
     error1(stream, sampleBlock); 
    } 

    err = Pa_StartStream(stream); 
    if(err != paNoError) error1(stream, sampleBlock); 

     // Configure webrtc::audioprocessing 
     AudioProcessing* apm = AudioProcessing::Create(); 

     apm->high_pass_filter()->Enable(true); 

     apm->echo_cancellation()->enable_drift_compensation(false); 
     apm->echo_cancellation()->Enable(true); 

     apm->noise_suppression()->set_level(apm->noise_suppression()->kHigh); 
     apm->noise_suppression()->Enable(true); 

     apm->gain_control()->set_analog_level_limits(0, 255); 
     apm->gain_control()->set_mode(apm->gain_control()->kAdaptiveAnalog); 
     apm->gain_control()->Enable(true); 

     apm->voice_detection()->Enable(true); 

     int analog_level = apm->gain_control()->stream_analog_level(); 
     int delay_ms = 20; 
     int voiceDetected = 0; 


    long int holdTime = 600; //milliseconds 
    int prevVoiceDetected = -1; 
    int holding = 0; 
    int transmitting = 0; 
    int prevTransmitting = -1; 
    struct timeval startHoldTime, currentTime, elapsedHoldTime; 

     while (1) { 
       // Read in input frames 
     err = Pa_ReadStream(stream, sampleBlock, FRAMES_PER_BUFFER); 
     if(err) xrun(stream, err, sampleBlock); 

       // Run webrtc vad 
       apm->set_stream_delay_ms(delay_ms); 
       apm->gain_control()->set_stream_analog_level(analog_level); 

       /* 
       // A apm->ProcessStream call is required here. The one I've tried here seg faults, probably due to those casts I don't understand 
       webrtc::StreamConfig inputConfig = webrtc::StreamConfig(SAMPLE_RATE, numChannels, false); 
       webrtc::StreamConfig outputConfig = webrtc::StreamConfig(SAMPLE_RATE, numChannels, false); 
       apm->ProcessStream((const float* const*)sampleBlock, inputConfig, outputConfig, (float* const*)sampleBlock); 
       */ 


       analog_level = apm->gain_control()->stream_analog_level(); 
       voiceDetected = apm->voice_detection()->stream_has_voice(); 

       transmitting = 0; 
       if (voiceDetected) { 
         transmitting = 1; 
         holding = 0; 
       } else if (holding) { 
         gettimeofday (&currentTime, NULL); 
         long elapsedHoldTime = (((currentTime.tv_sec - startHoldTime.tv_sec)*1000000L+currentTime.tv_usec) - startHoldTime.tv_usec)/1000; 
         //printf("elapsedtime: %d\n", elapsedHoldTime); fflush(stdout); 
         if (elapsedHoldTime > holdTime) { 
           //printf("completedhold\n"); fflush(stdout); 
           holding = 0; 
         } else { 
           //printf("holding\n"); fflush(stdout); 
           transmitting = 1; 
         } 
       } else if (prevVoiceDetected) { 
         holding = 1; 
         gettimeofday (&startHoldTime, NULL); 
         transmitting = 1; 
       } 
       prevVoiceDetected = voiceDetected; 

       if (prevTransmitting != transmitting) { 
         printf("Transmitting: %s\n", (transmitting) ? "true" : "false"); fflush(stdout); 
       } 
       prevTransmitting = transmitting; 
    } 
    printf("Wire off.\n"); fflush(stdout); 

    err = Pa_StopStream(stream); 
    if(err != paNoError) error1(stream, sampleBlock); 

    free(sampleBlock); 

    Pa_Terminate(); 
    return 0; 

} 

int xrun(PaStream *stream, int err, char* sampleBlock) { 
    printf("err = %d\n", err); fflush(stdout); 
    if(stream) { 
     Pa_AbortStream(stream); 
     Pa_CloseStream(stream); 
    } 
    free(sampleBlock); 
    Pa_Terminate(); 
    if(err & paInputOverflow) 
     fprintf(stderr, "Input Overflow.\n"); 
    if(err & paOutputUnderflow) 
     fprintf(stderr, "Output Underflow.\n"); 
    return -2; 
} 

void error1(PaStream *stream, char* sampleBlock) { 
    free(sampleBlock); 
    exit(-1); 
} 
void error2(PaStream *stream, int err) { 
    if(stream) { 
     Pa_AbortStream(stream); 
     Pa_CloseStream(stream); 
    } 
    Pa_Terminate(); 
    fprintf(stderr, "An error occured while using the portaudio stream\n"); 
    fprintf(stderr, "Error number: %d\n", err); 
    fprintf(stderr, "Error message: %s\n", Pa_GetErrorText(err)); 
    exit(-1); 
}

出典

2017-03-05 Modf

は**再現可能な例がない**として閉じるように投票しました。 –

@ cheers-and-hth-alfを実行できる例で更新しました – Modf

良いですが、私はクローズ投票を取り下げ、コードを質問に貼り付けました（質問自体にある必要があります）。あなたはキャストを疑う権利があると思います。キャストを使用するためにクライアントコードを要求するようにAPIを設計するのは妥当ではありません。 –

私は個人的に@matzeri連絡し、彼は正しい方向に私を指摘gstreamerの中working example、に私を指摘しました。 module_common_types.hをインクルードし、WEBRTC_AUDIO_RPOCESSING_ONLY_BUILDディレクティブを追加し、cygwinのwebrtc/common_types.hの文字列比較関数の定義を修正することで、AudioFrameを定義して対応するProcessStream呼び出しを使用することができました。

ここでは、VADとPortAudioのcygwinでlibwebrtc-audio-processing-devel-0.3-1を使用した例を示します。

注：

g++ main.cpp -o main -L./ -lcygportaudio-2 -lrt -lm -pthread -L./cygspeexdsp-1 -I/usr/include/webrtc_audio_processing/ -DWEBRTC_WIN -DWEBRTC_AUDIO_PROCESSING_ONLY_BUILD -std=gnu++11 -L/bin/ -lcygwebrtc_audio_processing-1

：それは次の定義の代わりに、Win32のバージョン

#define STR_CASE_CMP(s1, s2) ::strcasecmp(s1, s2) 
#define STR_NCASE_CMP(s1, s2, n) ::strncasecmp(s1, s2, n)

main.cppに

#include <stdio.h> 
#include <stdlib.h> 
#include <string.h> 
#include "portaudio.h" 
#include <sys/time.h> 
#include <windows.h> 
#include <windowsx.h> 
#include <unistd.h> 

#include "webrtc/modules/audio_processing/include/audio_processing.h" 
#include "webrtc/modules/interface/module_common_types.h" 
#include "webrtc/system_wrappers/include/trace.h" 
using webrtc::AudioProcessing; 
using webrtc::AudioFrame; 
using webrtc::GainControl; 
using webrtc::NoiseSuppression; 
using webrtc::EchoCancellation; 
using webrtc::VoiceDetection; 


#define SAMPLE_RATE  (32000) 
#define FRAMES_PER_BUFFER (320) 
#define DITHER_FLAG   (0) 

#define PA_SAMPLE_TYPE paInt16 
#define SAMPLE_SIZE (2) 
#define SAMPLE_SILENCE (0) 
#define PRINTF_S_FORMAT "%d" 

/*******************************************************************/ 
int main(int argc, char **argv); 
/* error handling */ 
int xrun(PaStream *stream, int err, char* sampleBlock); 
void error1(PaStream *stream, char* sampleBlock); 
void error2(PaStream *stream, int err); 
int main (int argc, char **argv) 
{ 

    PaStreamParameters inputParameters; 
    PaStream *stream = NULL; 
    PaError err; 
    const PaDeviceInfo* inputInfo; 
    char *sampleBlock = NULL; 
    int i; 
    int numBytes; 
    int numChannels; 

    err = Pa_Initialize(); 
    if(err != paNoError) error2(stream, err); 

    inputParameters.device = Pa_GetDefaultInputDevice(); /* default input device */ 
    inputInfo = Pa_GetDeviceInfo(inputParameters.device); 
    numChannels = inputInfo->maxInputChannels; 
    inputParameters.channelCount = 1;// numChannels; 
    inputParameters.sampleFormat = PA_SAMPLE_TYPE; 
    inputParameters.suggestedLatency = inputInfo->defaultHighInputLatency ; 
    inputParameters.hostApiSpecificStreamInfo = NULL; 
    printf("Input device # %d.\n", inputParameters.device); 
    printf(" Name: %s\n", inputInfo->name); 

    /* -- setup -- */ 

    err = Pa_OpenStream(
       &stream, 
       &inputParameters, 
       NULL, 
       SAMPLE_RATE, 
       FRAMES_PER_BUFFER, 
       paClipOff,  /* we won't output out of range samples so don't bother clipping them */ 
       NULL, /* no callback, use blocking API */ 
       NULL); /* no callback, so no callback userData */ 
    if(err != paNoError) error2(stream, err); 

    numBytes = FRAMES_PER_BUFFER * numChannels * SAMPLE_SIZE ; 
    sampleBlock = (char *) malloc(numBytes); 
    if(sampleBlock == NULL) 
    { 
     printf("Could not allocate record array.\n"); 
     error1(stream, sampleBlock); 
    } 

    err = Pa_StartStream(stream); 
    if(err != paNoError) error1(stream, sampleBlock); 

     // Configure webrtc::audioprocessing 
     AudioProcessing* apm = AudioProcessing::Create(); 

     apm->high_pass_filter()->Enable(true); 

     apm->echo_cancellation()->enable_drift_compensation(false); 
     apm->echo_cancellation()->Enable(true); 

     apm->noise_suppression()->set_level(apm->noise_suppression()->kHigh); 
     apm->noise_suppression()->Enable(true); 

     apm->gain_control()->set_analog_level_limits(0, 255); 
     apm->gain_control()->set_mode(apm->gain_control()->kAdaptiveAnalog); 
     apm->gain_control()->Enable(true); 

     apm->voice_detection()->Enable(true); 

     int analog_level = apm->gain_control()->stream_analog_level(); 
     int delay_ms = 20; 
     int voiceDetected = 0; 


    long int holdTime = 600; //milliseconds 
    int prevVoiceDetected = -1; 
    int holding = 0; 
    int transmitting = 0; 
    int prevTransmitting = -1; 
    struct timeval startHoldTime, currentTime, elapsedHoldTime; 
     int webrtcErr = 0; 

     while (1) { 
       // Read in input frames 
     err = Pa_ReadStream(stream, sampleBlock, FRAMES_PER_BUFFER); 
     if(err) xrun(stream, err, sampleBlock); 

       // Run webrtc vad 
       apm->set_stream_delay_ms(delay_ms); 
       apm->gain_control()->set_stream_analog_level(analog_level); 

       webrtc::AudioFrame frame; 
       frame.num_channels_ = numChannels; 
       frame.sample_rate_hz_ = SAMPLE_RATE; 
       frame.samples_per_channel_ = FRAMES_PER_BUFFER; 
       memcpy(frame.data_, sampleBlock, numBytes); 

       if ((webrtcErr = apm->ProcessStream(&frame)) < 0) { 
         printf("Error Code: %d\n", webrtcErr); fflush(stdout); 
         return -1; 
       } 

       analog_level = apm->gain_control()->stream_analog_level(); 
       voiceDetected = apm->voice_detection()->stream_has_voice(); 

       transmitting = 0; 
       if (voiceDetected) { 
         transmitting = 1; 
         holding = 0; 
       } else if (holding) { 
         gettimeofday (&currentTime, NULL); 
         long elapsedHoldTime = (((currentTime.tv_sec - startHoldTime.tv_sec)*1000000L+currentTime.tv_usec) - startHoldTime.tv_usec)/1000; 
         //printf("elapsedtime: %d\n", elapsedHoldTime); fflush(stdout); 
         if (elapsedHoldTime > holdTime) { 
           //printf("completedhold\n"); fflush(stdout); 
           holding = 0; 
         } else { 
           //printf("holding\n"); fflush(stdout); 
           transmitting = 1; 
         } 
       } else if (prevVoiceDetected) { 
         holding = 1; 
         gettimeofday (&startHoldTime, NULL); 
         transmitting = 1; 
       } 
       prevVoiceDetected = voiceDetected; 

       if (prevTransmitting != transmitting) { 
         printf("Transmitting: %s\n", (transmitting) ? "true" : "false"); fflush(stdout); 
       } 
       prevTransmitting = transmitting; 
    } 
    printf("Wire off.\n"); fflush(stdout); 

    err = Pa_StopStream(stream); 
    if(err != paNoError) error1(stream, sampleBlock); 

    free(sampleBlock); 

    Pa_Terminate(); 
    return 0; 

} 

int xrun(PaStream *stream, int err, char* sampleBlock) { 
    printf("err = %d\n", err); fflush(stdout); 
    if(stream) { 
     Pa_AbortStream(stream); 
     Pa_CloseStream(stream); 
    } 
    free(sampleBlock); 
    Pa_Terminate(); 
    if(err & paInputOverflow) 
     fprintf(stderr, "Input Overflow.\n"); 
    if(err & paOutputUnderflow) 
     fprintf(stderr, "Output Underflow.\n"); 
    return -2; 
} 

void error1(PaStream *stream, char* sampleBlock) { 
    free(sampleBlock); 
    exit(-1); 
} 
void error2(PaStream *stream, int err) { 
    if(stream) { 
     Pa_AbortStream(stream); 
     Pa_CloseStream(stream); 
    } 
    Pa_Terminate(); 
    fprintf(stderr, "An error occured while using the portaudio stream\n"); 
    fprintf(stderr, "Error number: %d\n", err); 
    fprintf(stderr, "Error message: %s\n", Pa_GetErrorText(err)); 
    exit(-1); 
}

コンパイルを適用するので、私はのWebRTC/common_types.hを変更する場合は、必要に応じ

出典

2017-03-08 15:24:03 Modf

PortAudioからwebrtc :: AudioProcessingへの入力ストリームの入力

答えて

関連する問題