基于WASAPI的音频捕获和音频播放，注意“禁用前面板插孔检测”。

http://blog.csdn.net/XscKernel/article/details/52204853#cpp
参照该博主的文章，再次感谢。

需要安装 Windows SDK，链接时还要用到 ksuser 和 Ole32 两个库。

写回答
好问题 0 提建议
关注问题
分享
邀请回答
编辑收藏删除结题
收藏举报

2条回答默认最新

huo821894237 2017-03-31 07:02

关注

录音：

 #include <mmdeviceapi.h>
#include <Audioclient.h>
#include <windows.h>
#include <stdio.h>
#include <string.h>

// Scale factors for REFERENCE_TIME values: ticks per second and per millisecond
// (the values imply 100 ns ticks). In this recording program they are only
// referenced from a commented-out line inside RecordAudioStream().
#define REFTIMES_PER_SEC        10000000
#define REFTIMES_PER_MILLISEC   10000

// Jumps to the label `Exit` when FAILED(hres) is true. It expands to a bare
// `if` statement, so it can only be used inside a function that defines `Exit`.
#define EXIT_ON_ERROR(hres)  \
    if (FAILED(hres)) { goto Exit; }

// Calls Release() on `punk` if it is not NULL, then resets it to NULL.
#define SAFE_RELEASE(punk)  \
    if ((punk) != NULL) { (punk)->Release(); (punk) = NULL; }

// Class and interface identifiers handed to CoCreateInstance(),
// IMMDevice::Activate() and IAudioClient::GetService() in RecordAudioStream().
const CLSID CLSID_MMDeviceEnumerator    = __uuidof(MMDeviceEnumerator);
const IID IID_IMMDeviceEnumerator       = __uuidof(IMMDeviceEnumerator);
const IID IID_IAudioClient              = __uuidof(IAudioClient);
const IID IID_IAudioCaptureClient       = __uuidof(IAudioCaptureClient);

// Output file for the captured audio bytes. main() opens it ("foobar", "wb")
// and closes it; MyAudioSink::CopyData() writes to it.
FILE *fp = NULL;

// Consumer of the audio captured by RecordAudioStream().
class MyAudioSink {
public:
    // Called by RecordAudioStream() with the stream format before the stream
    // is started. The return value is assigned to an HRESULT by the caller and
    // tested with FAILED().
    int SetFormat(WAVEFORMATEX *pwfx);
    // Called by RecordAudioStream() for every captured packet. NOTE: despite
    // its name, the caller passes a BYTE count (frames * nBlockAlign) as
    // `numFramesAvailable`. `pbDone` points at the caller's loop-termination
    // flag; the capture loop runs until it becomes non-FALSE.
    int CopyData(char *pData, UINT32 numFramesAvailable, BOOL *pbDone);
};

// Dumps the key fields of the capture format to "capture_format.txt".
//
// The dump is a diagnostic aid only, so it is best-effort: if `pwfx` is NULL or
// the file cannot be created, a message is reported where possible and the
// function still returns 0 so that the capture itself is not aborted.
//
// pwfx    - format that will be used for the capture stream; may be NULL.
// returns - always 0 (the caller treats the value as an HRESULT).
int MyAudioSink::SetFormat(WAVEFORMATEX *pwfx)
{
    if (pwfx == NULL)
        return 0;

    // Use a distinct local name so the global `fp` (the audio data file) is
    // not shadowed.
    FILE *formatFile = fopen("capture_format.txt", "w");
    if (formatFile == NULL)
    {
        perror("capture_format.txt");
        return 0;
    }

    // Format straight into the stream instead of a fixed 128-byte buffer that
    // worst-case field values could overflow.
    fprintf(formatFile, "wFormatTag \t\tis %x\nnChannels \t\tis %d\nnSamplesPerSec \tis %ld\nnAvgBytesPerSec is %ld\nwBitsPerSample \tis %d",
            pwfx->wFormatTag, pwfx->nChannels, pwfx->nSamplesPerSec, pwfx->nAvgBytesPerSec, pwfx->wBitsPerSample);
    fclose(formatFile);
    return 0;
}

int MyAudioSink::CopyData(char *pData, UINT32 numFramesAvailable, BOOL *pbDone)
{
    if(pData != NULL)
        fwrite(pData, numFramesAvailable, 1, fp);
    return 0;
}

// pwfx->nSamplesPerSec = 44100;
// Rewrites `*pwfx` in place so that it describes 16-bit integer PCM with the
// same channel count and sample rate.
//
// Supported inputs:
//   - WAVE_FORMAT_IEEE_FLOAT: the tag is changed to WAVE_FORMAT_PCM.
//   - WAVE_FORMAT_EXTENSIBLE with an IEEE-float or PCM sub-format: the
//     sub-format becomes PCM and wValidBitsPerSample becomes 16, so it can
//     never exceed the new 16-bit container size.
// Any other format (including an extensible format with an unknown
// sub-format, or a NULL pointer) is left untouched.
//
// returns - TRUE if the format was rewritten, FALSE if it was left unchanged.
BOOL AdjustFormatTo16Bits(WAVEFORMATEX *pwfx)
{
    if (pwfx == NULL)
        return FALSE;

    if (pwfx->wFormatTag == WAVE_FORMAT_IEEE_FLOAT)
    {
        pwfx->wFormatTag = WAVE_FORMAT_PCM;
    }
    else if (pwfx->wFormatTag == WAVE_FORMAT_EXTENSIBLE)
    {
        PWAVEFORMATEXTENSIBLE pEx = reinterpret_cast<PWAVEFORMATEXTENSIBLE>(pwfx);
        if (IsEqualGUID(KSDATAFORMAT_SUBTYPE_IEEE_FLOAT, pEx->SubFormat))
            pEx->SubFormat = KSDATAFORMAT_SUBTYPE_PCM;
        else if (!IsEqualGUID(KSDATAFORMAT_SUBTYPE_PCM, pEx->SubFormat))
            return FALSE;   // not sample data we know how to reinterpret

        // Must be updated for the PCM case too: the valid-bit count may not be
        // larger than the container size set below.
        pEx->Samples.wValidBitsPerSample = 16;
    }
    else
    {
        return FALSE;
    }

    // Recompute the derived fields for the 16-bit container.
    pwfx->wBitsPerSample = 16;
    pwfx->nBlockAlign = pwfx->nChannels * pwfx->wBitsPerSample / 8;
    pwfx->nAvgBytesPerSec = pwfx->nBlockAlign * pwfx->nSamplesPerSec;
    return TRUE;
}

// Converts the calling thread's last Win32 error into a failing HRESULT.
// Falls back to E_FAIL when GetLastError() reports no error, so the result
// always satisfies FAILED().
static HRESULT LastErrorAsFailure()
{
    HRESULT hrLast = HRESULT_FROM_WIN32(GetLastError());
    return FAILED(hrLast) ? hrLast : E_FAIL;
}

// Captures what the default render endpoint is playing (shared-mode loopback)
// and feeds it to `pMySink`.
//
// Sequence: create the device enumerator, activate an IAudioClient on the
// default eRender/eConsole endpoint, adjust the mix format with
// AdjustFormatTo16Bits(), initialise the client with
// AUDCLNT_STREAMFLAGS_LOOPBACK, then poll the capture client on a periodic
// waitable timer (half the default device period) until the sink sets its
// done flag or a call fails.
//
// COM must already be initialised on the calling thread.
//
// pMySink - receives the format (SetFormat) and every packet (CopyData, with a
//           byte count of frames * nBlockAlign). Must not be NULL.
// returns - E_POINTER for a NULL sink, otherwise the HRESULT of the first
//           failing call, or the result of IAudioClient::Stop() on a normal
//           finish.
HRESULT RecordAudioStream(MyAudioSink *pMySink)
{
    // Every local is declared (and initialised) before the first `goto Exit`
    // so that no jump crosses an initialisation.
    HRESULT         hr                      = S_OK;
    HRESULT         hrRelease               = S_OK;
    UINT32          bufferFrameCount        = 0;
    UINT32          numFramesAvailable      = 0;
    BYTE *          pData                   = NULL;
    DWORD           flags                   = 0;
    DWORD           waitResult              = 0;
    REFERENCE_TIME  hnsDefaultDevicePeriod(0);

    IMMDeviceEnumerator *   pEnumerator             = NULL;
    IMMDevice *             pDevice                 = NULL;
    IAudioClient *          pAudioClient            = NULL;
    IAudioCaptureClient *   pCaptureClient          = NULL;
    WAVEFORMATEX *          pwfx                    = NULL;
    UINT32                  packetLength            = 0;
    BOOL                    bDone                   = FALSE;
    BOOL                    bStarted                = FALSE;
    HANDLE                  hTimerWakeUp            = NULL;
    HANDLE                  waitArray[1]            = { NULL };
    LARGE_INTEGER           liFirstFire;
    LONG                    lTimeBetweenFires       = 0;

    if (pMySink == NULL)
        return E_POINTER;

    hr = CoCreateInstance(CLSID_MMDeviceEnumerator, NULL, CLSCTX_ALL, IID_IMMDeviceEnumerator, (void**)&pEnumerator);
    EXIT_ON_ERROR(hr)

    // Loopback capture is opened on the RENDER endpoint.
    hr = pEnumerator->GetDefaultAudioEndpoint(eRender, eConsole, &pDevice);
    EXIT_ON_ERROR(hr)

    hr = pDevice->Activate(IID_IAudioClient, CLSCTX_ALL, NULL, (void**)&pAudioClient);
    EXIT_ON_ERROR(hr)

    hr = pAudioClient->GetDevicePeriod(&hnsDefaultDevicePeriod, NULL);
    EXIT_ON_ERROR(hr)

    hr = pAudioClient->GetMixFormat(&pwfx);
    EXIT_ON_ERROR(hr)

    // Best effort: if the format cannot be adjusted it is used unchanged.
    AdjustFormatTo16Bits(pwfx);

    hTimerWakeUp = CreateWaitableTimer(NULL, FALSE, NULL);
    if (hTimerWakeUp == NULL)
    {
        hr = LastErrorAsFailure();
        goto Exit;
    }
    waitArray[0] = hTimerWakeUp;

    hr = pAudioClient->Initialize(AUDCLNT_SHAREMODE_SHARED, AUDCLNT_STREAMFLAGS_LOOPBACK, 0, 0, pwfx, NULL);
    EXIT_ON_ERROR(hr)

    // Get the size of the allocated buffer (also confirms the client is usable).
    hr = pAudioClient->GetBufferSize(&bufferFrameCount);
    EXIT_ON_ERROR(hr)

    hr = pAudioClient->GetService(IID_IAudioCaptureClient, (void**)&pCaptureClient);
    EXIT_ON_ERROR(hr)

    // Wake up twice per device period. A negative due time is relative.
    liFirstFire.QuadPart = -hnsDefaultDevicePeriod / 2;
    lTimeBetweenFires = (LONG)(hnsDefaultDevicePeriod / 2 / REFTIMES_PER_MILLISEC);
    if (lTimeBetweenFires < 1)
        lTimeBetweenFires = 1;  // a period of 0 would make the timer fire only once

    if (!SetWaitableTimer(hTimerWakeUp, &liFirstFire, lTimeBetweenFires, NULL, NULL, FALSE))
    {
        hr = LastErrorAsFailure();
        goto Exit;
    }

    // Notify the audio sink which format to use.
    hr = pMySink->SetFormat(pwfx);
    EXIT_ON_ERROR(hr)

    hr = pAudioClient->Start();  // Start recording.
    EXIT_ON_ERROR(hr)
    bStarted = TRUE;

    while (bDone == FALSE)
    {
        waitResult = WaitForMultipleObjects(sizeof(waitArray) / sizeof(waitArray[0]), waitArray, FALSE, INFINITE);
        if (waitResult != WAIT_OBJECT_0)
        {
            hr = LastErrorAsFailure();
            goto Exit;
        }

        hr = pCaptureClient->GetNextPacketSize(&packetLength);
        EXIT_ON_ERROR(hr)

        while (packetLength != 0)
        {
            // Get the available data in the shared buffer.
            // NOTE(review): `flags` (e.g. AUDCLNT_BUFFERFLAGS_SILENT) is not
            // forwarded to the sink; the packet bytes are written as delivered.
            hr = pCaptureClient->GetBuffer(&pData, &numFramesAvailable, &flags, NULL, NULL);
            EXIT_ON_ERROR(hr)

            // Copy the available capture data to the audio sink (byte count).
            hr = pMySink->CopyData((char *)pData, numFramesAvailable * pwfx->nBlockAlign, &bDone);

            // Always hand the packet back, even if the sink failed.
            hrRelease = pCaptureClient->ReleaseBuffer(numFramesAvailable);
            EXIT_ON_ERROR(hr)
            hr = hrRelease;
            EXIT_ON_ERROR(hr)

            hr = pCaptureClient->GetNextPacketSize(&packetLength);
            EXIT_ON_ERROR(hr)
        }
    }

    hr = pAudioClient->Stop();  // Stop recording.
    bStarted = FALSE;

Exit:
    // On an error path the stream may still be running; stop it without
    // overwriting the HRESULT that describes the original failure.
    if (bStarted && pAudioClient != NULL)
        pAudioClient->Stop();

    if (hTimerWakeUp != NULL)
    {
        CancelWaitableTimer(hTimerWakeUp);
        CloseHandle(hTimerWakeUp);
        hTimerWakeUp = NULL;
    }

    CoTaskMemFree(pwfx);
    SAFE_RELEASE(pEnumerator)
    SAFE_RELEASE(pDevice)
    SAFE_RELEASE(pAudioClient)
    SAFE_RELEASE(pCaptureClient)

    return hr;
}

int main()
{
    fp = fopen("foobar","wb");
    MyAudioSink test;

    CoInitialize(NULL);
    RecordAudioStream(&test);
    CoUninitialize();

    fclose(fp);
    return 0;
}

播放：

 #include <mmdeviceapi.h>
#include <Audioclient.h>
#include <windows.h>
#include <stdio.h>
#include <string.h>

// Scale factors for REFERENCE_TIME values: ticks per second and per millisecond
// (the values imply 100 ns ticks). PlayAudioStream() requests a buffer of
// REFTIMES_PER_SEC and divides by REFTIMES_PER_MILLISEC to get Sleep() times.
#define REFTIMES_PER_SEC        10000000
#define REFTIMES_PER_MILLISEC   10000

// Jumps to the label `Exit` when FAILED(hres) is true. It expands to a bare
// `if` statement, so it can only be used inside a function that defines `Exit`.
#define EXIT_ON_ERROR(hres)  \
    if (FAILED(hres)) { goto Exit; }

// Calls Release() on `punk` if it is not NULL, then resets it to NULL.
#define SAFE_RELEASE(punk)  \
    if ((punk) != NULL) { (punk)->Release(); (punk) = NULL; }

// Class and interface identifiers handed to CoCreateInstance(),
// IMMDevice::Activate() and IAudioClient::GetService() in PlayAudioStream().
const CLSID CLSID_MMDeviceEnumerator    = __uuidof(MMDeviceEnumerator);
const IID IID_IMMDeviceEnumerator       = __uuidof(IMMDeviceEnumerator);
const IID IID_IAudioClient              = __uuidof(IAudioClient);
const IID IID_IAudioRenderClient        = __uuidof(IAudioRenderClient);

// Input file holding the raw audio bytes to play. main() opens it
// ("foobar", "rb") and closes it; MyAudioSource::LoadData() reads from it.
FILE *fp = NULL;

// Producer of the audio rendered by PlayAudioStream().
class MyAudioSource {
public:
    // Called by PlayAudioStream() with the stream format after the audio
    // client has been initialised. The return value is assigned to an HRESULT
    // by the caller and tested with FAILED().
    int SetFormat(WAVEFORMATEX *pwfx);
    // Called by PlayAudioStream() to fill `pData`. NOTE: despite its name, the
    // caller passes a BYTE count (frames * nBlockAlign) as
    // `numFramesAvailable`. `pbDone` points at the caller's buffer flags; the
    // playback loop ends once it equals AUDCLNT_BUFFERFLAGS_SILENT.
    int LoadData(UINT32 numFramesAvailable, char *pData, DWORD *pbDone);
};

// Dumps the key fields of the render format to "render_format.txt".
//
// The dump is a diagnostic aid only, so it is best-effort: if `pwfx` is NULL or
// the file cannot be created, a message is reported where possible and the
// function still returns 0 so that playback itself is not aborted.
//
// pwfx    - format that will be used for the render stream; may be NULL.
// returns - always 0 (the caller treats the value as an HRESULT).
int MyAudioSource::SetFormat(WAVEFORMATEX *pwfx)
{
    if (pwfx == NULL)
        return 0;

    // Use a distinct local name so the global `fp` (the audio data file) is
    // not shadowed.
    FILE *formatFile = fopen("render_format.txt", "w");
    if (formatFile == NULL)
    {
        perror("render_format.txt");
        return 0;
    }

    // Format straight into the stream instead of a fixed 128-byte buffer that
    // worst-case field values could overflow.
    fprintf(formatFile, "wFormatTag \t\tis %x\nnChannels \t\tis %d\nnSamplesPerSec \tis %ld\nnAvgBytesPerSec is %ld\nwBitsPerSample \tis %d",
            pwfx->wFormatTag, pwfx->nChannels, pwfx->nSamplesPerSec, pwfx->nAvgBytesPerSec, pwfx->wBitsPerSample);
    fclose(formatFile);
    return 0;
}

// Fills a render buffer with the next bytes from the global input file `fp`.
//
// numFramesAvailable - number of BYTES to fill (the caller passes
//                      frames * nBlockAlign, despite the parameter name).
// pData              - destination buffer of at least that many bytes.
// pbDone             - set to AUDCLNT_BUFFERFLAGS_SILENT once no more data can
//                      be read; otherwise left unchanged.
// returns            - always 0.
//
// A request for 0 bytes is a no-op: it says nothing about the end of the file,
// so it must not end playback. When fewer bytes than requested are read (the
// last chunk of the file), the rest of the buffer is zero-filled so that no
// uninitialised memory is played.
int MyAudioSource::LoadData(UINT32 numFramesAvailable, char *pData, DWORD *pbDone)
{
    if (pData == NULL || numFramesAvailable == 0)
        return 0;

    size_t bytesRead = 0;
    if (fp != NULL)
        bytesRead = fread(pData, 1, numFramesAvailable, fp);
    printf("fread returns %d\n", static_cast<int>(bytesRead));

    if (bytesRead < numFramesAvailable)
        memset(pData + bytesRead, 0, numFramesAvailable - bytesRead);

    if (0 == bytesRead && pbDone != NULL)
        *pbDone = AUDCLNT_BUFFERFLAGS_SILENT;
    return 0;
}

// Rewrites `*pwfx` in place so that it describes 16-bit integer PCM with the
// same channel count and sample rate.
//
// Supported inputs:
//   - WAVE_FORMAT_IEEE_FLOAT: the tag is changed to WAVE_FORMAT_PCM.
//   - WAVE_FORMAT_EXTENSIBLE with an IEEE-float or PCM sub-format: the
//     sub-format becomes PCM and wValidBitsPerSample becomes 16, so it can
//     never exceed the new 16-bit container size.
// Any other format (including an extensible format with an unknown
// sub-format, or a NULL pointer) is left untouched.
//
// returns - TRUE if the format was rewritten, FALSE if it was left unchanged.
BOOL AdjustFormatTo16Bits(WAVEFORMATEX *pwfx)
{
    if (pwfx == NULL)
        return FALSE;

    if (pwfx->wFormatTag == WAVE_FORMAT_IEEE_FLOAT)
    {
        pwfx->wFormatTag = WAVE_FORMAT_PCM;
    }
    else if (pwfx->wFormatTag == WAVE_FORMAT_EXTENSIBLE)
    {
        PWAVEFORMATEXTENSIBLE pEx = reinterpret_cast<PWAVEFORMATEXTENSIBLE>(pwfx);
        if (IsEqualGUID(KSDATAFORMAT_SUBTYPE_IEEE_FLOAT, pEx->SubFormat))
            pEx->SubFormat = KSDATAFORMAT_SUBTYPE_PCM;
        else if (!IsEqualGUID(KSDATAFORMAT_SUBTYPE_PCM, pEx->SubFormat))
            return FALSE;   // not sample data we know how to reinterpret

        // Must be updated for the PCM case too: the valid-bit count may not be
        // larger than the container size set below.
        pEx->Samples.wValidBitsPerSample = 16;
    }
    else
    {
        return FALSE;
    }

    // Recompute the derived fields for the 16-bit container.
    pwfx->wBitsPerSample = 16;
    pwfx->nBlockAlign = pwfx->nChannels * pwfx->wBitsPerSample / 8;
    pwfx->nAvgBytesPerSec = pwfx->nBlockAlign * pwfx->nSamplesPerSec;
    return TRUE;
}

// Plays the audio supplied by `pMySource` on the default render endpoint in
// shared mode.
//
// The shared buffer is filled completely once before the stream starts. After
// that the function sleeps for half the buffer duration, refills whatever
// space has become free, and repeats until the source reports
// AUDCLNT_BUFFERFLAGS_SILENT through its flags argument. It then waits another
// half buffer before stopping the stream.
//
// returns - the HRESULT of the first failing call, or the result of
//           IAudioClient::Stop() when playback runs to completion.
HRESULT PlayAudioStream(MyAudioSource *pMySource)
{
    // COM objects and the mix format; all of them are released at `Exit`.
    IMMDeviceEnumerator *deviceEnumerator = NULL;
    IMMDevice           *endpoint         = NULL;
    IAudioClient        *audioClient      = NULL;
    IAudioRenderClient  *renderClient     = NULL;
    WAVEFORMATEX        *mixFormat        = NULL;

    HRESULT        hr;
    REFERENCE_TIME requestedDuration = REFTIMES_PER_SEC;
    REFERENCE_TIME actualDuration;
    UINT32         totalFrames;
    UINT32         freeFrames;
    UINT32         queuedFrames;
    BYTE          *buffer;
    DWORD          bufferFlags = 0;

    hr = CoCreateInstance(CLSID_MMDeviceEnumerator, NULL, CLSCTX_ALL,
                          IID_IMMDeviceEnumerator, (void**)&deviceEnumerator);
    if (FAILED(hr)) { goto Exit; }

    hr = deviceEnumerator->GetDefaultAudioEndpoint(eRender, eConsole, &endpoint);
    if (FAILED(hr)) { goto Exit; }

    hr = endpoint->Activate(IID_IAudioClient, CLSCTX_ALL, NULL, (void**)&audioClient);
    if (FAILED(hr)) { goto Exit; }

    hr = audioClient->GetMixFormat(&mixFormat);
    if (FAILED(hr)) { goto Exit; }

    AdjustFormatTo16Bits(mixFormat);

    hr = audioClient->Initialize(AUDCLNT_SHAREMODE_SHARED, 0, requestedDuration, 0, mixFormat, NULL);
    if (FAILED(hr)) { goto Exit; }

    // Let the source know the format it has to deliver.
    hr = pMySource->SetFormat(mixFormat);
    if (FAILED(hr)) { goto Exit; }

    // Size, in frames, of the buffer that was actually allocated.
    hr = audioClient->GetBufferSize(&totalFrames);
    if (FAILED(hr)) { goto Exit; }

    hr = audioClient->GetService(IID_IAudioRenderClient, (void**)&renderClient);
    if (FAILED(hr)) { goto Exit; }

    // Initial fill: take the whole buffer and load it from the source.
    hr = renderClient->GetBuffer(totalFrames, &buffer);
    if (FAILED(hr)) { goto Exit; }

    hr = pMySource->LoadData(totalFrames * mixFormat->nBlockAlign, (char *)buffer, &bufferFlags);
    if (FAILED(hr)) { goto Exit; }

    hr = renderClient->ReleaseBuffer(totalFrames, bufferFlags);
    if (FAILED(hr)) { goto Exit; }

    // Duration of the allocated buffer in REFERENCE_TIME units.
    actualDuration = (double)REFTIMES_PER_SEC * totalFrames / mixFormat->nSamplesPerSec;

    hr = audioClient->Start();  // Playback begins here.
    if (FAILED(hr)) { goto Exit; }

    // Refill loop; it ends once the source has flagged silence.
    for (;;)
    {
        if (bufferFlags == AUDCLNT_BUFFERFLAGS_SILENT)
            break;

        // Give the device time to consume roughly half of the buffer.
        Sleep((DWORD)(actualDuration / REFTIMES_PER_MILLISEC / 2));

        // Frames still queued for playback.
        hr = audioClient->GetCurrentPadding(&queuedFrames);
        if (FAILED(hr)) { goto Exit; }

        freeFrames = totalFrames - queuedFrames;

        // Take all of the free space and load the next chunk into it.
        hr = renderClient->GetBuffer(freeFrames, &buffer);
        if (FAILED(hr)) { goto Exit; }

        hr = pMySource->LoadData(freeFrames * mixFormat->nBlockAlign, (char *)buffer, &bufferFlags);
        if (FAILED(hr)) { goto Exit; }

        hr = renderClient->ReleaseBuffer(freeFrames, bufferFlags);
        if (FAILED(hr)) { goto Exit; }
    }

    // Let the data still in the buffer play out before stopping.
    Sleep((DWORD)(actualDuration / REFTIMES_PER_MILLISEC / 2));

    hr = audioClient->Stop();  // Playback ends here.

Exit:
    CoTaskMemFree(mixFormat);
    if (deviceEnumerator != NULL) { deviceEnumerator->Release(); deviceEnumerator = NULL; }
    if (endpoint != NULL)         { endpoint->Release();         endpoint = NULL; }
    if (audioClient != NULL)      { audioClient->Release();      audioClient = NULL; }
    if (renderClient != NULL)     { renderClient->Release();     renderClient = NULL; }

    return hr;
}

int main()
{
    fp = fopen("foobar","rb");
    MyAudioSource test;

    CoInitialize(NULL);
    PlayAudioStream(&test);
    CoUninitialize();

    fclose(fp);
    return 0;
}

报告相同问题？

关注问题

wasapi音频独占输出
2021-06-02 02:00

标题中的“wasapi音频独占输出”指的是Windows Audio Session API（WASAPI）的一种工作模式，它是微软在Windows Vista之后引入的音频处理技术。在独占模式下，应用程序可以直接与音频硬件进行通信，跳过了传统的混音...
简要介绍WASAPI播放音频的方法
2023-01-08 23:42

PeaZomboss的博客本文简要介绍了如何使用WASAPI来播放音频的方法，同时提供了相关代码。
miniaudio：用C编写的单文件音频回放和捕获库
2021-01-28 14:05

miniaudio是一个小巧而功能丰富的音频库，专为跨平台的音频回放和捕获设计。它由C语言编写，具有单文件的特性，方便集成到各种项目中，无论是在桌面系统（如Windows、macOS、Linux）还是移动平台（如Android、iOS）...
MixerDLL:用于会话音量管理的 WASAPI 音频混合器简化 DLL
2021-06-02 01:02

用于会话音量管理的 WASAPI 音频混合器简化 DLL 什么是 MixerDLL？它是一种包装器 dll，允许使用 WASAPI 会话卷管理，而无需深入研究它。它是在我们构建像 windows 音频混音器这样的硬件混音器时创建的，它可以...
WASAPI 捕获指定设备的音频
2021-12-14 12:34

傅华涛Fu的博客 #include "stdafx.h" #include <MMDeviceAPI.h> #include <AudioClient.h> #include <iostream> #include <stdio.h> #include <Functiondiscoverykeys_devpkey.h>...// 1秒=1000毫秒..
WASAPI 捕获默认设备的音频
2021-12-13 18:04

傅华涛Fu的博客 } } /* 设置AUDCLNT_STREAMFLAGS_LOOPBACK 这种模式下，音频engine会将rending设备正在播放的音频流，拷贝一份到音频的endpoint buffer 这样的话，WASAPI client可以采集到the stream. 此时仅采集到Speaker的声音 ...
在Windows Store应用程序中使用WASAPI将音频录制到WAV
2021-04-11 05:38

在Windows Store应用程序中使用WASAPI（Windows Audio Session API）将音频录制到WAV格式是一项技术挑战，因为Windows Store应用有其特定的安全性和资源管理限制。以下是对这一主题的详细阐述： **WASAPI概述** ...
使用WASAPI捕获声卡音频
2019-03-19 22:51

东方fan的博客主要的代码参考了官方文档的Capturing a Stream 和Loopback Recording 两篇 WAVHead 代码参考了C++生成简单WAV文件（三）——根据简谱生成菊花台直接上代码主体代码： #include "pch.h" #include "WAVHead.h" ...
Windows Audio Session (WASAPI) sample_wasapi_wasp_wasapicapture_
2021-09-29 12:20

下面将详细阐述WASAPI的主要特性、工作原理以及如何利用C++进行音频捕获和播放。 WASAPI是Windows Audio System Programming Interface的缩写，它提供了两种模式：独占模式和共享模式。独占模式下，应用程序可以...
音频处理开发库JUCE Linux版本：juce-8.0.8-linux.zip
2025-07-10 14:49

JUCE是一个跨平台的 C++ 应用程序框架，主要用于开发音频软件、游戏、图形界面和其他高性能应用程序。它提供了一套丰富的类和工具，简化了跨平台开发的复杂性，使开发者能够一次编写代码，在多个操作系统上运行。跨...
VC++ WASAPI音频捕获（麦克风或扬声器）
2019-12-20 21:46

老狼主的博客声音捕获PCM数据回调函数（CAudioCapture.h）： #ifndef _WAVEFORMATEX_ #define _WAVEFORMATEX_ typedef unsigned short WORD; typedef unsigned long DWORD; typedef struct tWAVEFORMATEX { WORD wFormatTag;....
RecordHWnd.rar_音频采集波形
2022-09-22 18:08

标题中的“RecordHWnd.rar_音频采集波形”暗示了一个基于VC++（Visual C++）开发的项目，其核心功能是实现音频数据的采集，并在界面上以波形图的形式展示出来。这样的系统通常用于音频处理、声音分析或音频编辑等...
WASAPI音频处理实战示例
2025-05-17 14:03

爱吃红豆沙的公子的博客缓冲区是计算机科学中的一个核心概念，它是在操作系统和硬件中普遍存在的一个区域，用于暂时存储在不同速度的硬件之间或者软件和硬件之间传输的数据。在WASAPI（Windows Audio Session API）中，缓冲区的角色尤为...
PeakMeter.rar_PeakMeter_peakmet_音频音柱
2022-09-24 05:39

在VC中，可以使用Windows Multimedia Library（MMSystem）或者WASAPI（Windows Audio Session API）来捕获音频流。 2. **信号处理**：音频数据在被显示为音柱之前，需要经过处理，例如计算每个时间帧的峰值或平均值...
PlayPcmWin:WASAPI音频播放器，用于发烧友-开源
2021-05-10 05:45

PlayPcmWin is yet another opensource audio player for audiophiles. Supported Platforms: Windows 10 / 8.1 / 7. Manuals: ... ■■■■■ Other apps from this project ■■■■■ ...
商业编程-源码-音频技术源代码 cdxCDynamicControlsManager_Project.zip
2022-06-24 01:18

在Windows平台下，可能使用了DirectSound或WASAPI等API来实现音频播放和控制。这些API提供了低延迟、高效率的音频处理功能，对于实时的音频控制至关重要。了解这些API的工作原理和使用方法是理解源代码的关键。 3....
基于Qt框架与WASAPI音频接口开发的Windows系统音频频谱实时可视化分析工具_支持环回采集_FFT频谱分析_20段对数频段显示_彩色柱状图渲染_峰值指示_衰减效果_多线程架.zip
2025-08-20 11:02

本篇文章将详细介绍一款基于Qt框架和WASAPI音频接口开发的Windows系统音频频谱实时可视化分析工具的特点及其技术实现。首先，该分析工具采用了Qt框架作为主要的开发平台。Qt是一个跨平台的C++应用程序框架，它提供...
商业编程-源码-音频技术源代码_cdxCDynamicControlsManager_source.zip
2022-06-24 01:54

这个组件很可能是一个用于管理和控制音频播放的核心模块，可能包含了一些关键的音频处理算法和接口设计。以下是基于这个主题的详细知识点： 1. **音频技术基础**：音频技术涵盖了声音的数字化、编码、解码、混音、...
声卡的检测及声音、音频设备属性的设置
2017-06-28 23:17

NAudio库提供了对DirectSound、WASAPI、WaveOut、MIDI等多种音频接口的支持，可以方便地进行声卡检测、音频流处理、设备属性设置等操作。在你提供的文件"C#333-声卡的检测及声音、音频设备属性的设置"中，可能包含...
C++修改默认音频输出设备
2018-08-03 13:34

在C++编程中，改变默认的音频输出设备是一项涉及到操作系统底层接口和音频处理技术的任务。在Windows操作系统中，这项功能通常需要使用特定的API或库来实现，如本例中提到的`PolicyConfig.h`库。`PolicyConfig.h`是...
没有解决我的问题, 去提问

码龄粉丝数原力等级 --

基于WASAPI的音频捕获和音频播放，注意“禁用前面板插孔检测”。

2条回答默认最新

码龄粉丝数原力等级 --

基于WASAPI的音频捕获和音频播放，注意“禁用前面板插孔检测”。

2条回答 默认 最新

2条回答默认最新