wasapi_loopback_capturer.cpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357
  1. #include "wasapi_loopback_capturer.h"
  2. #include <audioclient.h>
  3. #include <comdef.h>
  4. #include <mmdeviceapi.h>
  5. #include <windows.h>
  6. #include <QDebug>
  7. #undef min
  8. class WASAPILoopbackCapturerPrivate
  9. {
  10. public:
  11. IAudioCapturer::Type deviceType;
  12. WASAPILoopbackCapturerPrivate()
  13. {
  14. CoInitialize(nullptr);
  15. }
  16. ~WASAPILoopbackCapturerPrivate()
  17. {
  18. if (pwfx)
  19. CoTaskMemFree(pwfx);
  20. if (pCaptureClient)
  21. pCaptureClient->Release();
  22. if (pAudioClient)
  23. pAudioClient->Release();
  24. if (pDevice)
  25. pDevice->Release();
  26. if (pEnumerator)
  27. pEnumerator->Release();
  28. CoUninitialize();
  29. }
  30. bool init(IAudioCapturer::Type type)
  31. {
  32. HRESULT hr;
  33. hr = CoCreateInstance(__uuidof(MMDeviceEnumerator),
  34. nullptr,
  35. CLSCTX_ALL,
  36. __uuidof(IMMDeviceEnumerator),
  37. (void**)&pEnumerator);
  38. if (FAILED(hr)) {
  39. qDebug() << "Failed to create MMDeviceEnumerator";
  40. return false;
  41. }
  42. deviceType = type;
  43. EDataFlow dataFlow = (deviceType == IAudioCapturer::Type::Speaker) ? eRender : eCapture;
  44. hr = pEnumerator->GetDefaultAudioEndpoint(dataFlow, eConsole, &pDevice);
  45. if (FAILED(hr)) {
  46. qDebug() << "Failed to get default audio endpoint";
  47. return false;
  48. }
  49. hr = pDevice->Activate(__uuidof(IAudioClient), CLSCTX_ALL, nullptr, (void**)&pAudioClient);
  50. if (FAILED(hr)) {
  51. qDebug() << "Failed to activate audio client";
  52. return false;
  53. }
  54. return true;
  55. }
  56. // 初始化音频客户端
  57. bool initializeAudioClient()
  58. {
  59. AUDCLNT_SHAREMODE shareMode = AUDCLNT_SHAREMODE_SHARED;
  60. DWORD streamFlags = AUDCLNT_STREAMFLAGS_AUTOCONVERTPCM
  61. | AUDCLNT_STREAMFLAGS_SRC_DEFAULT_QUALITY;
  62. if (deviceType == IAudioCapturer::Type::Speaker) {
  63. streamFlags |= AUDCLNT_STREAMFLAGS_LOOPBACK;
  64. }
  65. REFERENCE_TIME hnsBufferDuration = 0;
  66. HRESULT hr
  67. = pAudioClient->Initialize(shareMode, streamFlags, hnsBufferDuration, 0, pwfx, nullptr);
  68. if (FAILED(hr)) {
  69. qDebug() << "Failed to initialize audio client, HRESULT:" << QString::number(hr, 16);
  70. return false;
  71. }
  72. qDebug() << "Audio client initialized successfully";
  73. return true;
  74. }
  75. bool setupCaptureClient()
  76. {
  77. if (!pAudioClient) {
  78. qDebug() << "Audio client is null, cannot get capture client";
  79. return false;
  80. }
  81. HRESULT hr = pAudioClient->GetService(__uuidof(IAudioCaptureClient), (void**) &pCaptureClient);
  82. if (FAILED(hr)) {
  83. qDebug() << "Failed to get capture client, HRESULT:" << QString::number(hr, 16)
  84. << "AudioClient:" << pAudioClient << "CaptureClient:" << pCaptureClient;
  85. return false;
  86. }
  87. qDebug() << "Capture client obtained successfully:" << pCaptureClient;
  88. return true;
  89. }
  90. bool startCapture()
  91. {
  92. if (!pAudioClient) {
  93. qDebug() << "Audio client is null, cannot start capture";
  94. return false;
  95. }
  96. HRESULT hr = pAudioClient->Start();
  97. if (FAILED(hr)) {
  98. qDebug() << "Failed to start audio client, HRESULT:" << QString::number(hr, 16);
  99. return false;
  100. }
  101. qDebug() << "Audio client started successfully";
  102. return true;
  103. }
  104. void stopCapture()
  105. {
  106. if (pAudioClient) {
  107. pAudioClient->Stop();
  108. }
  109. }
  110. // 获取音频格式并设置到AudioFormat结构中
  111. bool setupAudioFormat(AudioFormat& audioFormat)
  112. {
  113. if (!pwfx) {
  114. return false;
  115. }
  116. // 设置音频格式
  117. audioFormat.sampleRate = pwfx->nSamplesPerSec;
  118. audioFormat.channels = pwfx->nChannels;
  119. audioFormat.bitsPerSample = pwfx->wBitsPerSample;
  120. audioFormat.blockAlign = pwfx->nBlockAlign;
  121. audioFormat.avgBytesPerSec = pwfx->nAvgBytesPerSec;
  122. // 如果是浮点格式,保持32bit,让混音器处理格式转换
  123. if (pwfx->wFormatTag == WAVE_FORMAT_IEEE_FLOAT) {
  124. qDebug() << "Keeping 32t float format for mixer processing";
  125. }
  126. return true;
  127. }
  128. // 处理音频数据
  129. int processAudioData(std::vector<char>& buffer, std::mutex& mutex)
  130. {
  131. UINT32 packetLength = 0;
  132. HRESULT hr = pCaptureClient->GetNextPacketSize(&packetLength);
  133. if (FAILED(hr)) {
  134. qDebug() << "Failed to get next packet size";
  135. return -1;
  136. }
  137. if (packetLength == 0) {
  138. return 0;
  139. }
  140. BYTE* pData = nullptr;
  141. UINT32 numFrames = 0;
  142. DWORD flags = 0;
  143. hr = pCaptureClient->GetBuffer(&pData, &numFrames, &flags, nullptr, nullptr);
  144. if (FAILED(hr)) {
  145. qDebug() << "Failed to get buffer";
  146. return -1;
  147. }
  148. int bytes = numFrames * pwfx->nBlockAlign;
  149. if (pwfx->wFormatTag == WAVE_FORMAT_IEEE_FLOAT) {
  150. // 32bit浮点格式,直接传递原始数据,让混音器处理格式转换
  151. std::lock_guard<std::mutex> lock(mutex);
  152. // 限制缓冲区大小,避免内存无限增长
  153. const size_t maxBufferSize = 1024 * 1024; // 1MB
  154. int bytesToAdd = numFrames * pwfx->nBlockAlign;
  155. if (buffer.size() + bytesToAdd > maxBufferSize) {
  156. buffer.erase(buffer.begin(), buffer.begin() + (buffer.size() - bytesToAdd));
  157. }
  158. buffer.insert(buffer.end(),
  159. (char*) pData,
  160. (char*) pData + bytesToAdd);
  161. } else {
  162. // PCM 直接拷贝
  163. std::lock_guard<std::mutex> lock(mutex);
  164. // 限制缓冲区大小,避免内存无限增长
  165. const size_t maxBufferSize = 1024 * 1024; // 1MB
  166. int bytesToAdd = numFrames * pwfx->nBlockAlign;
  167. if (buffer.size() + bytesToAdd > maxBufferSize) {
  168. buffer.erase(buffer.begin(), buffer.begin() + (buffer.size() - bytesToAdd));
  169. }
  170. buffer.insert(buffer.end(),
  171. (char*) pData,
  172. (char*) pData + bytesToAdd);
  173. }
  174. pCaptureClient->ReleaseBuffer(numFrames);
  175. return bytes;
  176. }
  177. IMMDeviceEnumerator* pEnumerator = nullptr;
  178. IMMDevice* pDevice = nullptr;
  179. IAudioClient* pAudioClient = nullptr;
  180. IAudioCaptureClient* pCaptureClient = nullptr;
  181. WAVEFORMATEX* pwfx = nullptr;
  182. WAVEFORMATEXTENSIBLE _formatex;
  183. };
  184. WASAPILoopbackCapturer::WASAPILoopbackCapturer(QObject* parent)
  185. : QObject(parent)
  186. , d(new WASAPILoopbackCapturerPrivate)
  187. {
  188. }
  189. WASAPILoopbackCapturer::~WASAPILoopbackCapturer()
  190. {
  191. Stop();
  192. delete d;
  193. }
  194. bool WASAPILoopbackCapturer::Init(Type deviceType)
  195. {
  196. m_deviceType = deviceType;
  197. if (!d->init(deviceType)) {
  198. qDebug() << "Failed to initialize WASAPI components";
  199. return false;
  200. }
  201. // 尝试使用默认格式
  202. AudioFormat defaultFormat = IAudioCapturer::GetDefaultFormat();
  203. WAVEFORMATEX* formatToUse = (WAVEFORMATEX*)CoTaskMemAlloc(sizeof(WAVEFORMATEX));
  204. if (!formatToUse) {
  205. qDebug() << "Failed to allocate memory for WAVEFORMATEX";
  206. return false;
  207. }
  208. formatToUse->wFormatTag = WAVE_FORMAT_PCM;
  209. formatToUse->nChannels = defaultFormat.channels;
  210. formatToUse->nSamplesPerSec = defaultFormat.sampleRate;
  211. formatToUse->wBitsPerSample = defaultFormat.bitsPerSample;
  212. formatToUse->nBlockAlign = (formatToUse->nChannels * formatToUse->wBitsPerSample) / 8;
  213. formatToUse->nAvgBytesPerSec = formatToUse->nSamplesPerSec * formatToUse->nBlockAlign;
  214. formatToUse->cbSize = 0;
  215. d->pwfx = formatToUse;
  216. // 尝试使用默认格式初始化,如果失败则回退
  217. if (!d->initializeAudioClient()) {
  218. qWarning("Default audio format not supported, falling back to GetMixFormat.");
  219. CoTaskMemFree(d->pwfx);
  220. d->pwfx = nullptr;
  221. // 使用GetMixFormat获取系统首选格式
  222. HRESULT hr = d->pAudioClient->GetMixFormat(&d->pwfx);
  223. if (FAILED(hr)) {
  224. qDebug() << "Failed to GetMixFormat on fallback, HRESULT:" << QString::number(hr, 16);
  225. return false;
  226. }
  227. // 再次尝试初始化
  228. if (!d->initializeAudioClient()) {
  229. qDebug() << "Failed to initialize audio client on fallback.";
  230. CoTaskMemFree(d->pwfx);
  231. d->pwfx = nullptr;
  232. return false;
  233. }
  234. }
  235. // 设置音频格式
  236. if (!d->setupAudioFormat(m_audioFormat)) {
  237. qDebug() << "Failed to setup audio format";
  238. return false;
  239. }
  240. qDebug() << "WASAPI Loopback Capturer initialized successfully";
  241. return true;
  242. }
  243. bool WASAPILoopbackCapturer::Start()
  244. {
  245. if (m_running)
  246. return false;
  247. if (!d->setupCaptureClient()) {
  248. return false;
  249. }
  250. if (!d->startCapture()) {
  251. return false;
  252. }
  253. m_running = true;
  254. m_captureThread = std::thread(&WASAPILoopbackCapturer::captureThreadFunc, this);
  255. return true;
  256. }
  257. void WASAPILoopbackCapturer::Stop()
  258. {
  259. if (!m_running)
  260. return;
  261. m_running = false;
  262. if (m_captureThread.joinable())
  263. m_captureThread.join();
  264. d->stopCapture();
  265. }
  266. const AudioFormat& WASAPILoopbackCapturer::GetFormat() const
  267. {
  268. return m_audioFormat;
  269. }
  270. int WASAPILoopbackCapturer::readAudioData(char* buf, int maxLen)
  271. {
  272. std::unique_lock<std::mutex> lock(m_mutex);
  273. // 按帧对齐读取,确保不会破坏音频帧
  274. int blockAlign = m_audioFormat.blockAlign;
  275. if (blockAlign <= 0) {
  276. return 0;
  277. }
  278. // 计算可以读取的完整帧数
  279. int availableFrames = m_buffer.size() / blockAlign;
  280. int requestedFrames = maxLen / blockAlign;
  281. int framesToRead = std::min(availableFrames, requestedFrames);
  282. if (framesToRead > 0) {
  283. int bytesToRead = framesToRead * blockAlign;
  284. memcpy(buf, m_buffer.data(), bytesToRead);
  285. m_buffer.erase(m_buffer.begin(), m_buffer.begin() + bytesToRead);
  286. return bytesToRead;
  287. }
  288. return 0;
  289. }
  290. void WASAPILoopbackCapturer::captureThreadFunc()
  291. {
  292. qDebug() << "WASAPI Loopback capture started successfully";
  293. while (m_running) {
  294. int result = d->processAudioData(m_buffer, m_mutex);
  295. if (result < 0) {
  296. qDebug() << "Error processing audio data";
  297. break;
  298. }
  299. if (result == 0) {
  300. Sleep(10);
  301. }
  302. }
  303. qDebug() << "WASAPI Loopback capture stopped";
  304. }