capture_audio_capturer.cpp 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907
  1. #include "capture_audio_capturer.h"
  2. #include "../base/logger.h"
  3. #include "../base/media_common.h"
  4. #include <algorithm>
  5. #include <cmath>
  6. #ifdef _WIN32
  7. #include <windows.h>
  8. #include <mmdeviceapi.h>
  9. #include <audioclient.h>
  10. #include <endpointvolume.h>
  11. #pragma comment(lib, "ole32.lib")
  12. #endif
  13. extern "C" {
  14. #include <libavformat/avformat.h>
  15. #include <libavdevice/avdevice.h>
  16. #include <libswresample/swresample.h>
  17. #include <libavutil/opt.h>
  18. #include <libavutil/channel_layout.h>
  19. }
  20. namespace av {
  21. namespace capture {
  22. AudioCapturer::AudioCapturer() : audioParams_(CapturerType::AUDIO_MIC) {
  23. AV_LOGGER_DEBUG("创建音频采集器");
  24. // 注册设备
  25. avdevice_register_all();
  26. lastLevelUpdate_ = std::chrono::steady_clock::now();
  27. }
  28. AudioCapturer::~AudioCapturer() {
  29. close();
  30. AV_LOGGER_DEBUG("音频采集器已销毁");
  31. }
  32. ErrorCode AudioCapturer::initialize(const CapturerParams& params) {
  33. if (params.mediaType != MediaType::AUDIO) {
  34. AV_LOGGER_ERROR("参数媒体类型不是音频");
  35. return ErrorCode::INVALID_PARAMS;
  36. }
  37. audioParams_ = static_cast<const AudioCaptureParams&>(params);
  38. if (!validateParams(audioParams_)) {
  39. return ErrorCode::INVALID_PARAMS;
  40. }
  41. ErrorCode result = ErrorCode::SUCCESS;
  42. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  43. result = initializeMicrophone();
  44. } else if (audioParams_.type == CapturerType::AUDIO_SYSTEM ||
  45. audioParams_.type == CapturerType::AUDIO_LOOPBACK) {
  46. result = initializeSystemAudio();
  47. } else {
  48. AV_LOGGER_ERROR("不支持的音频采集器类型");
  49. return ErrorCode::NOT_SUPPORTED;
  50. }
  51. if (result == ErrorCode::SUCCESS) {
  52. setState(CapturerState::INITIALIZED);
  53. AV_LOGGER_INFOF("音频采集器初始化成功: {}Hz, {}ch, {}",
  54. audioParams_.sampleRate, audioParams_.channels,
  55. av_get_sample_fmt_name(audioParams_.sampleFormat));
  56. }
  57. return result;
  58. }
  59. ErrorCode AudioCapturer::start() {
  60. std::lock_guard<std::mutex> lock(captureMutex_);
  61. if (getState() != CapturerState::INITIALIZED) {
  62. AV_LOGGER_ERROR("采集器状态无效,无法启动");
  63. return ErrorCode::INVALID_STATE;
  64. }
  65. shouldStop_ = false;
  66. // 启动采集线程
  67. try {
  68. captureThread_ = std::thread(&AudioCapturer::captureThreadFunc, this);
  69. setState(CapturerState::STARTED);
  70. AV_LOGGER_INFO("音频采集已启动");
  71. return ErrorCode::SUCCESS;
  72. } catch (const std::exception& e) {
  73. AV_LOGGER_ERRORF("启动音频采集线程失败: {}", e.what());
  74. return ErrorCode::THREAD_ERROR;
  75. }
  76. }
  77. ErrorCode AudioCapturer::stop() {
  78. std::lock_guard<std::mutex> lock(captureMutex_);
  79. if (getState() != CapturerState::STARTED) {
  80. return ErrorCode::SUCCESS;
  81. }
  82. shouldStop_ = true;
  83. // 唤醒暂停的线程
  84. {
  85. std::lock_guard<std::mutex> pauseLock(pauseMutex_);
  86. paused_ = false;
  87. pauseCondition_.notify_all();
  88. }
  89. // 等待线程结束
  90. if (captureThread_.joinable()) {
  91. captureThread_.join();
  92. }
  93. setState(CapturerState::STOPPED);
  94. AV_LOGGER_INFO("音频采集已停止");
  95. return ErrorCode::SUCCESS;
  96. }
  97. ErrorCode AudioCapturer::pause() {
  98. if (getState() != CapturerState::STARTED) {
  99. return ErrorCode::INVALID_STATE;
  100. }
  101. paused_ = true;
  102. AV_LOGGER_INFO("音频采集已暂停");
  103. return ErrorCode::SUCCESS;
  104. }
  105. ErrorCode AudioCapturer::resume() {
  106. if (getState() != CapturerState::STARTED) {
  107. return ErrorCode::INVALID_STATE;
  108. }
  109. {
  110. std::lock_guard<std::mutex> lock(pauseMutex_);
  111. paused_ = false;
  112. pauseCondition_.notify_all();
  113. }
  114. AV_LOGGER_INFO("音频采集已恢复");
  115. return ErrorCode::SUCCESS;
  116. }
  117. ErrorCode AudioCapturer::reset() {
  118. ErrorCode result = stop();
  119. if (result != ErrorCode::SUCCESS) {
  120. return result;
  121. }
  122. // 清空帧队列
  123. {
  124. std::lock_guard<std::mutex> lock(queueMutex_);
  125. while (!frameQueue_.empty()) {
  126. frameQueue_.pop();
  127. }
  128. }
  129. resetStats();
  130. audioLevel_ = 0.0f;
  131. setState(CapturerState::INITIALIZED);
  132. AV_LOGGER_INFO("音频采集器已重置");
  133. return ErrorCode::SUCCESS;
  134. }
  135. ErrorCode AudioCapturer::close() {
  136. stop();
  137. // 清理资源
  138. cleanupResampler();
  139. cleanupAudioProcessing();
  140. if (codecCtx_) {
  141. avcodec_free_context(&codecCtx_);
  142. codecCtx_ = nullptr;
  143. }
  144. if (formatCtx_) {
  145. avformat_close_input(&formatCtx_);
  146. formatCtx_ = nullptr;
  147. }
  148. codec_ = nullptr;
  149. audioStreamIndex_ = -1;
  150. setState(CapturerState::IDLE);
  151. AV_LOGGER_INFO("音频采集器已关闭");
  152. return ErrorCode::SUCCESS;
  153. }
  154. std::vector<std::string> AudioCapturer::getAvailableDevices() const {
  155. std::vector<std::string> devices;
  156. auto deviceInfos = getDetailedDeviceInfo();
  157. for (const auto& info : deviceInfos) {
  158. devices.push_back(info.name);
  159. }
  160. return devices;
  161. }
  162. std::string AudioCapturer::getCurrentDevice() const {
  163. return audioParams_.deviceName;
  164. }
  165. std::vector<AudioDeviceInfo> AudioCapturer::getDetailedDeviceInfo() const {
  166. std::lock_guard<std::mutex> lock(deviceCacheMutex_);
  167. if (!devicesCached_) {
  168. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  169. cachedDevices_ = enumerateMicrophones();
  170. } else {
  171. cachedDevices_ = enumerateSystemAudioDevices();
  172. }
  173. devicesCached_ = true;
  174. }
  175. return cachedDevices_;
  176. }
  177. ErrorCode AudioCapturer::setAudioParams(int sampleRate, int channels, AVSampleFormat sampleFormat) {
  178. if (getState() == CapturerState::STARTED) {
  179. AV_LOGGER_ERROR("无法在采集过程中修改音频参数");
  180. return ErrorCode::INVALID_STATE;
  181. }
  182. audioParams_.sampleRate = sampleRate;
  183. audioParams_.channels = channels;
  184. audioParams_.sampleFormat = sampleFormat;
  185. AV_LOGGER_INFOF("音频参数已更新: {}Hz, {}ch, {}",
  186. sampleRate, channels, av_get_sample_fmt_name(sampleFormat));
  187. return ErrorCode::SUCCESS;
  188. }
  189. ErrorCode AudioCapturer::setVolume(float volume) {
  190. if (volume < 0.0f || volume > 2.0f) {
  191. AV_LOGGER_ERROR("音量值超出范围 (0.0-2.0)");
  192. return ErrorCode::INVALID_PARAMS;
  193. }
  194. currentVolume_ = volume;
  195. audioParams_.volume = volume;
  196. AV_LOGGER_INFOF("音量已设置为: {:.2f}", volume);
  197. return ErrorCode::SUCCESS;
  198. }
  199. float AudioCapturer::getVolume() const {
  200. return currentVolume_;
  201. }
  202. ErrorCode AudioCapturer::setNoiseReduction(bool enable) {
  203. noiseReductionEnabled_ = enable;
  204. audioParams_.enableNoiseReduction = enable;
  205. AV_LOGGER_INFOF("Noise reduction {}", enable ? "enabled" : "disabled");
  206. return ErrorCode::SUCCESS;
  207. }
  208. ErrorCode AudioCapturer::setEchoCancellation(bool enable) {
  209. echoCancellationEnabled_ = enable;
  210. audioParams_.enableEchoCancellation = enable;
  211. AV_LOGGER_INFOF("Echo cancellation {}", enable ? "enabled" : "disabled");
  212. return ErrorCode::SUCCESS;
  213. }
  214. AudioCaptureParams AudioCapturer::getCurrentParams() const {
  215. return audioParams_;
  216. }
  217. float AudioCapturer::getAudioLevel() const {
  218. return audioLevel_.load();
  219. }
  220. bool AudioCapturer::validateParams(const CapturerParams& params) {
  221. const auto& audioParams = static_cast<const AudioCaptureParams&>(params);
  222. if (audioParams.sampleRate <= 0 || audioParams.sampleRate > 192000) {
  223. AV_LOGGER_ERROR("采样率无效");
  224. return false;
  225. }
  226. if (audioParams.channels <= 0 || audioParams.channels > 8) {
  227. AV_LOGGER_ERROR("声道数无效");
  228. return false;
  229. }
  230. if (audioParams.bufferSize <= 0 || audioParams.bufferSize > 8192) {
  231. AV_LOGGER_ERROR("缓冲区大小无效");
  232. return false;
  233. }
  234. if (audioParams.volume < 0.0f || audioParams.volume > 2.0f) {
  235. AV_LOGGER_ERROR("音量值无效");
  236. return false;
  237. }
  238. return true;
  239. }
  240. ErrorCode AudioCapturer::initializeMicrophone() {
  241. AV_LOGGER_INFOF("初始化麦克风采集器: 索引={}", audioParams_.micIndex);
  242. #ifdef _WIN32
  243. return setupDirectSoundMicrophone();
  244. #elif defined(__linux__)
  245. return setupALSAMicrophone();
  246. #elif defined(__APPLE__)
  247. return setupCoreAudioMicrophone();
  248. #else
  249. AV_LOGGER_ERROR("当前平台不支持麦克风采集");
  250. return ErrorCode::NOT_SUPPORTED;
  251. #endif
  252. }
  253. ErrorCode AudioCapturer::initializeSystemAudio() {
  254. AV_LOGGER_INFO("初始化系统音频采集器");
  255. #ifdef _WIN32
  256. return setupWASAPISystemAudio();
  257. #elif defined(__linux__)
  258. return setupPulseAudioCapture();
  259. #elif defined(__APPLE__)
  260. return setupCoreAudioSystemCapture();
  261. #else
  262. AV_LOGGER_ERROR("当前平台不支持系统音频采集");
  263. return ErrorCode::NOT_SUPPORTED;
  264. #endif
  265. }
  266. ErrorCode AudioCapturer::openInputDevice() {
  267. const AVInputFormat* inputFormat = getPlatformInputFormat();
  268. if (!inputFormat) {
  269. AV_LOGGER_ERROR("获取音频输入格式失败");
  270. return ErrorCode::NOT_SUPPORTED;
  271. }
  272. std::string deviceName = getPlatformDeviceName();
  273. if (deviceName.empty()) {
  274. AV_LOGGER_ERROR("获取音频设备名称失败");
  275. return ErrorCode::DEVICE_NOT_FOUND;
  276. }
  277. AV_LOGGER_INFOF("打开音频输入设备: {} (格式: {})", deviceName, inputFormat->name);
  278. // 设置输入选项
  279. AVDictionary* options = nullptr;
  280. // 设置音频参数
  281. av_dict_set(&options, "sample_rate", std::to_string(audioParams_.sampleRate).c_str(), 0);
  282. av_dict_set(&options, "channels", std::to_string(audioParams_.channels).c_str(), 0);
  283. // 设置缓冲区大小
  284. av_dict_set(&options, "audio_buffer_size", std::to_string(audioParams_.bufferSize).c_str(), 0);
  285. // 打开输入
  286. int ret = avformat_open_input(&formatCtx_, deviceName.c_str(), inputFormat, &options);
  287. av_dict_free(&options);
  288. if (ret < 0) {
  289. AV_LOGGER_ERRORF("打开音频输入设备失败: {} (设备: {})",
  290. ffmpeg_utils::errorToString(ret), deviceName);
  291. return static_cast<ErrorCode>(ret);
  292. }
  293. // 查找流信息
  294. ret = avformat_find_stream_info(formatCtx_, nullptr);
  295. if (ret < 0) {
  296. AV_LOGGER_ERRORF("查找音频流信息失败: {}", ffmpeg_utils::errorToString(ret));
  297. return static_cast<ErrorCode>(ret);
  298. }
  299. // 查找音频流
  300. audioStreamIndex_ = av_find_best_stream(formatCtx_, AVMEDIA_TYPE_AUDIO, -1, -1, &codec_, 0);
  301. if (audioStreamIndex_ < 0) {
  302. AV_LOGGER_ERROR("未找到音频流");
  303. return ErrorCode::STREAM_NOT_FOUND;
  304. }
  305. // 创建解码上下文
  306. codecCtx_ = avcodec_alloc_context3(codec_);
  307. if (!codecCtx_) {
  308. AV_LOGGER_ERROR("分配音频解码上下文失败");
  309. return ErrorCode::MEMORY_ALLOC_FAILED;
  310. }
  311. // 复制流参数到解码上下文
  312. ret = avcodec_parameters_to_context(codecCtx_, formatCtx_->streams[audioStreamIndex_]->codecpar);
  313. if (ret < 0) {
  314. AV_LOGGER_ERRORF("复制音频流参数失败: {}", ffmpeg_utils::errorToString(ret));
  315. return static_cast<ErrorCode>(ret);
  316. }
  317. // 打开解码器
  318. ret = avcodec_open2(codecCtx_, codec_, nullptr);
  319. if (ret < 0) {
  320. AV_LOGGER_ERRORF("打开音频解码器失败: {}", ffmpeg_utils::errorToString(ret));
  321. return static_cast<ErrorCode>(ret);
  322. }
  323. // 设置音频重采样
  324. return setupAudioResampling();
  325. }
  326. ErrorCode AudioCapturer::setupAudioResampling() {
  327. AVSampleFormat srcFormat = codecCtx_->sample_fmt;
  328. int srcSampleRate = codecCtx_->sample_rate;
  329. int srcChannels = codecCtx_->ch_layout.nb_channels;
  330. AVChannelLayout srcChannelLayout = codecCtx_->ch_layout;
  331. AVSampleFormat dstFormat = audioParams_.sampleFormat;
  332. int dstSampleRate = audioParams_.sampleRate;
  333. int dstChannels = audioParams_.channels;
  334. AVChannelLayout dstChannelLayout;
  335. av_channel_layout_default(&dstChannelLayout, dstChannels);
  336. needResampling_ = (srcFormat != dstFormat) ||
  337. (srcSampleRate != dstSampleRate) ||
  338. (srcChannels != dstChannels);
  339. if (needResampling_) {
  340. AV_LOGGER_INFOF("需要音频重采样: {}Hz,{}ch,{} -> {}Hz,{}ch,{}",
  341. srcSampleRate, srcChannels, av_get_sample_fmt_name(srcFormat),
  342. dstSampleRate, dstChannels, av_get_sample_fmt_name(dstFormat));
  343. swrCtx_ = swr_alloc();
  344. if (!swrCtx_) {
  345. AV_LOGGER_ERROR("分配音频重采样器失败");
  346. return ErrorCode::MEMORY_ALLOC_FAILED;
  347. }
  348. // 设置重采样参数
  349. av_opt_set_chlayout(swrCtx_, "in_chlayout", &srcChannelLayout, 0);
  350. av_opt_set_int(swrCtx_, "in_sample_rate", srcSampleRate, 0);
  351. av_opt_set_sample_fmt(swrCtx_, "in_sample_fmt", srcFormat, 0);
  352. av_opt_set_chlayout(swrCtx_, "out_chlayout", &dstChannelLayout, 0);
  353. av_opt_set_int(swrCtx_, "out_sample_rate", dstSampleRate, 0);
  354. av_opt_set_sample_fmt(swrCtx_, "out_sample_fmt", dstFormat, 0);
  355. // 初始化重采样器
  356. int ret = swr_init(swrCtx_);
  357. if (ret < 0) {
  358. AV_LOGGER_ERRORF("初始化音频重采样器失败: {}", ffmpeg_utils::errorToString(ret));
  359. cleanupResampler();
  360. return static_cast<ErrorCode>(ret);
  361. }
  362. // 创建重采样输出帧
  363. resampledFrame_ = makeAVFrame();
  364. if (!resampledFrame_) {
  365. return ErrorCode::MEMORY_ALLOC_FAILED;
  366. }
  367. resampledFrame_->format = dstFormat;
  368. resampledFrame_->sample_rate = dstSampleRate;
  369. av_channel_layout_copy(&resampledFrame_->ch_layout, &dstChannelLayout);
  370. }
  371. return ErrorCode::SUCCESS;
  372. }
  373. void AudioCapturer::captureThreadFunc() {
  374. AV_LOGGER_INFO("音频采集线程已启动");
  375. while (!shouldStop_) {
  376. // 检查暂停状态
  377. {
  378. std::unique_lock<std::mutex> lock(pauseMutex_);
  379. pauseCondition_.wait(lock, [this] { return !paused_ || shouldStop_; });
  380. }
  381. if (shouldStop_) {
  382. break;
  383. }
  384. ErrorCode result = captureFrame();
  385. if (result != ErrorCode::SUCCESS) {
  386. onError(result, "采集音频帧失败");
  387. // 短暂休眠后重试
  388. std::this_thread::sleep_for(std::chrono::milliseconds(5));
  389. }
  390. }
  391. AV_LOGGER_INFO("音频采集线程已退出");
  392. }
  393. ErrorCode AudioCapturer::captureFrame() {
  394. AVPacket* packet = av_packet_alloc();
  395. if (!packet) {
  396. return ErrorCode::MEMORY_ALLOC_FAILED;
  397. }
  398. // 读取包
  399. int ret = av_read_frame(formatCtx_, packet);
  400. if (ret < 0) {
  401. av_packet_free(&packet);
  402. if (ret == AVERROR_EOF) {
  403. AV_LOGGER_WARNING("音频流结束");
  404. return ErrorCode::END_OF_STREAM;
  405. } else {
  406. AV_LOGGER_ERRORF("读取音频帧失败: {}", ffmpeg_utils::errorToString(ret));
  407. return static_cast<ErrorCode>(ret);
  408. }
  409. }
  410. // 检查是否是音频包
  411. if (packet->stream_index != audioStreamIndex_) {
  412. av_packet_free(&packet);
  413. return ErrorCode::SUCCESS;
  414. }
  415. // 发送包到解码器
  416. ret = avcodec_send_packet(codecCtx_, packet);
  417. av_packet_free(&packet);
  418. if (ret < 0) {
  419. AV_LOGGER_ERRORF("发送音频包到解码器失败: {}", ffmpeg_utils::errorToString(ret));
  420. return static_cast<ErrorCode>(ret);
  421. }
  422. // 接收解码后的帧
  423. AVFramePtr frame = makeAVFrame();
  424. if (!frame) {
  425. return ErrorCode::MEMORY_ALLOC_FAILED;
  426. }
  427. ret = avcodec_receive_frame(codecCtx_, frame.get());
  428. if (ret == AVERROR(EAGAIN)) {
  429. return ErrorCode::SUCCESS; // 需要更多输入
  430. } else if (ret < 0) {
  431. AV_LOGGER_ERRORF("接收音频解码帧失败: {}", ffmpeg_utils::errorToString(ret));
  432. return static_cast<ErrorCode>(ret);
  433. }
  434. // 音频处理
  435. AVFramePtr processedFrame = processAudioFrame(frame);
  436. if (!processedFrame) {
  437. return ErrorCode::PROCESSING_ERROR;
  438. }
  439. // 计算音频电平
  440. calculateAudioLevel(processedFrame);
  441. // 回调
  442. onFrameCaptured(processedFrame);
  443. return ErrorCode::SUCCESS;
  444. }
  445. AVFramePtr AudioCapturer::processAudioFrame(const AVFramePtr& frame) {
  446. if (!frame) {
  447. return nullptr;
  448. }
  449. AVFramePtr processedFrame = std::move(const_cast<AVFramePtr&>(frame));
  450. // 重采样
  451. if (needResampling_) {
  452. processedFrame = resampleAudioFrame(processedFrame);
  453. if (!processedFrame) {
  454. return nullptr;
  455. }
  456. }
  457. // 音量控制
  458. if (currentVolume_ != 1.0f) {
  459. processedFrame = applyVolumeControl(processedFrame);
  460. }
  461. // 降噪处理
  462. if (noiseReductionEnabled_) {
  463. processedFrame = applyNoiseReduction(processedFrame);
  464. }
  465. return processedFrame;
  466. }
  467. AVFramePtr AudioCapturer::resampleAudioFrame(const AVFramePtr& frame) {
  468. if (!frame || !swrCtx_ || !resampledFrame_) {
  469. return nullptr;
  470. }
  471. // 计算输出采样数
  472. int outSamples = swr_get_out_samples(swrCtx_, frame->nb_samples);
  473. resampledFrame_->nb_samples = outSamples;
  474. // 重新分配缓冲区(如果需要)
  475. if (av_frame_get_buffer(resampledFrame_.get(), 0) < 0) {
  476. AV_LOGGER_ERROR("分配重采样缓冲区失败");
  477. return nullptr;
  478. }
  479. // 执行重采样
  480. int convertedSamples = swr_convert(swrCtx_,
  481. resampledFrame_->data, outSamples,
  482. (const uint8_t**)frame->data, frame->nb_samples);
  483. if (convertedSamples < 0) {
  484. AV_LOGGER_ERRORF("音频重采样失败: {}", ffmpeg_utils::errorToString(convertedSamples));
  485. return nullptr;
  486. }
  487. resampledFrame_->nb_samples = convertedSamples;
  488. // 复制时间戳等信息
  489. av_frame_copy_props(resampledFrame_.get(), frame.get());
  490. // 创建新的frame并复制数据
  491. AVFramePtr outputFrame = makeAVFrame();
  492. if (!outputFrame) {
  493. return nullptr;
  494. }
  495. av_frame_ref(outputFrame.get(), resampledFrame_.get());
  496. return outputFrame;
  497. }
  498. AVFramePtr AudioCapturer::applyVolumeControl(const AVFramePtr& frame) {
  499. if (!frame || currentVolume_ == 1.0f) {
  500. return nullptr;
  501. }
  502. // 简单的音量控制实现
  503. AVSampleFormat format = static_cast<AVSampleFormat>(frame->format);
  504. int channels = frame->ch_layout.nb_channels;
  505. int samples = frame->nb_samples;
  506. if (format == AV_SAMPLE_FMT_S16) {
  507. int16_t* data = reinterpret_cast<int16_t*>(frame->data[0]);
  508. for (int i = 0; i < samples * channels; ++i) {
  509. data[i] = static_cast<int16_t>(data[i] * currentVolume_);
  510. }
  511. } else if (format == AV_SAMPLE_FMT_FLT) {
  512. float* data = reinterpret_cast<float*>(frame->data[0]);
  513. for (int i = 0; i < samples * channels; ++i) {
  514. data[i] *= currentVolume_;
  515. }
  516. }
  517. return nullptr;
  518. }
  519. AVFramePtr AudioCapturer::applyNoiseReduction(const AVFramePtr& frame) {
  520. // 简单的降噪实现(实际应用中需要更复杂的算法)
  521. if (!frame) {
  522. return nullptr;
  523. }
  524. // 这里可以实现噪声门限、频谱减法等降噪算法
  525. // 目前只是一个占位符实现
  526. return nullptr;
  527. }
  528. void AudioCapturer::calculateAudioLevel(const AVFramePtr& frame) {
  529. if (!frame) {
  530. return;
  531. }
  532. auto now = std::chrono::steady_clock::now();
  533. auto elapsed = std::chrono::duration<double>(now - lastLevelUpdate_).count();
  534. if (elapsed < LEVEL_UPDATE_INTERVAL) {
  535. return;
  536. }
  537. std::lock_guard<std::mutex> lock(levelMutex_);
  538. AVSampleFormat format = static_cast<AVSampleFormat>(frame->format);
  539. int channels = frame->ch_layout.nb_channels;
  540. int samples = frame->nb_samples;
  541. double sum = 0.0;
  542. int totalSamples = samples * channels;
  543. if (format == AV_SAMPLE_FMT_S16) {
  544. const int16_t* data = reinterpret_cast<const int16_t*>(frame->data[0]);
  545. for (int i = 0; i < totalSamples; ++i) {
  546. sum += std::abs(data[i]) / 32768.0;
  547. }
  548. } else if (format == AV_SAMPLE_FMT_FLT) {
  549. const float* data = reinterpret_cast<const float*>(frame->data[0]);
  550. for (int i = 0; i < totalSamples; ++i) {
  551. sum += std::abs(data[i]);
  552. }
  553. }
  554. float level = static_cast<float>(sum / totalSamples);
  555. audioLevel_.store(std::min<float>(level, 1.0f));
  556. lastLevelUpdate_ = now;
  557. }
  558. void AudioCapturer::cleanupResampler() {
  559. if (swrCtx_) {
  560. swr_free(&swrCtx_);
  561. swrCtx_ = nullptr;
  562. }
  563. resampledFrame_.reset();
  564. needResampling_ = false;
  565. }
  566. void AudioCapturer::cleanupAudioProcessing() {
  567. // 清理音频处理相关资源
  568. noiseReductionEnabled_ = false;
  569. echoCancellationEnabled_ = false;
  570. currentVolume_ = 1.0f;
  571. audioLevel_ = 0.0f;
  572. }
  573. std::vector<AudioDeviceInfo> AudioCapturer::enumerateMicrophones() const {
  574. #ifdef _WIN32
  575. return enumerateDirectSoundDevices();
  576. #elif defined(__linux__)
  577. return enumerateALSADevices();
  578. #elif defined(__APPLE__)
  579. return enumerateCoreAudioDevices();
  580. #else
  581. return {};
  582. #endif
  583. }
  584. std::vector<AudioDeviceInfo> AudioCapturer::enumerateSystemAudioDevices() const {
  585. #ifdef _WIN32
  586. return enumerateWASAPIDevices();
  587. #elif defined(__linux__)
  588. return enumeratePulseAudioDevices();
  589. #elif defined(__APPLE__)
  590. return enumerateCoreAudioDevices();
  591. #else
  592. return {};
  593. #endif
  594. }
  595. const AVInputFormat* AudioCapturer::getPlatformInputFormat() const {
  596. #ifdef _WIN32
  597. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  598. return av_find_input_format("dshow");
  599. } else {
  600. return av_find_input_format("dshow"); // WASAPI通过dshow访问
  601. }
  602. #elif defined(__linux__)
  603. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  604. return av_find_input_format("alsa");
  605. } else {
  606. return av_find_input_format("pulse");
  607. }
  608. #elif defined(__APPLE__)
  609. return av_find_input_format("avfoundation");
  610. #endif
  611. return nullptr;
  612. }
  613. std::string AudioCapturer::getPlatformDeviceName() const {
  614. #ifdef _WIN32
  615. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  616. if (!audioParams_.deviceName.empty()) {
  617. return "audio=" + audioParams_.deviceName;
  618. } else {
  619. return "audio=" + std::to_string(audioParams_.micIndex);
  620. }
  621. } else {
  622. return "audio=" + (audioParams_.audioDevice.empty() ? "@device_cm_{33D9A762-90C8-11D0-BD43-00A0C911CE86}\\wave_{00000000-0000-0000-0000-000000000000}" : audioParams_.audioDevice);
  623. }
  624. #elif defined(__linux__)
  625. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  626. if (!audioParams_.deviceName.empty()) {
  627. return audioParams_.deviceName;
  628. } else {
  629. return "hw:" + std::to_string(audioParams_.micIndex);
  630. }
  631. } else {
  632. return audioParams_.audioDevice.empty() ? "default" : audioParams_.audioDevice;
  633. }
  634. #elif defined(__APPLE__)
  635. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  636. return ":" + std::to_string(audioParams_.micIndex);
  637. } else {
  638. return ":none";
  639. }
  640. #endif
  641. return "";
  642. }
  643. #ifdef _WIN32
  644. std::vector<AudioDeviceInfo> AudioCapturer::enumerateDirectSoundDevices() const {
  645. std::vector<AudioDeviceInfo> devices;
  646. // 简化的DirectSound设备枚举
  647. AudioDeviceInfo device;
  648. device.id = "0";
  649. device.name = "默认麦克风";
  650. device.description = "DirectSound麦克风设备";
  651. device.isDefault = true;
  652. device.isInput = true;
  653. // 添加常见采样率
  654. device.supportedSampleRates = {8000, 16000, 22050, 44100, 48000};
  655. // 添加常见声道数
  656. device.supportedChannels = {1, 2};
  657. // 添加支持的采样格式
  658. device.supportedFormats = {
  659. AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_FLT
  660. };
  661. devices.push_back(device);
  662. return devices;
  663. }
  664. std::vector<AudioDeviceInfo> AudioCapturer::enumerateWASAPIDevices() const {
  665. std::vector<AudioDeviceInfo> devices;
  666. // 简化的WASAPI设备枚举
  667. AudioDeviceInfo device;
  668. device.id = "wasapi_default";
  669. device.name = "默认系统音频";
  670. device.description = "WASAPI系统音频设备";
  671. device.isDefault = true;
  672. device.isInput = false;
  673. // 添加常见采样率
  674. device.supportedSampleRates = {44100, 48000, 96000};
  675. // 添加常见声道数
  676. device.supportedChannels = {2, 6, 8};
  677. // 添加支持的采样格式
  678. device.supportedFormats = {
  679. AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_FLT
  680. };
  681. devices.push_back(device);
  682. return devices;
  683. }
  684. ErrorCode AudioCapturer::setupDirectSoundMicrophone() {
  685. AV_LOGGER_INFO("设置DirectSound麦克风");
  686. return openInputDevice();
  687. }
  688. ErrorCode AudioCapturer::setupWASAPISystemAudio() {
  689. AV_LOGGER_INFO("设置WASAPI系统音频");
  690. return openInputDevice();
  691. }
  692. #endif
  693. // AudioCaptureFactory 实现
  694. std::unique_ptr<AudioCapturer> AudioCapturer::AudioCaptureFactory::createMicrophone(int micIndex) {
  695. auto capturer = std::make_unique<AudioCapturer>();
  696. AudioCaptureParams params(CapturerType::AUDIO_MIC);
  697. params.micIndex = micIndex;
  698. ErrorCode result = capturer->initialize(params);
  699. if (result != ErrorCode::SUCCESS) {
  700. AV_LOGGER_ERRORF("创建麦克风采集器失败: {}", static_cast<int>(result));
  701. return nullptr;
  702. }
  703. return capturer;
  704. }
  705. std::unique_ptr<AudioCapturer> AudioCapturer::AudioCaptureFactory::createSystemAudio(bool loopback) {
  706. auto capturer = std::make_unique<AudioCapturer>();
  707. AudioCaptureParams params(loopback ? CapturerType::AUDIO_LOOPBACK : CapturerType::AUDIO_SYSTEM);
  708. params.captureLoopback = loopback;
  709. ErrorCode result = capturer->initialize(params);
  710. if (result != ErrorCode::SUCCESS) {
  711. AV_LOGGER_ERRORF("创建系统音频采集器失败: {}", static_cast<int>(result));
  712. return nullptr;
  713. }
  714. return capturer;
  715. }
  716. std::unique_ptr<AudioCapturer> AudioCapturer::AudioCaptureFactory::createBestMicrophone() {
  717. return createMicrophone(0); // 默认使用第一个麦克风
  718. }
  719. } // namespace capture
  720. } // namespace av