capture_audio_capturer.cpp 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897
  1. #include "capture_audio_capturer.h"
  2. #include "../base/logger.h"
  3. #include "../base/media_common.h"
  4. #include <algorithm>
  5. #include <cmath>
  6. #ifdef _WIN32
  7. #include <windows.h>
  8. #include <mmdeviceapi.h>
  9. #include <audioclient.h>
  10. #include <endpointvolume.h>
  11. #pragma comment(lib, "ole32.lib")
  12. #endif
  13. extern "C" {
  14. #include <libavformat/avformat.h>
  15. #include <libavdevice/avdevice.h>
  16. #include <libswresample/swresample.h>
  17. #include <libavutil/opt.h>
  18. #include <libavutil/channel_layout.h>
  19. }
  20. namespace av {
  21. namespace capture {
  22. AudioCapturer::AudioCapturer() : audioParams_(CapturerType::AUDIO_MIC) {
  23. AV_LOGGER_DEBUG("创建音频采集器");
  24. // 注册设备
  25. avdevice_register_all();
  26. lastLevelUpdate_ = std::chrono::steady_clock::now();
  27. }
  28. AudioCapturer::~AudioCapturer() {
  29. close();
  30. AV_LOGGER_DEBUG("音频采集器已销毁");
  31. }
  32. ErrorCode AudioCapturer::initialize(const CapturerParams& params) {
  33. if (params.mediaType != MediaType::AUDIO) {
  34. AV_LOGGER_ERROR("参数媒体类型不是音频");
  35. return ErrorCode::INVALID_ARGUMENT;
  36. }
  37. audioParams_ = static_cast<const AudioCaptureParams&>(params);
  38. if (!validateParams(audioParams_)) {
  39. return ErrorCode::INVALID_PARAMS;
  40. }
  41. ErrorCode result = ErrorCode::OK;
  42. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  43. result = initializeMicrophone();
  44. } else if (audioParams_.type == CapturerType::AUDIO_SYSTEM ||
  45. audioParams_.type == CapturerType::AUDIO_LOOPBACK) {
  46. result = initializeSystemAudio();
  47. } else {
  48. AV_LOGGER_ERROR("不支持的音频采集器类型");
  49. return ErrorCode::NOT_SUPPORTED;
  50. }
  51. if (result == ErrorCode::OK) {
  52. setState(CapturerState::INITIALIZED);
  53. AV_LOGGER_INFOF("音频采集器初始化成功: {}Hz, {}ch, {}",
  54. audioParams_.sampleRate, audioParams_.channels,
  55. av_get_sample_fmt_name(audioParams_.sampleFormat));
  56. }
  57. return result;
  58. }
  59. ErrorCode AudioCapturer::start() {
  60. std::lock_guard<std::mutex> lock(captureMutex_);
  61. if (getState() != CapturerState::INITIALIZED) {
  62. AV_LOGGER_ERROR("采集器状态无效,无法启动");
  63. return ErrorCode::INVALID_STATE;
  64. }
  65. shouldStop_ = false;
  66. // 启动采集线程
  67. try {
  68. captureThread_ = std::thread(&AudioCapturer::captureThreadFunc, this);
  69. setState(CapturerState::STARTED);
  70. AV_LOGGER_INFO("音频采集已启动");
  71. return ErrorCode::OK;
  72. } catch (const std::exception& e) {
  73. AV_LOGGER_ERRORF("启动音频采集线程失败: {}", e.what());
  74. return ErrorCode::THREAD_ERROR;
  75. }
  76. }
  77. ErrorCode AudioCapturer::stop() {
  78. std::lock_guard<std::mutex> lock(captureMutex_);
  79. if (getState() != CapturerState::STARTED) {
  80. return ErrorCode::OK;
  81. }
  82. shouldStop_ = true;
  83. // 唤醒暂停的线程
  84. {
  85. std::lock_guard<std::mutex> pauseLock(pauseMutex_);
  86. paused_ = false;
  87. pauseCondition_.notify_all();
  88. }
  89. // 等待线程结束
  90. if (captureThread_.joinable()) {
  91. captureThread_.join();
  92. }
  93. setState(CapturerState::STOPPED);
  94. AV_LOGGER_INFO("音频采集已停止");
  95. return ErrorCode::OK;
  96. }
  97. ErrorCode AudioCapturer::pause() {
  98. if (getState() != CapturerState::STARTED) {
  99. return ErrorCode::INVALID_STATE;
  100. }
  101. paused_ = true;
  102. AV_LOGGER_INFO("音频采集已暂停");
  103. return ErrorCode::OK;
  104. }
  105. ErrorCode AudioCapturer::resume() {
  106. if (getState() != CapturerState::STARTED) {
  107. return ErrorCode::INVALID_STATE;
  108. }
  109. {
  110. std::lock_guard<std::mutex> lock(pauseMutex_);
  111. paused_ = false;
  112. pauseCondition_.notify_all();
  113. }
  114. AV_LOGGER_INFO("音频采集已恢复");
  115. return ErrorCode::OK;
  116. }
  117. ErrorCode AudioCapturer::reset() {
  118. ErrorCode result = stop();
  119. if (result != ErrorCode::OK) {
  120. return result;
  121. }
  122. // 清空帧队列
  123. {
  124. std::lock_guard<std::mutex> lock(queueMutex_);
  125. while (!frameQueue_.empty()) {
  126. frameQueue_.pop();
  127. }
  128. }
  129. resetStats();
  130. audioLevel_ = 0.0f;
  131. setState(CapturerState::INITIALIZED);
  132. AV_LOGGER_INFO("音频采集器已重置");
  133. return ErrorCode::OK;
  134. }
  135. ErrorCode AudioCapturer::close() {
  136. stop();
  137. // 清理资源
  138. cleanupResampler();
  139. cleanupAudioProcessing();
  140. if (codecCtx_) {
  141. avcodec_free_context(&codecCtx_);
  142. codecCtx_ = nullptr;
  143. }
  144. if (formatCtx_) {
  145. avformat_close_input(&formatCtx_);
  146. formatCtx_ = nullptr;
  147. }
  148. codec_ = nullptr;
  149. audioStreamIndex_ = -1;
  150. setState(CapturerState::IDLE);
  151. AV_LOGGER_INFO("音频采集器已关闭");
  152. return ErrorCode::OK;
  153. }
  154. std::vector<std::string> AudioCapturer::getAvailableDevices() const {
  155. std::vector<std::string> devices;
  156. auto deviceInfos = getDetailedDeviceInfo();
  157. for (const auto& info : deviceInfos) {
  158. devices.push_back(info.name);
  159. }
  160. return devices;
  161. }
  162. std::string AudioCapturer::getCurrentDevice() const {
  163. return audioParams_.deviceName;
  164. }
  165. std::vector<AudioDeviceInfo> AudioCapturer::getDetailedDeviceInfo() const {
  166. std::lock_guard<std::mutex> lock(deviceCacheMutex_);
  167. if (!devicesCached_) {
  168. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  169. cachedDevices_ = enumerateMicrophones();
  170. } else {
  171. cachedDevices_ = enumerateSystemAudioDevices();
  172. }
  173. devicesCached_ = true;
  174. }
  175. return cachedDevices_;
  176. }
  177. ErrorCode AudioCapturer::setAudioParams(int sampleRate, int channels, AVSampleFormat sampleFormat) {
  178. if (getState() == CapturerState::STARTED) {
  179. AV_LOGGER_ERROR("无法在采集过程中修改音频参数");
  180. return ErrorCode::INVALID_STATE;
  181. }
  182. audioParams_.sampleRate = sampleRate;
  183. audioParams_.channels = channels;
  184. audioParams_.sampleFormat = sampleFormat;
  185. AV_LOGGER_INFOF("音频参数已更新: {}Hz, {}ch, {}",
  186. sampleRate, channels, av_get_sample_fmt_name(sampleFormat));
  187. return ErrorCode::OK;
  188. }
  189. ErrorCode AudioCapturer::setVolume(float volume) {
  190. if (volume < 0.0f || volume > 2.0f) {
  191. AV_LOGGER_ERROR("音量值超出范围 (0.0-2.0)");
  192. return ErrorCode::INVALID_ARGUMENT;
  193. }
  194. currentVolume_ = volume;
  195. audioParams_.volume = volume;
  196. AV_LOGGER_INFOF("音量已设置为: {:.2f}", volume);
  197. return ErrorCode::OK;
  198. }
  199. float AudioCapturer::getVolume() const {
  200. return currentVolume_;
  201. }
  202. ErrorCode AudioCapturer::setNoiseReduction(bool enable) {
  203. noiseReductionEnabled_ = enable;
  204. audioParams_.enableNoiseReduction = enable;
  205. AV_LOGGER_INFOF("降噪已{}", enable ? "启用" : "禁用");
  206. return ErrorCode::OK;
  207. }
  208. ErrorCode AudioCapturer::setEchoCancellation(bool enable) {
  209. echoCancellationEnabled_ = enable;
  210. audioParams_.enableEchoCancellation = enable;
  211. AV_LOGGER_INFOF("回声消除已{}", enable ? "启用" : "禁用");
  212. return ErrorCode::OK;
  213. }
  214. AudioCaptureParams AudioCapturer::getCurrentParams() const {
  215. return audioParams_;
  216. }
  217. float AudioCapturer::getAudioLevel() const {
  218. return audioLevel_.load();
  219. }
  220. bool AudioCapturer::validateParams(const CapturerParams& params) {
  221. const auto& audioParams = static_cast<const AudioCaptureParams&>(params);
  222. if (audioParams.sampleRate <= 0 || audioParams.sampleRate > 192000) {
  223. AV_LOGGER_ERROR("采样率无效");
  224. return false;
  225. }
  226. if (audioParams.channels <= 0 || audioParams.channels > 8) {
  227. AV_LOGGER_ERROR("声道数无效");
  228. return false;
  229. }
  230. if (audioParams.bufferSize <= 0 || audioParams.bufferSize > 8192) {
  231. AV_LOGGER_ERROR("缓冲区大小无效");
  232. return false;
  233. }
  234. if (audioParams.volume < 0.0f || audioParams.volume > 2.0f) {
  235. AV_LOGGER_ERROR("音量值无效");
  236. return false;
  237. }
  238. return true;
  239. }
  240. ErrorCode AudioCapturer::initializeMicrophone() {
  241. AV_LOGGER_INFOF("初始化麦克风采集器: 索引={}", audioParams_.micIndex);
  242. #ifdef _WIN32
  243. return setupDirectSoundMicrophone();
  244. #elif defined(__linux__)
  245. return setupALSAMicrophone();
  246. #elif defined(__APPLE__)
  247. return setupCoreAudioMicrophone();
  248. #else
  249. AV_LOGGER_ERROR("当前平台不支持麦克风采集");
  250. return ErrorCode::NOT_SUPPORTED;
  251. #endif
  252. }
  253. ErrorCode AudioCapturer::initializeSystemAudio() {
  254. AV_LOGGER_INFO("初始化系统音频采集器");
  255. #ifdef _WIN32
  256. return setupWASAPISystemAudio();
  257. #elif defined(__linux__)
  258. return setupPulseAudioCapture();
  259. #elif defined(__APPLE__)
  260. return setupCoreAudioSystemCapture();
  261. #else
  262. AV_LOGGER_ERROR("当前平台不支持系统音频采集");
  263. return ErrorCode::NOT_SUPPORTED;
  264. #endif
  265. }
  266. ErrorCode AudioCapturer::openInputDevice() {
  267. const AVInputFormat* inputFormat = getPlatformInputFormat();
  268. if (!inputFormat) {
  269. AV_LOGGER_ERROR("获取音频输入格式失败");
  270. return ErrorCode::NOT_SUPPORTED;
  271. }
  272. std::string deviceName = getPlatformDeviceName();
  273. if (deviceName.empty()) {
  274. AV_LOGGER_ERROR("获取音频设备名称失败");
  275. return ErrorCode::DEVICE_NOT_FOUND;
  276. }
  277. AV_LOGGER_INFOF("打开音频输入设备: {} (格式: {})", deviceName, inputFormat->name);
  278. // 设置输入选项
  279. AVDictionary* options = nullptr;
  280. // 设置音频参数
  281. av_dict_set(&options, "sample_rate", std::to_string(audioParams_.sampleRate).c_str(), 0);
  282. av_dict_set(&options, "channels", std::to_string(audioParams_.channels).c_str(), 0);
  283. // 设置缓冲区大小
  284. av_dict_set(&options, "audio_buffer_size", std::to_string(audioParams_.bufferSize).c_str(), 0);
  285. // 打开输入
  286. int ret = avformat_open_input(&formatCtx_, deviceName.c_str(), inputFormat, &options);
  287. av_dict_free(&options);
  288. if (ret < 0) {
  289. AV_LOGGER_ERRORF("打开音频输入设备失败: {} (设备: {})",
  290. ffmpeg_utils::errorToString(ret), deviceName);
  291. return static_cast<ErrorCode>(ret);
  292. }
  293. // 查找流信息
  294. ret = avformat_find_stream_info(formatCtx_, nullptr);
  295. if (ret < 0) {
  296. AV_LOGGER_ERRORF("查找音频流信息失败: {}", ffmpeg_utils::errorToString(ret));
  297. return static_cast<ErrorCode>(ret);
  298. }
  299. // 查找音频流
  300. audioStreamIndex_ = av_find_best_stream(formatCtx_, AVMEDIA_TYPE_AUDIO, -1, -1, &codec_, 0);
  301. if (audioStreamIndex_ < 0) {
  302. AV_LOGGER_ERROR("未找到音频流");
  303. return ErrorCode::STREAM_NOT_FOUND;
  304. }
  305. // 创建解码上下文
  306. codecCtx_ = avcodec_alloc_context3(codec_);
  307. if (!codecCtx_) {
  308. AV_LOGGER_ERROR("分配音频解码上下文失败");
  309. return ErrorCode::OUT_OF_MEMORY;
  310. }
  311. // 复制流参数到解码上下文
  312. ret = avcodec_parameters_to_context(codecCtx_, formatCtx_->streams[audioStreamIndex_]->codecpar);
  313. if (ret < 0) {
  314. AV_LOGGER_ERRORF("复制音频流参数失败: {}", ffmpeg_utils::errorToString(ret));
  315. return static_cast<ErrorCode>(ret);
  316. }
  317. // 打开解码器
  318. ret = avcodec_open2(codecCtx_, codec_, nullptr);
  319. if (ret < 0) {
  320. AV_LOGGER_ERRORF("打开音频解码器失败: {}", ffmpeg_utils::errorToString(ret));
  321. return static_cast<ErrorCode>(ret);
  322. }
  323. // 设置音频重采样
  324. return setupAudioResampling();
  325. }
  326. ErrorCode AudioCapturer::setupAudioResampling() {
  327. AVSampleFormat srcFormat = codecCtx_->sample_fmt;
  328. int srcSampleRate = codecCtx_->sample_rate;
  329. int srcChannels = codecCtx_->channels;
  330. uint64_t srcChannelLayout = codecCtx_->channel_layout;
  331. AVSampleFormat dstFormat = audioParams_.sampleFormat;
  332. int dstSampleRate = audioParams_.sampleRate;
  333. int dstChannels = audioParams_.channels;
  334. uint64_t dstChannelLayout = av_get_default_channel_layout(dstChannels);
  335. needResampling_ = (srcFormat != dstFormat) ||
  336. (srcSampleRate != dstSampleRate) ||
  337. (srcChannels != dstChannels);
  338. if (needResampling_) {
  339. AV_LOGGER_INFOF("需要音频重采样: {}Hz,{}ch,{} -> {}Hz,{}ch,{}",
  340. srcSampleRate, srcChannels, av_get_sample_fmt_name(srcFormat),
  341. dstSampleRate, dstChannels, av_get_sample_fmt_name(dstFormat));
  342. swrCtx_ = swr_alloc();
  343. if (!swrCtx_) {
  344. AV_LOGGER_ERROR("分配音频重采样器失败");
  345. return ErrorCode::OUT_OF_MEMORY;
  346. }
  347. // 设置重采样参数
  348. av_opt_set_int(swrCtx_, "in_channel_layout", srcChannelLayout, 0);
  349. av_opt_set_int(swrCtx_, "in_sample_rate", srcSampleRate, 0);
  350. av_opt_set_sample_fmt(swrCtx_, "in_sample_fmt", srcFormat, 0);
  351. av_opt_set_int(swrCtx_, "out_channel_layout", dstChannelLayout, 0);
  352. av_opt_set_int(swrCtx_, "out_sample_rate", dstSampleRate, 0);
  353. av_opt_set_sample_fmt(swrCtx_, "out_sample_fmt", dstFormat, 0);
  354. // 初始化重采样器
  355. int ret = swr_init(swrCtx_);
  356. if (ret < 0) {
  357. AV_LOGGER_ERRORF("初始化音频重采样器失败: {}", ffmpeg_utils::errorToString(ret));
  358. cleanupResampler();
  359. return static_cast<ErrorCode>(ret);
  360. }
  361. // 创建重采样输出帧
  362. resampledFrame_ = makeAVFrame();
  363. if (!resampledFrame_) {
  364. return ErrorCode::OUT_OF_MEMORY;
  365. }
  366. resampledFrame_->format = dstFormat;
  367. resampledFrame_->sample_rate = dstSampleRate;
  368. resampledFrame_->channels = dstChannels;
  369. resampledFrame_->channel_layout = dstChannelLayout;
  370. }
  371. return ErrorCode::OK;
  372. }
  373. void AudioCapturer::captureThreadFunc() {
  374. AV_LOGGER_INFO("音频采集线程已启动");
  375. while (!shouldStop_) {
  376. // 检查暂停状态
  377. {
  378. std::unique_lock<std::mutex> lock(pauseMutex_);
  379. pauseCondition_.wait(lock, [this] { return !paused_ || shouldStop_; });
  380. }
  381. if (shouldStop_) {
  382. break;
  383. }
  384. ErrorCode result = captureFrame();
  385. if (result != ErrorCode::OK) {
  386. onError(result, "采集音频帧失败");
  387. // 短暂休眠后重试
  388. std::this_thread::sleep_for(std::chrono::milliseconds(5));
  389. }
  390. }
  391. AV_LOGGER_INFO("音频采集线程已退出");
  392. }
  393. ErrorCode AudioCapturer::captureFrame() {
  394. AVPacket packet;
  395. av_init_packet(&packet);
  396. // 读取包
  397. int ret = av_read_frame(formatCtx_, &packet);
  398. if (ret < 0) {
  399. if (ret == AVERROR_EOF) {
  400. AV_LOGGER_WARNING("音频流结束");
  401. return ErrorCode::END_OF_STREAM;
  402. } else {
  403. AV_LOGGER_ERRORF("读取音频帧失败: {}", ffmpeg_utils::errorToString(ret));
  404. return static_cast<ErrorCode>(ret);
  405. }
  406. }
  407. // 检查是否是音频包
  408. if (packet.stream_index != audioStreamIndex_) {
  409. av_packet_unref(&packet);
  410. return ErrorCode::OK;
  411. }
  412. // 发送包到解码器
  413. ret = avcodec_send_packet(codecCtx_, &packet);
  414. av_packet_unref(&packet);
  415. if (ret < 0) {
  416. AV_LOGGER_ERRORF("发送音频包到解码器失败: {}", ffmpeg_utils::errorToString(ret));
  417. return static_cast<ErrorCode>(ret);
  418. }
  419. // 接收解码后的帧
  420. AVFramePtr frame = makeAVFrame();
  421. if (!frame) {
  422. return ErrorCode::OUT_OF_MEMORY;
  423. }
  424. ret = avcodec_receive_frame(codecCtx_, frame.get());
  425. if (ret == AVERROR(EAGAIN)) {
  426. return ErrorCode::OK; // 需要更多输入
  427. } else if (ret < 0) {
  428. AV_LOGGER_ERRORF("接收音频解码帧失败: {}", ffmpeg_utils::errorToString(ret));
  429. return static_cast<ErrorCode>(ret);
  430. }
  431. // 音频处理
  432. AVFramePtr processedFrame = processAudioFrame(frame);
  433. if (!processedFrame) {
  434. return ErrorCode::PROCESSING_ERROR;
  435. }
  436. // 计算音频电平
  437. calculateAudioLevel(processedFrame);
  438. // 回调
  439. onFrameCaptured(processedFrame);
  440. return ErrorCode::OK;
  441. }
  442. AVFramePtr AudioCapturer::processAudioFrame(const AVFramePtr& frame) {
  443. if (!frame) {
  444. return nullptr;
  445. }
  446. AVFramePtr processedFrame = frame;
  447. // 重采样
  448. if (needResampling_) {
  449. processedFrame = resampleAudioFrame(processedFrame);
  450. if (!processedFrame) {
  451. return nullptr;
  452. }
  453. }
  454. // 音量控制
  455. if (currentVolume_ != 1.0f) {
  456. processedFrame = applyVolumeControl(processedFrame);
  457. }
  458. // 降噪处理
  459. if (noiseReductionEnabled_) {
  460. processedFrame = applyNoiseReduction(processedFrame);
  461. }
  462. return processedFrame;
  463. }
  464. AVFramePtr AudioCapturer::resampleAudioFrame(const AVFramePtr& frame) {
  465. if (!frame || !swrCtx_ || !resampledFrame_) {
  466. return frame;
  467. }
  468. // 计算输出采样数
  469. int outSamples = swr_get_out_samples(swrCtx_, frame->nb_samples);
  470. resampledFrame_->nb_samples = outSamples;
  471. // 重新分配缓冲区(如果需要)
  472. if (av_frame_get_buffer(resampledFrame_.get(), 0) < 0) {
  473. AV_LOGGER_ERROR("分配重采样缓冲区失败");
  474. return nullptr;
  475. }
  476. // 执行重采样
  477. int convertedSamples = swr_convert(swrCtx_,
  478. resampledFrame_->data, outSamples,
  479. (const uint8_t**)frame->data, frame->nb_samples);
  480. if (convertedSamples < 0) {
  481. AV_LOGGER_ERRORF("音频重采样失败: {}", ffmpeg_utils::errorToString(convertedSamples));
  482. return nullptr;
  483. }
  484. resampledFrame_->nb_samples = convertedSamples;
  485. // 复制时间戳等信息
  486. av_frame_copy_props(resampledFrame_.get(), frame.get());
  487. return resampledFrame_;
  488. }
  489. AVFramePtr AudioCapturer::applyVolumeControl(const AVFramePtr& frame) {
  490. if (!frame || currentVolume_ == 1.0f) {
  491. return frame;
  492. }
  493. // 简单的音量控制实现
  494. AVSampleFormat format = static_cast<AVSampleFormat>(frame->format);
  495. int channels = frame->ch_layout.nb_channels;
  496. int samples = frame->nb_samples;
  497. if (format == AV_SAMPLE_FMT_S16) {
  498. int16_t* data = reinterpret_cast<int16_t*>(frame->data[0]);
  499. for (int i = 0; i < samples * channels; ++i) {
  500. data[i] = static_cast<int16_t>(data[i] * currentVolume_);
  501. }
  502. } else if (format == AV_SAMPLE_FMT_FLT) {
  503. float* data = reinterpret_cast<float*>(frame->data[0]);
  504. for (int i = 0; i < samples * channels; ++i) {
  505. data[i] *= currentVolume_;
  506. }
  507. }
  508. return frame;
  509. }
  510. AVFramePtr AudioCapturer::applyNoiseReduction(const AVFramePtr& frame) {
  511. // 简单的降噪实现(实际应用中需要更复杂的算法)
  512. if (!frame) {
  513. return frame;
  514. }
  515. // 这里可以实现噪声门限、频谱减法等降噪算法
  516. // 目前只是一个占位符实现
  517. return frame;
  518. }
  519. void AudioCapturer::calculateAudioLevel(const AVFramePtr& frame) {
  520. if (!frame) {
  521. return;
  522. }
  523. auto now = std::chrono::steady_clock::now();
  524. auto elapsed = std::chrono::duration<double>(now - lastLevelUpdate_).count();
  525. if (elapsed < LEVEL_UPDATE_INTERVAL) {
  526. return;
  527. }
  528. std::lock_guard<std::mutex> lock(levelMutex_);
  529. AVSampleFormat format = static_cast<AVSampleFormat>(frame->format);
  530. int channels = frame->ch_layout.nb_channels;
  531. int samples = frame->nb_samples;
  532. double sum = 0.0;
  533. int totalSamples = samples * channels;
  534. if (format == AV_SAMPLE_FMT_S16) {
  535. const int16_t* data = reinterpret_cast<const int16_t*>(frame->data[0]);
  536. for (int i = 0; i < totalSamples; ++i) {
  537. sum += std::abs(data[i]) / 32768.0;
  538. }
  539. } else if (format == AV_SAMPLE_FMT_FLT) {
  540. const float* data = reinterpret_cast<const float*>(frame->data[0]);
  541. for (int i = 0; i < totalSamples; ++i) {
  542. sum += std::abs(data[i]);
  543. }
  544. }
  545. float level = static_cast<float>(sum / totalSamples);
  546. audioLevel_.store(std::min(level, 1.0f));
  547. lastLevelUpdate_ = now;
  548. }
  549. void AudioCapturer::cleanupResampler() {
  550. if (swrCtx_) {
  551. swr_free(&swrCtx_);
  552. swrCtx_ = nullptr;
  553. }
  554. resampledFrame_.reset();
  555. needResampling_ = false;
  556. }
  557. void AudioCapturer::cleanupAudioProcessing() {
  558. // 清理音频处理相关资源
  559. noiseReductionEnabled_ = false;
  560. echoCancellationEnabled_ = false;
  561. currentVolume_ = 1.0f;
  562. audioLevel_ = 0.0f;
  563. }
  564. std::vector<AudioDeviceInfo> AudioCapturer::enumerateMicrophones() const {
  565. #ifdef _WIN32
  566. return enumerateDirectSoundDevices();
  567. #elif defined(__linux__)
  568. return enumerateALSADevices();
  569. #elif defined(__APPLE__)
  570. return enumerateCoreAudioDevices();
  571. #else
  572. return {};
  573. #endif
  574. }
  575. std::vector<AudioDeviceInfo> AudioCapturer::enumerateSystemAudioDevices() const {
  576. #ifdef _WIN32
  577. return enumerateWASAPIDevices();
  578. #elif defined(__linux__)
  579. return enumeratePulseAudioDevices();
  580. #elif defined(__APPLE__)
  581. return enumerateCoreAudioDevices();
  582. #else
  583. return {};
  584. #endif
  585. }
  586. const AVInputFormat* AudioCapturer::getPlatformInputFormat() const {
  587. #ifdef _WIN32
  588. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  589. return av_find_input_format("dshow");
  590. } else {
  591. return av_find_input_format("dshow"); // WASAPI通过dshow访问
  592. }
  593. #elif defined(__linux__)
  594. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  595. return av_find_input_format("alsa");
  596. } else {
  597. return av_find_input_format("pulse");
  598. }
  599. #elif defined(__APPLE__)
  600. return av_find_input_format("avfoundation");
  601. #endif
  602. return nullptr;
  603. }
  604. std::string AudioCapturer::getPlatformDeviceName() const {
  605. #ifdef _WIN32
  606. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  607. if (!audioParams_.deviceName.empty()) {
  608. return "audio=" + audioParams_.deviceName;
  609. } else {
  610. return "audio=" + std::to_string(audioParams_.micIndex);
  611. }
  612. } else {
  613. return "audio=" + (audioParams_.audioDevice.empty() ? "@device_cm_{33D9A762-90C8-11D0-BD43-00A0C911CE86}\\wave_{00000000-0000-0000-0000-000000000000}" : audioParams_.audioDevice);
  614. }
  615. #elif defined(__linux__)
  616. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  617. if (!audioParams_.deviceName.empty()) {
  618. return audioParams_.deviceName;
  619. } else {
  620. return "hw:" + std::to_string(audioParams_.micIndex);
  621. }
  622. } else {
  623. return audioParams_.audioDevice.empty() ? "default" : audioParams_.audioDevice;
  624. }
  625. #elif defined(__APPLE__)
  626. if (audioParams_.type == CapturerType::AUDIO_MIC) {
  627. return ":" + std::to_string(audioParams_.micIndex);
  628. } else {
  629. return ":none";
  630. }
  631. #endif
  632. return "";
  633. }
  634. #ifdef _WIN32
  635. std::vector<AudioDeviceInfo> AudioCapturer::enumerateDirectSoundDevices() const {
  636. std::vector<AudioDeviceInfo> devices;
  637. // 简化的DirectSound设备枚举
  638. AudioDeviceInfo device;
  639. device.id = "0";
  640. device.name = "默认麦克风";
  641. device.description = "DirectSound麦克风设备";
  642. device.isDefault = true;
  643. device.isInput = true;
  644. // 添加常见采样率
  645. device.supportedSampleRates = {8000, 16000, 22050, 44100, 48000};
  646. // 添加常见声道数
  647. device.supportedChannels = {1, 2};
  648. // 添加支持的采样格式
  649. device.supportedFormats = {
  650. AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_FLT
  651. };
  652. devices.push_back(device);
  653. return devices;
  654. }
  655. std::vector<AudioDeviceInfo> AudioCapturer::enumerateWASAPIDevices() const {
  656. std::vector<AudioDeviceInfo> devices;
  657. // 简化的WASAPI设备枚举
  658. AudioDeviceInfo device;
  659. device.id = "wasapi_default";
  660. device.name = "默认系统音频";
  661. device.description = "WASAPI系统音频设备";
  662. device.isDefault = true;
  663. device.isInput = false;
  664. // 添加常见采样率
  665. device.supportedSampleRates = {44100, 48000, 96000};
  666. // 添加常见声道数
  667. device.supportedChannels = {2, 6, 8};
  668. // 添加支持的采样格式
  669. device.supportedFormats = {
  670. AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_FLT
  671. };
  672. devices.push_back(device);
  673. return devices;
  674. }
  675. ErrorCode AudioCapturer::setupDirectSoundMicrophone() {
  676. AV_LOGGER_INFO("设置DirectSound麦克风");
  677. return openInputDevice();
  678. }
  679. ErrorCode AudioCapturer::setupWASAPISystemAudio() {
  680. AV_LOGGER_INFO("设置WASAPI系统音频");
  681. return openInputDevice();
  682. }
  683. #endif
  684. // AudioCaptureFactory 实现
  685. std::unique_ptr<AudioCapturer> AudioCapturer::AudioCaptureFactory::createMicrophone(int micIndex) {
  686. auto capturer = std::make_unique<AudioCapturer>();
  687. AudioCaptureParams params(CapturerType::AUDIO_MIC);
  688. params.micIndex = micIndex;
  689. ErrorCode result = capturer->initialize(params);
  690. if (result != ErrorCode::OK) {
  691. AV_LOGGER_ERRORF("创建麦克风采集器失败: {}", static_cast<int>(result));
  692. return nullptr;
  693. }
  694. return capturer;
  695. }
  696. std::unique_ptr<AudioCapturer> AudioCapturer::AudioCaptureFactory::createSystemAudio(bool loopback) {
  697. auto capturer = std::make_unique<AudioCapturer>();
  698. AudioCaptureParams params(loopback ? CapturerType::AUDIO_LOOPBACK : CapturerType::AUDIO_SYSTEM);
  699. params.captureLoopback = loopback;
  700. ErrorCode result = capturer->initialize(params);
  701. if (result != ErrorCode::OK) {
  702. AV_LOGGER_ERRORF("创建系统音频采集器失败: {}", static_cast<int>(result));
  703. return nullptr;
  704. }
  705. return capturer;
  706. }
  707. std::unique_ptr<AudioCapturer> AudioCapturer::AudioCaptureFactory::createBestMicrophone() {
  708. return createMicrophone(0); // 默认使用第一个麦克风
  709. }
  710. } // namespace capture
  711. } // namespace av