content/renderer/media/audio_repetition_detector.cc - Issue 1357013006: Add detection for repeated audio in capturing.

Side by Side Diff: content/renderer/media/audio_repetition_detector.cc

Issue 1357013006: Add detection for repeated audio in capturing. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: some small changes Created 5 years, 2 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

« content/renderer/media/audio_repetition_detector.h ('K') | « content/renderer/media/audio_repetition_detector.h ('k') | content/renderer/media/audio_repetition_detector_unittest.cc » ('j') | content/renderer/media/media_stream_audio_processor.h » ('J')
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

OLD	NEW
(Empty)
	1 // Copyright 2015 The Chromium Authors. All rights reserved.

	2 // Use of this source code is governed by a BSD-style license that can be

	3 // found in the LICENSE file.

	4

	5 #include "content/renderer/media/audio_repetition_detector.h"

	6

	7 #include "base/logging.h"

	8 #include "base/macros.h"

	9 #include "base/metrics/histogram_macros.h"

	10

	11 namespace content {

	12

	13 namespace {

	14

	// Patterns that the AudioRepetitionDetector constructor registers by default.
	// NOTE(review): each entry presumably reads {id, look_back_ms, min_length_ms};
	// the Pattern field order is declared in the header - confirm there.
	15 const AudioRepetitionDetector::Pattern kRepetitionPatterns[] = {

	16 {1, 10, 10},

	17 {2, 20, 10},

	18 {3, 30, 10},

	19 {4, 40, 10},

	20 {5, 50, 10},

	21 {6, 60, 10},

	22 {7, 70, 10},

	23 {8, 80, 10},

	24 {9, 90, 10},

	25 {10, 100, 10},

	26 {20, 200, 10},

	27 };

	28

	29 // This is used for increasing the efficiency of copying data into the buffer.

	30 // Input longer than |kMaxFrames| won't be a problem, and will be divided into

	31 // chunks automatically.

	32 const size_t kMaxFrames = 480; // 10 ms * 48 kHz

	33

	34 } // namespace

	35

	36 AudioRepetitionDetector::State::State(const Pattern &pattern)

	37 : pattern_(pattern) {

	38 Reset();

	39 }

	40

	41 void AudioRepetitionDetector::State::Increment(bool zero) {

	42 if (0 == count_frames_ && zero) {

	43 // If a repetition starts with zeros, we enter the all zero mode until

	44 // a non zero is found later. The point is that the beginning zeros should

	45 // be counted in the length of the repetition as long as the repetition does

	46 // not comprise only zeros.

	47 all_zero_ = true;

	48 }

	49 ++count_frames_;

	50 if (!zero)

	51 all_zero_ = false;

	52 }

	53

	54 bool AudioRepetitionDetector::State::HasValidReport(int sample_rate) const {

	55 return (!all_zero_ && count_frames_ >=

	56 static_cast<size_t>(pattern_.min_length_ms * sample_rate / 1000));

	57 }

	58

	59 void AudioRepetitionDetector::State::Reset() {

	60 count_frames_ = 0;

	61 all_zero_ = true;

	62 reported_ = false;

	63 }

	64

	65 AudioRepetitionDetector::AudioRepetitionDetector()

	66 : max_look_back_ms_(0),

	67 sample_rate_(0),

	68 buffer_size_frames_(0),

	69 buffer_end_index_(0),

	70 max_frames_(kMaxFrames) {

	71 RegisterRepetitionPatterns(kRepetitionPatterns,

	72 arraysize(kRepetitionPatterns));

	73 }

	74

	75 AudioRepetitionDetector::~AudioRepetitionDetector() {

	76 DCHECK(thread_checker_.CalledOnValidThread());

	77 }

	78

	79 void AudioRepetitionDetector::RegisterRepetitionPatterns(

	80 const Pattern* patterns, size_t num_patterns) {

	81 DCHECK(thread_checker_.CalledOnValidThread());

	82 Pattern pattern;

	83 for (size_t idx = 0; idx < num_patterns; idx++) {

	84 pattern = patterns[idx];

	85 ids_.push_back(pattern.id);

	86 states_.push_back(new State(pattern));

	87 if (pattern.look_back_ms > max_look_back_ms_)

	88 max_look_back_ms_ = pattern.look_back_ms;

	89 }

	90 }

	91

	92 void AudioRepetitionDetector::Reset(size_t num_channels, int sample_rate) {

	93 DCHECK(thread_checker_.CalledOnValidThread());

	94 num_channels_ = num_channels;

	95 sample_rate_ = sample_rate;

	96

	97 // \|(xxx + 999) / 1000\| is an arithmetic way to round up \|xxx / 1000\|.

	98 buffer_size_frames_ =

	99 (max_look_back_ms_ * sample_rate_ + 999) / 1000 + max_frames_;

	100

	101 audio_buffer_.resize(buffer_size_frames_ * num_channels_);

	102 for (auto state : states_)

	103 state->Reset();

	104 }

	105

	106 void AudioRepetitionDetector::AddFramesToBuffer(const float* data,

	107 size_t num_frames) {

	108 DCHECK(thread_checker_.CalledOnValidThread());

	109 DCHECK_LE(num_frames, buffer_size_frames_);

	110 const size_t margin = buffer_size_frames_ - buffer_end_index_;

	111 const auto it = audio_buffer_.begin() + buffer_end_index_ * num_channels_;

	112 if (num_frames <= margin) {

	113 std::copy(data, data + num_frames * num_channels_, it);

	114 buffer_end_index_ += num_frames;

	115 } else {

	116 std::copy(data, data + margin * num_channels_, it);

	117 std::copy(data + margin * num_channels_, data + num_frames * num_channels_,

	118 audio_buffer_.begin());

	119 buffer_end_index_ = num_frames - margin;

	120 }

	121 }

	122

	123 bool AudioRepetitionDetector::Equal(const float* frame,

	124 int look_back_frames) const {

	125 DCHECK(thread_checker_.CalledOnValidThread());

	126 const size_t look_back_index =

	127 (buffer_end_index_ + buffer_size_frames_ - look_back_frames) %

	128 buffer_size_frames_ ;

	129 auto it = audio_buffer_.begin() + look_back_index * num_channels_;

	130 for (size_t channel = 0; channel < num_channels_; ++channel, ++frame, ++it) {

	131 if (frame != it)

	132 return false;

	133 }

	134 return true;

	135 }

	136

	137 bool AudioRepetitionDetector::IsZero(const float* frame,

	138 size_t num_channels) const {

	139 for (size_t channel = 0; channel < num_channels; ++channel, ++frame) {

	140 if (*frame != 0)

	141 return false;

	142 }

	143 return true;

	144 }

	145

	146 void AudioRepetitionDetector::Detect(const float* data, size_t num_frames,

	147 size_t num_channels, int sample_rate) {

	148 DCHECK(thread_checker_.CalledOnValidThread());

	149 DCHECK_GT(states_.size(), 0ul);

	150 if (num_channels != num_channels_ \|\| sample_rate != sample_rate_)

	151 Reset(num_channels, sample_rate);

	152

	153 // The maximum number of frames \|audio_buffer_\| can take in is \|max_frames_\|.

	154 // Therefore, input data with larger frames needs be divided into trunks.
	ajm 2015/09/30 00:23:43 s/trunks/chunks s/trunks/chunks
	155 while (num_frames > max_frames_) {

	156 Detect(data, max_frames_, num_channels, sample_rate);

	157 data += max_frames_ * num_channels;

	158 num_frames -= max_frames_;

	159 }

	160

	161 if (num_frames == 0)

	162 return;

	163

	164 AddFramesToBuffer(data, num_frames);

	165

	166 for (size_t idx = num_frames; idx > 0; --idx, data += num_channels) {

	167 for (auto state : states_) {

	168 // Look back position depends on the sample rate. It is rounded down to

	169 // the closest integer.

	170 const size_t look_back_frames =

	171 state->look_back_ms() * sample_rate_ / 1000;

	172 // Equal(data, offset) checks if \|data\| equals the audio frame located

	173 // \|offset\| frames from the end of buffer. Now a full frame has been

	174 // inserted to the buffer, and thus \|offset\| should compensate for it.

	175 if (Equal(data, look_back_frames + idx)) {

	176 if (!state->reported()) {

	177 state->Increment(IsZero(data, num_channels));

	178 if (state->HasValidReport(sample_rate)) {

	179 ReportRepetition(state->id());

	180 state->set_reported(true);

	181 }

	182 }

	183 } else {

	184 state->Reset();

	185 }

	186 }

	187 }

	188 }

	189

	190 void AudioRepetitionDetector::ReportRepetition(int id) {

	191 DCHECK(thread_checker_.CalledOnValidThread());

	192 UMA_HISTOGRAM_CUSTOM_ENUMERATION(

	193 "Media.AudioCapturerRepetition", id, ids_);

	194 }

	195

	196 } // namespace content

OLD	NEW