Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

104 lines
3.4 KiB
C
Raw Normal View History

/*
* Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
*
* Use of this source code is governed by a BSD-style license
* that can be found in the LICENSE file in the root of the source
* tree. An additional intellectual property rights grant can be found
* in the file PATENTS. All contributing project authors may
* be found in the AUTHORS file in the root of the source tree.
*/
#ifndef MODULES_AUDIO_PROCESSING_TEST_CONVERSATIONAL_SPEECH_MULTIEND_CALL_H_
#define MODULES_AUDIO_PROCESSING_TEST_CONVERSATIONAL_SPEECH_MULTIEND_CALL_H_
#include <stddef.h>
#include <map>
#include <memory>
#include <set>
#include <string>
#include <utility>
#include <vector>
#include "api/array_view.h"
#include "modules/audio_processing/test/conversational_speech/timing.h"
#include "modules/audio_processing/test/conversational_speech/wavreader_abstract_factory.h"
#include "modules/audio_processing/test/conversational_speech/wavreader_interface.h"
namespace webrtc {
namespace test {
namespace conversational_speech {
class MultiEndCall {
public:
struct SpeakingTurn {
// Constructor required in order to use std::vector::emplace_back().
SpeakingTurn(std::string new_speaker_name,
std::string new_audiotrack_file_name,
size_t new_begin,
size_t new_end,
int gain)
: speaker_name(std::move(new_speaker_name)),
audiotrack_file_name(std::move(new_audiotrack_file_name)),
begin(new_begin),
end(new_end),
gain(gain) {}
std::string speaker_name;
std::string audiotrack_file_name;
size_t begin;
size_t end;
int gain;
};
MultiEndCall(
rtc::ArrayView<const Turn> timing,
const std::string& audiotracks_path,
std::unique_ptr<WavReaderAbstractFactory> wavreader_abstract_factory);
~MultiEndCall();
MultiEndCall(const MultiEndCall&) = delete;
MultiEndCall& operator=(const MultiEndCall&) = delete;
Reland of Conversational speech tool, simualtor + unit tests (patchset #1 id:1 of https://codereview.webrtc.org/2925123003/ ) Reason for revert: Build file causing google3 compilation error fixed Original issue's description: > Revert of Conversational speech tool, simualtor + unit tests (patchset #12 id:220001 of https://codereview.webrtc.org/2790933002/ ) > > Reason for revert: > Compile Error. > > Original issue's description: > > The simulator puts into action the schedule of speech turns encoded in a MultiEndCall instance. The output is a set of audio track pairs. There is one set for each speaker and each set contains one near-end and one far-end audio track. The tracks are directly written into wav files instead of creating them in memory. To speed up the creation of the output wav files, *all* the source audio tracks (i.e., the atomic speech turns) are pre-loaded. > > > > The ConversationalSpeechTest.MultiEndCallSimulator unit test defines a conversational speech sequence and creates two wav files (with pure tones at 440 and 880 Hz) that are used as atomic speech turn tracks. > > > > This CL also patches MultiEndCall in order to allow input audio tracks with same sample rate and single channel only. > > > > BUG=webrtc:7218 > > > > Review-Url: https://codereview.webrtc.org/2790933002 > > Cr-Commit-Position: refs/heads/master@{#18480} > > Committed: https://chromium.googlesource.com/external/webrtc/+/6b648c4697cede14605fd2b89425866eec5f7c79 > > TBR=minyue@webrtc.org,alessiob@webrtc.org > # Skipping CQ checks because original CL landed less than 1 days ago. > NOPRESUBMIT=true > NOTREECHECKS=true > NOTRY=true > BUG=webrtc:7218 > > Review-Url: https://codereview.webrtc.org/2925123003 > Cr-Commit-Position: refs/heads/master@{#18481} > Committed: https://chromium.googlesource.com/external/webrtc/+/4c72cf43dfda9255468102ce4b4c520571d8f455 TBR=minyue@webrtc.org,charujain@webrtc.org # Skipping CQ checks because original CL landed less than 1 days ago. NOPRESUBMIT=true NOTREECHECKS=true NOTRY=true BUG=webrtc:7218 Review-Url: https://codereview.webrtc.org/2930853002 Cr-Commit-Position: refs/heads/master@{#18606}
2017-06-15 02:24:59 -07:00
const std::set<std::string>& speaker_names() const { return speaker_names_; }
const std::map<std::string, std::unique_ptr<WavReaderInterface>>&
Reland of Conversational speech tool, simualtor + unit tests (patchset #1 id:1 of https://codereview.webrtc.org/2925123003/ ) Reason for revert: Build file causing google3 compilation error fixed Original issue's description: > Revert of Conversational speech tool, simualtor + unit tests (patchset #12 id:220001 of https://codereview.webrtc.org/2790933002/ ) > > Reason for revert: > Compile Error. > > Original issue's description: > > The simulator puts into action the schedule of speech turns encoded in a MultiEndCall instance. The output is a set of audio track pairs. There is one set for each speaker and each set contains one near-end and one far-end audio track. The tracks are directly written into wav files instead of creating them in memory. To speed up the creation of the output wav files, *all* the source audio tracks (i.e., the atomic speech turns) are pre-loaded. > > > > The ConversationalSpeechTest.MultiEndCallSimulator unit test defines a conversational speech sequence and creates two wav files (with pure tones at 440 and 880 Hz) that are used as atomic speech turn tracks. > > > > This CL also patches MultiEndCall in order to allow input audio tracks with same sample rate and single channel only. > > > > BUG=webrtc:7218 > > > > Review-Url: https://codereview.webrtc.org/2790933002 > > Cr-Commit-Position: refs/heads/master@{#18480} > > Committed: https://chromium.googlesource.com/external/webrtc/+/6b648c4697cede14605fd2b89425866eec5f7c79 > > TBR=minyue@webrtc.org,alessiob@webrtc.org > # Skipping CQ checks because original CL landed less than 1 days ago. > NOPRESUBMIT=true > NOTREECHECKS=true > NOTRY=true > BUG=webrtc:7218 > > Review-Url: https://codereview.webrtc.org/2925123003 > Cr-Commit-Position: refs/heads/master@{#18481} > Committed: https://chromium.googlesource.com/external/webrtc/+/4c72cf43dfda9255468102ce4b4c520571d8f455 TBR=minyue@webrtc.org,charujain@webrtc.org # Skipping CQ checks because original CL landed less than 1 days ago. NOPRESUBMIT=true NOTREECHECKS=true NOTRY=true BUG=webrtc:7218 Review-Url: https://codereview.webrtc.org/2930853002 Cr-Commit-Position: refs/heads/master@{#18606}
2017-06-15 02:24:59 -07:00
audiotrack_readers() const {
return audiotrack_readers_;
}
bool valid() const { return valid_; }
int sample_rate() const { return sample_rate_hz_; }
size_t total_duration_samples() const { return total_duration_samples_; }
const std::vector<SpeakingTurn>& speaking_turns() const {
return speaking_turns_;
}
private:
// Finds unique speaker names.
void FindSpeakerNames();
Reland of Conversational speech tool, simualtor + unit tests (patchset #1 id:1 of https://codereview.webrtc.org/2925123003/ ) Reason for revert: Build file causing google3 compilation error fixed Original issue's description: > Revert of Conversational speech tool, simualtor + unit tests (patchset #12 id:220001 of https://codereview.webrtc.org/2790933002/ ) > > Reason for revert: > Compile Error. > > Original issue's description: > > The simulator puts into action the schedule of speech turns encoded in a MultiEndCall instance. The output is a set of audio track pairs. There is one set for each speaker and each set contains one near-end and one far-end audio track. The tracks are directly written into wav files instead of creating them in memory. To speed up the creation of the output wav files, *all* the source audio tracks (i.e., the atomic speech turns) are pre-loaded. > > > > The ConversationalSpeechTest.MultiEndCallSimulator unit test defines a conversational speech sequence and creates two wav files (with pure tones at 440 and 880 Hz) that are used as atomic speech turn tracks. > > > > This CL also patches MultiEndCall in order to allow input audio tracks with same sample rate and single channel only. > > > > BUG=webrtc:7218 > > > > Review-Url: https://codereview.webrtc.org/2790933002 > > Cr-Commit-Position: refs/heads/master@{#18480} > > Committed: https://chromium.googlesource.com/external/webrtc/+/6b648c4697cede14605fd2b89425866eec5f7c79 > > TBR=minyue@webrtc.org,alessiob@webrtc.org > # Skipping CQ checks because original CL landed less than 1 days ago. > NOPRESUBMIT=true > NOTREECHECKS=true > NOTRY=true > BUG=webrtc:7218 > > Review-Url: https://codereview.webrtc.org/2925123003 > Cr-Commit-Position: refs/heads/master@{#18481} > Committed: https://chromium.googlesource.com/external/webrtc/+/4c72cf43dfda9255468102ce4b4c520571d8f455 TBR=minyue@webrtc.org,charujain@webrtc.org # Skipping CQ checks because original CL landed less than 1 days ago. NOPRESUBMIT=true NOTREECHECKS=true NOTRY=true BUG=webrtc:7218 Review-Url: https://codereview.webrtc.org/2930853002 Cr-Commit-Position: refs/heads/master@{#18606}
2017-06-15 02:24:59 -07:00
// Creates one WavReader instance for each unique audiotrack. It returns false
// if the audio tracks do not have the same sample rate or if they are not
// mono.
bool CreateAudioTrackReaders();
// Validates the speaking turns timing information. Accepts cross-talk, but
// only up to 2 speakers. Rejects unordered turns and self cross-talk.
bool CheckTiming();
rtc::ArrayView<const Turn> timing_;
const std::string& audiotracks_path_;
std::unique_ptr<WavReaderAbstractFactory> wavreader_abstract_factory_;
std::set<std::string> speaker_names_;
std::map<std::string, std::unique_ptr<WavReaderInterface>>
audiotrack_readers_;
bool valid_;
Reland of Conversational speech tool, simualtor + unit tests (patchset #1 id:1 of https://codereview.webrtc.org/2925123003/ ) Reason for revert: Build file causing google3 compilation error fixed Original issue's description: > Revert of Conversational speech tool, simualtor + unit tests (patchset #12 id:220001 of https://codereview.webrtc.org/2790933002/ ) > > Reason for revert: > Compile Error. > > Original issue's description: > > The simulator puts into action the schedule of speech turns encoded in a MultiEndCall instance. The output is a set of audio track pairs. There is one set for each speaker and each set contains one near-end and one far-end audio track. The tracks are directly written into wav files instead of creating them in memory. To speed up the creation of the output wav files, *all* the source audio tracks (i.e., the atomic speech turns) are pre-loaded. > > > > The ConversationalSpeechTest.MultiEndCallSimulator unit test defines a conversational speech sequence and creates two wav files (with pure tones at 440 and 880 Hz) that are used as atomic speech turn tracks. > > > > This CL also patches MultiEndCall in order to allow input audio tracks with same sample rate and single channel only. > > > > BUG=webrtc:7218 > > > > Review-Url: https://codereview.webrtc.org/2790933002 > > Cr-Commit-Position: refs/heads/master@{#18480} > > Committed: https://chromium.googlesource.com/external/webrtc/+/6b648c4697cede14605fd2b89425866eec5f7c79 > > TBR=minyue@webrtc.org,alessiob@webrtc.org > # Skipping CQ checks because original CL landed less than 1 days ago. > NOPRESUBMIT=true > NOTREECHECKS=true > NOTRY=true > BUG=webrtc:7218 > > Review-Url: https://codereview.webrtc.org/2925123003 > Cr-Commit-Position: refs/heads/master@{#18481} > Committed: https://chromium.googlesource.com/external/webrtc/+/4c72cf43dfda9255468102ce4b4c520571d8f455 TBR=minyue@webrtc.org,charujain@webrtc.org # Skipping CQ checks because original CL landed less than 1 days ago. NOPRESUBMIT=true NOTREECHECKS=true NOTRY=true BUG=webrtc:7218 Review-Url: https://codereview.webrtc.org/2930853002 Cr-Commit-Position: refs/heads/master@{#18606}
2017-06-15 02:24:59 -07:00
int sample_rate_hz_;
size_t total_duration_samples_;
std::vector<SpeakingTurn> speaking_turns_;
};
} // namespace conversational_speech
} // namespace test
} // namespace webrtc
#endif // MODULES_AUDIO_PROCESSING_TEST_CONVERSATIONAL_SPEECH_MULTIEND_CALL_H_