1// Copyright 2013 The Chromium Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
5#include <list>
6
7#include "base/bind.h"
8#include "base/memory/scoped_ptr.h"
9#include "base/run_loop.h"
10#include "base/strings/utf_string_conversions.h"
11#include "content/browser/speech/google_streaming_remote_engine.h"
12#include "content/browser/speech/speech_recognition_manager_impl.h"
13#include "content/browser/speech/speech_recognizer_impl.h"
14#include "content/public/browser/browser_thread.h"
15#include "content/public/browser/notification_types.h"
16#include "content/public/browser/web_contents.h"
17#include "content/public/test/browser_test_utils.h"
18#include "content/public/test/test_utils.h"
19#include "content/shell/browser/shell.h"
20#include "content/test/content_browser_test.h"
21#include "content/test/content_browser_test_utils.h"
22#include "content/test/mock_google_streaming_server.h"
23#include "media/audio/mock_audio_manager.h"
24#include "media/audio/test_audio_input_controller_factory.h"
25#include "testing/gtest/include/gtest/gtest.h"
26
27using base::RunLoop;
28
29namespace content {
30
31class SpeechRecognitionBrowserTest :
32    public ContentBrowserTest,
33    public MockGoogleStreamingServer::Delegate,
34    public media::TestAudioInputControllerDelegate {
35 public:
36  enum StreamingServerState {
37    kIdle,
38    kTestAudioControllerOpened,
39    kClientConnected,
40    kClientAudioUpload,
41    kClientAudioUploadComplete,
42    kTestAudioControllerClosed,
43    kClientDisconnected
44  };
45
46  // MockGoogleStreamingServerDelegate methods.
47  virtual void OnClientConnected() OVERRIDE {
48    ASSERT_EQ(kTestAudioControllerOpened, streaming_server_state_);
49    streaming_server_state_ = kClientConnected;
50  }
51
52  virtual void OnClientAudioUpload() OVERRIDE {
53    if (streaming_server_state_ == kClientConnected)
54      streaming_server_state_ = kClientAudioUpload;
55  }
56
57  virtual void OnClientAudioUploadComplete() OVERRIDE {
58    ASSERT_EQ(kTestAudioControllerClosed, streaming_server_state_);
59    streaming_server_state_ = kClientAudioUploadComplete;
60  }
61
62  virtual void OnClientDisconnected() OVERRIDE {
63    ASSERT_EQ(kClientAudioUploadComplete, streaming_server_state_);
64    streaming_server_state_ = kClientDisconnected;
65  }
66
67  // media::TestAudioInputControllerDelegate methods.
68  virtual void TestAudioControllerOpened(
69      media::TestAudioInputController* controller) OVERRIDE {
70    ASSERT_EQ(kIdle, streaming_server_state_);
71    streaming_server_state_ = kTestAudioControllerOpened;
72    const int capture_packet_interval_ms =
73        (1000 * controller->audio_parameters().frames_per_buffer()) /
74        controller->audio_parameters().sample_rate();
75    ASSERT_EQ(GoogleStreamingRemoteEngine::kAudioPacketIntervalMs,
76        capture_packet_interval_ms);
77    FeedAudioController(500 /* ms */, /*noise=*/ false);
78    FeedAudioController(1000 /* ms */, /*noise=*/ true);
79    FeedAudioController(1000 /* ms */, /*noise=*/ false);
80  }
81
82  virtual void TestAudioControllerClosed(
83      media::TestAudioInputController* controller) OVERRIDE {
84    ASSERT_EQ(kClientAudioUpload, streaming_server_state_);
85    streaming_server_state_ = kTestAudioControllerClosed;
86    mock_streaming_server_->MockGoogleStreamingServer::SimulateResult(
87        GetGoodSpeechResult());
88  }
89
90  // Helper methods used by test fixtures.
91  GURL GetTestUrlFromFragment(const std::string fragment) {
92    return GURL(GetTestUrl("speech", "web_speech_recognition.html").spec() +
93        "#" + fragment);
94  }
95
96  std::string GetPageFragment() {
97    return shell()->web_contents()->GetURL().ref();
98  }
99
100  const StreamingServerState &streaming_server_state() {
101    return streaming_server_state_;
102  }
103
104 protected:
105  // ContentBrowserTest methods.
106  virtual void SetUpInProcessBrowserTestFixture() OVERRIDE {
107    test_audio_input_controller_factory_.set_delegate(this);
108    media::AudioInputController::set_factory_for_testing(
109        &test_audio_input_controller_factory_);
110    mock_streaming_server_.reset(new MockGoogleStreamingServer(this));
111    streaming_server_state_ = kIdle;
112  }
113
114  virtual void SetUpOnMainThread() OVERRIDE {
115    ASSERT_TRUE(SpeechRecognitionManagerImpl::GetInstance());
116    SpeechRecognizerImpl::SetAudioManagerForTesting(
117        new media::MockAudioManager(BrowserThread::GetMessageLoopProxyForThread(
118            BrowserThread::IO)));
119  }
120
121  virtual void TearDownOnMainThread() OVERRIDE {
122    SpeechRecognizerImpl::SetAudioManagerForTesting(NULL);
123  }
124
125  virtual void TearDownInProcessBrowserTestFixture() OVERRIDE {
126    test_audio_input_controller_factory_.set_delegate(NULL);
127    mock_streaming_server_.reset();
128  }
129
130 private:
131  static void FeedSingleBufferToAudioController(
132      scoped_refptr<media::TestAudioInputController> controller,
133      size_t buffer_size,
134      bool fill_with_noise) {
135    DCHECK(controller.get());
136    scoped_ptr<uint8[]> audio_buffer(new uint8[buffer_size]);
137    if (fill_with_noise) {
138      for (size_t i = 0; i < buffer_size; ++i)
139        audio_buffer[i] = static_cast<uint8>(127 * sin(i * 3.14F /
140            (16 * buffer_size)));
141    } else {
142      memset(audio_buffer.get(), 0, buffer_size);
143    }
144    controller->event_handler()->OnData(controller,
145                                        audio_buffer.get(),
146                                        buffer_size);
147  }
148
149  void FeedAudioController(int duration_ms, bool feed_with_noise) {
150    media::TestAudioInputController* controller =
151        test_audio_input_controller_factory_.controller();
152    ASSERT_TRUE(controller);
153    const media::AudioParameters& audio_params = controller->audio_parameters();
154    const size_t buffer_size = audio_params.GetBytesPerBuffer();
155    const int ms_per_buffer = audio_params.frames_per_buffer() * 1000 /
156                              audio_params.sample_rate();
157    // We can only simulate durations that are integer multiples of the
158    // buffer size. In this regard see
159    // SpeechRecognitionEngine::GetDesiredAudioChunkDurationMs().
160    ASSERT_EQ(0, duration_ms % ms_per_buffer);
161
162    const int n_buffers = duration_ms / ms_per_buffer;
163    for (int i = 0; i < n_buffers; ++i) {
164      base::MessageLoop::current()->PostTask(FROM_HERE, base::Bind(
165          &FeedSingleBufferToAudioController,
166          scoped_refptr<media::TestAudioInputController>(controller),
167          buffer_size,
168          feed_with_noise));
169    }
170  }
171
172  SpeechRecognitionResult GetGoodSpeechResult() {
173    SpeechRecognitionResult result;
174    result.hypotheses.push_back(SpeechRecognitionHypothesis(
175        UTF8ToUTF16("Pictures of the moon"), 1.0F));
176    return result;
177  }
178
179  StreamingServerState streaming_server_state_;
180  scoped_ptr<MockGoogleStreamingServer> mock_streaming_server_;
181  media::TestAudioInputControllerFactory test_audio_input_controller_factory_;
182};
183
184// Simply loads the test page and checks if it was able to create a Speech
185// Recognition object in JavaScript, to make sure the Web Speech API is enabled.
186IN_PROC_BROWSER_TEST_F(SpeechRecognitionBrowserTest, Precheck) {
187  NavigateToURLBlockUntilNavigationsComplete(
188      shell(), GetTestUrlFromFragment("precheck"), 2);
189
190  EXPECT_EQ(kIdle, streaming_server_state());
191  EXPECT_EQ("success", GetPageFragment());
192}
193
194IN_PROC_BROWSER_TEST_F(SpeechRecognitionBrowserTest, OneShotRecognition) {
195  NavigateToURLBlockUntilNavigationsComplete(
196      shell(), GetTestUrlFromFragment("oneshot"), 2);
197
198  EXPECT_EQ(kClientDisconnected, streaming_server_state());
199  EXPECT_EQ("goodresult1", GetPageFragment());
200}
201
202}  // namespace content
203