Adding instrumentation to locate the source of jankiness
[chromium-blink-merge.git] / chrome / browser / process_singleton_browsertest.cc
blob4a682a239a88d29cac923a371a47f814b76e6440
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 // This test validates that the ProcessSingleton class properly makes sure
6 // that there is only one main browser process.
7 //
8 // It is currently compiled and run on Windows and Posix(non-Mac) platforms.
9 // Mac uses system services and ProcessSingletonMac is a noop. (Maybe it still
10 // makes sense to test that the system services are giving the behavior we
11 // want?)
13 #include "base/bind.h"
14 #include "base/command_line.h"
15 #include "base/files/file_path.h"
16 #include "base/files/scoped_temp_dir.h"
17 #include "base/memory/ref_counted.h"
18 #include "base/path_service.h"
19 #include "base/process/kill.h"
20 #include "base/process/launch.h"
21 #include "base/process/process_iterator.h"
22 #include "base/synchronization/waitable_event.h"
23 #include "base/test/test_timeouts.h"
24 #include "base/threading/thread.h"
25 #include "chrome/common/chrome_constants.h"
26 #include "chrome/common/chrome_paths.h"
27 #include "chrome/common/chrome_switches.h"
28 #include "chrome/test/base/in_process_browser_test.h"
29 #include "chrome/test/base/test_launcher_utils.h"
31 namespace {
33 // This is for the code that is to be ran in multiple threads at once,
34 // to stress a race condition on first process start.
35 // We use the thread safe ref counted base class so that we can use the
36 // base::Bind to run the StartChrome methods in many threads.
37 class ChromeStarter : public base::RefCountedThreadSafe<ChromeStarter> {
38 public:
39 ChromeStarter(base::TimeDelta timeout, const base::FilePath& user_data_dir)
40 : ready_event_(false /* manual */, false /* signaled */),
41 done_event_(false /* manual */, false /* signaled */),
42 process_handle_(base::kNullProcessHandle),
43 process_terminated_(false),
44 timeout_(timeout),
45 user_data_dir_(user_data_dir) {
48 // We must reset some data members since we reuse the same ChromeStarter
49 // object and start/stop it a few times. We must start fresh! :-)
50 void Reset() {
51 ready_event_.Reset();
52 done_event_.Reset();
53 if (process_handle_ != base::kNullProcessHandle)
54 base::CloseProcessHandle(process_handle_);
55 process_handle_ = base::kNullProcessHandle;
56 process_terminated_ = false;
59 void StartChrome(base::WaitableEvent* start_event, bool first_run) {
60 // TODO(mattm): maybe stuff should be refactored to use
61 // UITest::LaunchBrowserHelper somehow?
62 base::FilePath program;
63 ASSERT_TRUE(PathService::Get(base::FILE_EXE, &program));
64 CommandLine command_line(program);
65 command_line.AppendSwitchPath(switches::kUserDataDir, user_data_dir_);
67 if (first_run)
68 command_line.AppendSwitch(switches::kForceFirstRun);
69 else
70 command_line.AppendSwitch(switches::kNoFirstRun);
72 // Add the normal test-mode switches, except for the ones we're adding
73 // ourselves.
74 CommandLine standard_switches(CommandLine::NO_PROGRAM);
75 test_launcher_utils::PrepareBrowserCommandLineForTests(&standard_switches);
76 const CommandLine::SwitchMap& switch_map = standard_switches.GetSwitches();
77 for (CommandLine::SwitchMap::const_iterator i = switch_map.begin();
78 i != switch_map.end(); ++i) {
79 const std::string& switch_name = i->first;
80 if (switch_name == switches::kUserDataDir ||
81 switch_name == switches::kForceFirstRun ||
82 switch_name == switches::kNoFirstRun)
83 continue;
85 command_line.AppendSwitchNative(switch_name, i->second);
88 // Try to get all threads to launch the app at the same time.
89 // So let the test know we are ready.
90 ready_event_.Signal();
91 // And then wait for the test to tell us to GO!
92 ASSERT_NE(static_cast<base::WaitableEvent*>(NULL), start_event);
93 start_event->Wait();
95 // Here we don't wait for the app to be terminated because one of the
96 // process will stay alive while the others will be restarted. If we would
97 // wait here, we would never get a handle to the main process...
98 base::LaunchProcess(command_line, base::LaunchOptions(), &process_handle_);
99 ASSERT_NE(base::kNullProcessHandle, process_handle_);
101 // We can wait on the handle here, we should get stuck on one and only
102 // one process. The test below will take care of killing that process
103 // to unstuck us once it confirms there is only one.
104 process_terminated_ = base::WaitForSingleProcess(process_handle_,
105 timeout_);
106 // Let the test know we are done.
107 done_event_.Signal();
110 // Public access to simplify the test code using them.
111 base::WaitableEvent ready_event_;
112 base::WaitableEvent done_event_;
113 base::ProcessHandle process_handle_;
114 bool process_terminated_;
116 private:
117 friend class base::RefCountedThreadSafe<ChromeStarter>;
119 ~ChromeStarter() {
120 if (process_handle_ != base::kNullProcessHandle)
121 base::CloseProcessHandle(process_handle_);
124 base::TimeDelta timeout_;
125 base::FilePath user_data_dir_;
127 DISALLOW_COPY_AND_ASSIGN(ChromeStarter);
130 } // namespace
132 // Our test fixture that initializes and holds onto a few global vars.
133 class ProcessSingletonTest : public InProcessBrowserTest {
134 public:
135 ProcessSingletonTest()
136 // We use a manual reset so that all threads wake up at once when signaled
137 // and thus we must manually reset it for each attempt.
138 : threads_waker_(true /* manual */, false /* signaled */) {
139 EXPECT_TRUE(temp_profile_dir_.CreateUniqueTempDir());
142 virtual void SetUp() {
143 // Start the threads and create the starters.
144 for (size_t i = 0; i < kNbThreads; ++i) {
145 chrome_starter_threads_[i].reset(new base::Thread("ChromeStarter"));
146 ASSERT_TRUE(chrome_starter_threads_[i]->Start());
147 chrome_starters_[i] = new ChromeStarter(
148 TestTimeouts::action_max_timeout(), temp_profile_dir_.path());
152 virtual void TearDown() {
153 // Stop the threads.
154 for (size_t i = 0; i < kNbThreads; ++i)
155 chrome_starter_threads_[i]->Stop();
158 // This method is used to make sure we kill the main browser process after
159 // all of its child processes have successfully attached to it. This was added
160 // when we realized that if we just kill the parent process right away, we
161 // sometimes end up with dangling child processes. If we Sleep for a certain
162 // amount of time, we are OK... So we introduced this method to avoid a
163 // flaky wait. Instead, we kill all descendants of the main process after we
164 // killed it, relying on the fact that we can still get the parent id of a
165 // child process, even when the parent dies.
166 void KillProcessTree(base::ProcessHandle process_handle) {
167 class ProcessTreeFilter : public base::ProcessFilter {
168 public:
169 explicit ProcessTreeFilter(base::ProcessId parent_pid) {
170 ancestor_pids_.insert(parent_pid);
172 virtual bool Includes(const base::ProcessEntry & entry) const override {
173 if (ancestor_pids_.find(entry.parent_pid()) != ancestor_pids_.end()) {
174 ancestor_pids_.insert(entry.pid());
175 return true;
176 } else {
177 return false;
180 private:
181 mutable std::set<base::ProcessId> ancestor_pids_;
182 } process_tree_filter(base::GetProcId(process_handle));
184 // Start by explicitly killing the main process we know about...
185 static const int kExitCode = 42;
186 EXPECT_TRUE(base::KillProcess(process_handle, kExitCode, true /* wait */));
188 // Then loop until we can't find any of its descendant.
189 // But don't try more than kNbTries times...
190 static const int kNbTries = 10;
191 int num_tries = 0;
192 base::FilePath program;
193 ASSERT_TRUE(PathService::Get(base::FILE_EXE, &program));
194 base::FilePath::StringType exe_name = program.BaseName().value();
195 while (base::GetProcessCount(exe_name, &process_tree_filter) > 0 &&
196 num_tries++ < kNbTries) {
197 base::KillProcesses(exe_name, kExitCode, &process_tree_filter);
199 DLOG_IF(ERROR, num_tries >= kNbTries) << "Failed to kill all processes!";
202 // Since this is a hard to reproduce problem, we make a few attempts.
203 // We stop the attempts at the first error, and when there are no errors,
204 // we don't time-out of any wait, so it executes quite fast anyway.
205 static const size_t kNbAttempts = 5;
207 // The idea is to start chrome from multiple threads all at once.
208 static const size_t kNbThreads = 5;
209 scoped_refptr<ChromeStarter> chrome_starters_[kNbThreads];
210 scoped_ptr<base::Thread> chrome_starter_threads_[kNbThreads];
212 // The event that will get all threads to wake up simultaneously and try
213 // to start a chrome process at the same time.
214 base::WaitableEvent threads_waker_;
216 // We don't want to use the default profile, but can't use UITest's since we
217 // don't use UITest::LaunchBrowser.
218 base::ScopedTempDir temp_profile_dir_;
221 #if defined(OS_LINUX) && defined(TOOLKIT_VIEWS)
222 // http://crbug.com/58219
223 #define MAYBE_StartupRaceCondition DISABLED_StartupRaceCondition
224 #else
225 #define MAYBE_StartupRaceCondition StartupRaceCondition
226 #endif
227 IN_PROC_BROWSER_TEST_F(ProcessSingletonTest, MAYBE_StartupRaceCondition) {
228 // We use this to stop the attempts loop on the first failure.
229 bool failed = false;
230 for (size_t attempt = 0; attempt < kNbAttempts && !failed; ++attempt) {
231 SCOPED_TRACE(testing::Message() << "Attempt: " << attempt << ".");
232 // We use a single event to get all threads to do the AppLaunch at the same
233 // time...
234 threads_waker_.Reset();
236 // Test both with and without the first-run dialog, since they exercise
237 // different paths.
238 #if defined(OS_POSIX)
239 // TODO(mattm): test first run dialog singleton handling on linux too.
240 // On posix if we test the first run dialog, GracefulShutdownHandler gets
241 // the TERM signal, but since the message loop isn't running during the gtk
242 // first run dialog, the ShutdownDetector never handles it, and KillProcess
243 // has to time out (60 sec!) and SIGKILL.
244 bool first_run = false;
245 #else
246 // Test for races in both regular start up and first run start up cases.
247 bool first_run = attempt % 2;
248 #endif
250 // Here we prime all the threads with a ChromeStarter that will wait for
251 // our signal to launch its chrome process.
252 for (size_t i = 0; i < kNbThreads; ++i) {
253 ASSERT_NE(static_cast<ChromeStarter*>(NULL), chrome_starters_[i].get());
254 chrome_starters_[i]->Reset();
256 ASSERT_TRUE(chrome_starter_threads_[i]->IsRunning());
257 ASSERT_NE(static_cast<base::MessageLoop*>(NULL),
258 chrome_starter_threads_[i]->message_loop());
260 chrome_starter_threads_[i]->message_loop()->PostTask(
261 FROM_HERE, base::Bind(&ChromeStarter::StartChrome,
262 chrome_starters_[i].get(),
263 &threads_waker_,
264 first_run));
267 // Wait for all the starters to be ready.
268 // We could replace this loop if we ever implement a WaitAll().
269 for (size_t i = 0; i < kNbThreads; ++i) {
270 SCOPED_TRACE(testing::Message() << "Waiting on thread: " << i << ".");
271 chrome_starters_[i]->ready_event_.Wait();
273 // GO!
274 threads_waker_.Signal();
276 // As we wait for all threads to signal that they are done, we remove their
277 // index from this vector so that we get left with only the index of
278 // the thread that started the main process.
279 std::vector<size_t> pending_starters(kNbThreads);
280 for (size_t i = 0; i < kNbThreads; ++i)
281 pending_starters[i] = i;
283 // We use a local array of starter's done events we must wait on...
284 // These are collected from the starters that we have not yet been removed
285 // from the pending_starters vector.
286 base::WaitableEvent* starters_done_events[kNbThreads];
287 // At the end, "There can be only one" main browser process alive.
288 while (pending_starters.size() > 1) {
289 SCOPED_TRACE(testing::Message() << pending_starters.size() <<
290 " starters left.");
291 for (size_t i = 0; i < pending_starters.size(); ++i) {
292 starters_done_events[i] =
293 &chrome_starters_[pending_starters[i]]->done_event_;
295 size_t done_index = base::WaitableEvent::WaitMany(
296 starters_done_events, pending_starters.size());
297 size_t starter_index = pending_starters[done_index];
298 // If the starter is done but has not marked itself as terminated,
299 // it is because it timed out of its WaitForSingleProcess(). Only the
300 // last one standing should be left waiting... So we failed...
301 EXPECT_TRUE(chrome_starters_[starter_index]->process_terminated_ ||
302 failed) << "There is more than one main process.";
303 if (!chrome_starters_[starter_index]->process_terminated_) {
304 // This will stop the "for kNbAttempts" loop.
305 failed = true;
306 // But we let the last loop turn finish so that we can properly
307 // kill all remaining processes. Starting with this one...
308 if (chrome_starters_[starter_index]->process_handle_ !=
309 base::kNullProcessHandle) {
310 KillProcessTree(chrome_starters_[starter_index]->process_handle_);
313 pending_starters.erase(pending_starters.begin() + done_index);
316 // "There can be only one!" :-)
317 ASSERT_EQ(static_cast<size_t>(1), pending_starters.size());
318 size_t last_index = pending_starters.front();
319 pending_starters.clear();
320 if (chrome_starters_[last_index]->process_handle_ !=
321 base::kNullProcessHandle) {
322 KillProcessTree(chrome_starters_[last_index]->process_handle_);
323 chrome_starters_[last_index]->done_event_.Wait();