1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 #include "net/socket/tcp_client_socket_win.h"
9 #include "base/basictypes.h"
10 #include "base/compiler_specific.h"
11 #include "base/metrics/stats_counters.h"
12 #include "base/strings/string_util.h"
13 #include "base/win/object_watcher.h"
14 #include "base/win/windows_version.h"
15 #include "net/base/connection_type_histograms.h"
16 #include "net/base/io_buffer.h"
17 #include "net/base/ip_endpoint.h"
18 #include "net/base/net_errors.h"
19 #include "net/base/net_log.h"
20 #include "net/base/net_util.h"
21 #include "net/base/network_change_notifier.h"
22 #include "net/base/winsock_init.h"
23 #include "net/base/winsock_util.h"
24 #include "net/socket/socket_net_log_params.h"
// Keep-alive delay, in seconds, that SetupSocket() hands to SetTCPKeepAlive().
30 const int kTCPKeepAliveSeconds
= 45;
// Set to true by TCPClientSocketWin::DisableOverlappedReads(). Each Core
// copies the current value into |disable_overlapped_reads_| when it is
// constructed.
31 bool g_disable_overlapped_reads
= false;
33 bool SetSocketReceiveBufferSize(SOCKET socket
, int32 size
) {
34 int rv
= setsockopt(socket
, SOL_SOCKET
, SO_RCVBUF
,
35 reinterpret_cast<const char*>(&size
), sizeof(size
));
36 DCHECK(!rv
) << "Could not set socket receive buffer size: " << GetLastError();
40 bool SetSocketSendBufferSize(SOCKET socket
, int32 size
) {
41 int rv
= setsockopt(socket
, SOL_SOCKET
, SO_SNDBUF
,
42 reinterpret_cast<const char*>(&size
), sizeof(size
));
43 DCHECK(!rv
) << "Could not set socket send buffer size: " << GetLastError();
48 // The Nagle implementation on windows is governed by RFC 896. The idea
49 // behind Nagle is to reduce small packets on the network. When Nagle is
50 // enabled, if a partial packet has been sent, the TCP stack will disallow
51 // further *partial* packets until an ACK has been received from the other
52 // side. Good applications should always strive to send as much data as
53 // possible and avoid partial-packet sends. However, in most real world
54 // applications, there are edge cases where this does not happen, and two
55 // partial packets may be sent back to back. For a browser, it is NEVER
56 // a benefit to delay for an RTT before the second packet is sent.
58 // As a practical example in Chromium today, consider the case of a small
59 // POST. I have verified this:
60 // Client writes 649 bytes of header (partial packet #1)
61 // Client writes 50 bytes of POST data (partial packet #2)
62 // In the above example, with Nagle, a RTT delay is inserted between these
63 // two sends due to nagle. RTTs can easily be 100ms or more. The best
64 // fix is to make sure that for POSTing data, we write as much data as
65 // possible and minimize partial packets. We will fix that. But disabling
66 // Nagle also ensures we don't run into this delay in other edge cases.
68 // http://technet.microsoft.com/en-us/library/bb726981.aspx
69 bool DisableNagle(SOCKET socket
, bool disable
) {
70 BOOL val
= disable
? TRUE
: FALSE
;
71 int rv
= setsockopt(socket
, IPPROTO_TCP
, TCP_NODELAY
,
72 reinterpret_cast<const char*>(&val
),
74 DCHECK(!rv
) << "Could not disable nagle";
78 // Enable TCP Keep-Alive to prevent NAT routers from timing out TCP
79 // connections. See http://crbug.com/27400 for details.
// |enable| selects whether keep-alive is switched on; |delay_secs| is
// multiplied by 1000 below and the product is used for both the initial delay
// and the repeat interval handed to WSAIoctl(SIO_KEEPALIVE_VALS).
80 bool SetTCPKeepAlive(SOCKET socket
, BOOL enable
, int delay_secs
) {
81 int delay
= delay_secs
* 1000;
82 struct tcp_keepalive keepalive_vals
= {
83 enable
? 1 : 0, // Non-zero turns TCP keep-alive on.
84 delay
, // Delay, in milliseconds, before sending the first TCP keep-alive packet.
85 delay
, // Interval, in milliseconds, between TCP keep-alive packets.
87 DWORD bytes_returned
= 0xABAB;
88 int rv
= WSAIoctl(socket
, SIO_KEEPALIVE_VALS
, &keepalive_vals
,
89 sizeof(keepalive_vals
), NULL
, 0,
90 &bytes_returned
, NULL
, NULL
);
// A non-zero |rv| only trips this debug check; the Winsock error is appended
// to the message.
91 DCHECK(!rv
) << "Could not enable TCP Keep-Alive for socket: " << socket
92 << " [error: " << WSAGetLastError() << "].";
94 // Disregard any failure in disabling nagle or enabling TCP Keep-Alive.
98 // Sets socket parameters. Returns the OS error code (or 0 on success).
100 int SetupSocket(SOCKET socket
) {
101 // Increase the socket buffer sizes from the default sizes for WinXP. In
102 // performance testing, there is substantial benefit by increasing from 8KB to 64KB.
105 // http://support.microsoft.com/kb/823764/EN-US
106 // On Vista, if we manually set these sizes, Vista turns off its receive
107 // window auto-tuning feature.
108 // http://blogs.msdn.com/wndp/archive/2006/05/05/Winhec-blog-tcpip-2.aspx
109 // Since Vista's auto-tune is better than any static value we could set,
110 // only change these on pre-vista machines.
111 if (base::win::GetVersion() < base::win::VERSION_VISTA
) {
112 const int32 kSocketBufferSize
= 64 * 1024;
113 SetSocketReceiveBufferSize(socket
, kSocketBufferSize
);
114 SetSocketSendBufferSize(socket
, kSocketBufferSize
);
117 DisableNagle(socket
, true);
118 SetTCPKeepAlive(socket
, true, kTCPKeepAliveSeconds
);
122 // Creates a new socket and sets default parameters for it. Returns
123 // the OS error code (or 0 on success).
124 int CreateSocket(int family
, SOCKET
* socket
) {
125 *socket
= CreatePlatformSocket(family
, SOCK_STREAM
, IPPROTO_TCP
);
126 if (*socket
== INVALID_SOCKET
) {
127 int os_error
= WSAGetLastError();
128 LOG(ERROR
) << "CreatePlatformSocket failed: " << os_error
;
131 int error
= SetupSocket(*socket
);
133 if (closesocket(*socket
) < 0)
134 PLOG(ERROR
) << "closesocket";
135 *socket
= INVALID_SOCKET
;
141 int MapConnectError(int os_error
) {
143 // connect fails with WSAEACCES when Windows Firewall blocks the
146 return ERR_NETWORK_ACCESS_DENIED
;
148 return ERR_CONNECTION_TIMED_OUT
;
150 int net_error
= MapSystemError(os_error
);
151 if (net_error
== ERR_FAILED
)
152 return ERR_CONNECTION_FAILED
; // More specific than ERR_FAILED.
154 // Give a more specific error when the user is offline.
155 if (net_error
== ERR_ADDRESS_UNREACHABLE
&&
156 NetworkChangeNotifier::IsOffline()) {
157 return ERR_INTERNET_DISCONNECTED
;
167 //-----------------------------------------------------------------------------
169 // This class encapsulates all the state that has to be preserved as long as
170 // there is a network IO operation in progress. If the owner TCPClientSocketWin
171 // is destroyed while an operation is in progress, the Core is detached and it
172 // lives until the operation completes and the OS doesn't reference any resource
173 // declared on this class anymore.
174 class TCPClientSocketWin::Core
: public base::RefCounted
<Core
> {
176 explicit Core(TCPClientSocketWin
* socket
);
178 // Start watching for the end of a read or write operation.
180 void WatchForWrite();
182 // The TCPClientSocketWin is going away.
183 void Detach() { socket_
= NULL
; }
185 // Throttle the read size based on our current slow start state.
186 // Returns the throttled read size.
187 int ThrottleReadSize(int size
) {
188 if (slow_start_throttle_
< kMaxSlowStartThrottle
) {
189 size
= std::min(size
, slow_start_throttle_
);
190 slow_start_throttle_
*= 2;
195 // The separate OVERLAPPED variables for asynchronous operation.
196 // |read_overlapped_| is used for both Connect() and Read().
197 // |write_overlapped_| is only used for Write();
198 OVERLAPPED read_overlapped_
;
199 OVERLAPPED write_overlapped_
;
201 // The buffers used in Read() and Write().
202 scoped_refptr
<IOBuffer
> read_iobuffer_
;
203 scoped_refptr
<IOBuffer
> write_iobuffer_
;
204 int read_buffer_length_
;
205 int write_buffer_length_
;
207 // Remember the state of g_disable_overlapped_reads for the duration of the
208 // socket based on what it was when the socket was created.
209 bool disable_overlapped_reads_
;
210 bool non_blocking_reads_initialized_
;
213 friend class base::RefCounted
<Core
>;
215 class ReadDelegate
: public base::win::ObjectWatcher::Delegate
{
217 explicit ReadDelegate(Core
* core
) : core_(core
) {}
218 virtual ~ReadDelegate() {}
220 // base::ObjectWatcher::Delegate methods:
221 virtual void OnObjectSignaled(HANDLE object
);
227 class WriteDelegate
: public base::win::ObjectWatcher::Delegate
{
229 explicit WriteDelegate(Core
* core
) : core_(core
) {}
230 virtual ~WriteDelegate() {}
232 // base::ObjectWatcher::Delegate methods:
233 virtual void OnObjectSignaled(HANDLE object
);
241 // The socket that created this object.
242 TCPClientSocketWin
* socket_
;
244 // |reader_| handles the signals from |read_watcher_|.
245 ReadDelegate reader_
;
246 // |writer_| handles the signals from |write_watcher_|.
247 WriteDelegate writer_
;
249 // |read_watcher_| watches for events from Connect() and Read().
250 base::win::ObjectWatcher read_watcher_
;
251 // |write_watcher_| watches for events from Write();
252 base::win::ObjectWatcher write_watcher_
;
254 // When doing reads from the socket, we try to mirror TCP's slow start.
255 // We do this because otherwise the async IO subsystem artificially delays
256 // returning data to the application.
257 static const int kInitialSlowStartThrottle
= 1 * 1024;
258 static const int kMaxSlowStartThrottle
= 32 * kInitialSlowStartThrottle
;
259 int slow_start_throttle_
;
261 DISALLOW_COPY_AND_ASSIGN(Core
);
264 TCPClientSocketWin::Core::Core(
265 TCPClientSocketWin
* socket
)
266 : read_buffer_length_(0),
267 write_buffer_length_(0),
268 disable_overlapped_reads_(g_disable_overlapped_reads
),
269 non_blocking_reads_initialized_(false),
273 slow_start_throttle_(kInitialSlowStartThrottle
) {
274 memset(&read_overlapped_
, 0, sizeof(read_overlapped_
));
275 memset(&write_overlapped_
, 0, sizeof(write_overlapped_
));
277 read_overlapped_
.hEvent
= WSACreateEvent();
278 write_overlapped_
.hEvent
= WSACreateEvent();
281 TCPClientSocketWin::Core::~Core() {
282 // Make sure the message loop is not watching this object anymore.
283 read_watcher_
.StopWatching();
284 write_watcher_
.StopWatching();
286 WSACloseEvent(read_overlapped_
.hEvent
);
287 memset(&read_overlapped_
, 0xaf, sizeof(read_overlapped_
));
288 WSACloseEvent(write_overlapped_
.hEvent
);
289 memset(&write_overlapped_
, 0xaf, sizeof(write_overlapped_
));
292 void TCPClientSocketWin::Core::WatchForRead() {
293 // We grab an extra reference because there is an IO operation in progress.
294 // Balanced in ReadDelegate::OnObjectSignaled().
296 read_watcher_
.StartWatching(read_overlapped_
.hEvent
, &reader_
);
299 void TCPClientSocketWin::Core::WatchForWrite() {
300 // We grab an extra reference because there is an IO operation in progress.
301 // Balanced in WriteDelegate::OnObjectSignaled().
303 write_watcher_
.StartWatching(write_overlapped_
.hEvent
, &writer_
);
306 void TCPClientSocketWin::Core::ReadDelegate::OnObjectSignaled(
308 DCHECK_EQ(object
, core_
->read_overlapped_
.hEvent
);
309 if (core_
->socket_
) {
310 if (core_
->socket_
->waiting_connect()) {
311 core_
->socket_
->DidCompleteConnect();
312 } else if (core_
->disable_overlapped_reads_
) {
313 core_
->socket_
->DidSignalRead();
315 core_
->socket_
->DidCompleteRead();
322 void TCPClientSocketWin::Core::WriteDelegate::OnObjectSignaled(
324 DCHECK_EQ(object
, core_
->write_overlapped_
.hEvent
);
326 core_
->socket_
->DidCompleteWrite();
331 //-----------------------------------------------------------------------------
333 TCPClientSocketWin::TCPClientSocketWin(const AddressList
& addresses
,
334 net::NetLog
* net_log
,
335 const net::NetLog::Source
& source
)
336 : socket_(INVALID_SOCKET
),
337 bound_socket_(INVALID_SOCKET
),
338 addresses_(addresses
),
339 current_address_index_(-1),
340 waiting_read_(false),
341 waiting_write_(false),
342 next_connect_state_(CONNECT_STATE_NONE
),
343 connect_os_error_(0),
344 net_log_(BoundNetLog::Make(net_log
, NetLog::SOURCE_SOCKET
)),
345 previously_disconnected_(false) {
346 net_log_
.BeginEvent(NetLog::TYPE_SOCKET_ALIVE
,
347 source
.ToEventParametersCallback());
351 TCPClientSocketWin::~TCPClientSocketWin() {
353 net_log_
.EndEvent(NetLog::TYPE_SOCKET_ALIVE
);
356 int TCPClientSocketWin::AdoptSocket(SOCKET socket
) {
357 DCHECK_EQ(socket_
, INVALID_SOCKET
);
359 int error
= SetupSocket(socket
);
361 return MapSystemError(error
);
364 SetNonBlocking(socket_
);
366 core_
= new Core(this);
367 current_address_index_
= 0;
368 use_history_
.set_was_ever_connected();
373 int TCPClientSocketWin::Bind(const IPEndPoint
& address
) {
374 if (current_address_index_
>= 0 || bind_address_
.get()) {
375 // Cannot bind the socket if we are already connected or connecting.
376 return ERR_UNEXPECTED
;
379 SockaddrStorage storage
;
380 if (!address
.ToSockAddr(storage
.addr
, &storage
.addr_len
))
381 return ERR_INVALID_ARGUMENT
;
383 // Create |bound_socket_| and try to bind it to |address|.
384 int error
= CreateSocket(address
.GetSockAddrFamily(), &bound_socket_
);
386 return MapSystemError(error
);
388 if (bind(bound_socket_
, storage
.addr
, storage
.addr_len
)) {
390 if (closesocket(bound_socket_
) < 0)
391 PLOG(ERROR
) << "closesocket";
392 bound_socket_
= INVALID_SOCKET
;
393 return MapSystemError(error
);
396 bind_address_
.reset(new IPEndPoint(address
));
402 int TCPClientSocketWin::Connect(const CompletionCallback
& callback
) {
403 DCHECK(CalledOnValidThread());
405 // If already connected, then just return OK.
406 if (socket_
!= INVALID_SOCKET
)
409 base::StatsCounter
connects("tcp.connect");
410 connects
.Increment();
412 net_log_
.BeginEvent(NetLog::TYPE_TCP_CONNECT
,
413 addresses_
.CreateNetLogCallback());
415 // We will try to connect to each address in addresses_. Start with the
416 // first one in the list.
417 next_connect_state_
= CONNECT_STATE_CONNECT
;
418 current_address_index_
= 0;
420 int rv
= DoConnectLoop(OK
);
421 if (rv
== ERR_IO_PENDING
) {
422 // Synchronous operation not supported.
423 DCHECK(!callback
.is_null());
424 // TODO(ajwong): Is setting read_callback_ the right thing to do here??
425 read_callback_
= callback
;
427 LogConnectCompletion(rv
);
433 int TCPClientSocketWin::DoConnectLoop(int result
) {
434 DCHECK_NE(next_connect_state_
, CONNECT_STATE_NONE
);
438 ConnectState state
= next_connect_state_
;
439 next_connect_state_
= CONNECT_STATE_NONE
;
441 case CONNECT_STATE_CONNECT
:
445 case CONNECT_STATE_CONNECT_COMPLETE
:
446 rv
= DoConnectComplete(rv
);
449 LOG(DFATAL
) << "bad state " << state
;
453 } while (rv
!= ERR_IO_PENDING
&& next_connect_state_
!= CONNECT_STATE_NONE
);
// Starts a connection attempt to addresses_[current_address_index_].
//
// Uses |bound_socket_| when Bind() already created one, otherwise creates a
// fresh socket (binding it to |bind_address_| if one is set). It then creates
// the Core, selects FD_CONNECT on the Core's read event and calls connect().
//
// Returns a net error when socket creation, address conversion, bind() or
// connect() fails; when no earlier return is taken it arms the read watcher
// and returns ERR_IO_PENDING. |next_connect_state_| is set to
// CONNECT_STATE_CONNECT_COMPLETE before any of the fallible steps.
458 int TCPClientSocketWin::DoConnect() {
459 DCHECK_GE(current_address_index_
, 0);
460 DCHECK_LT(current_address_index_
, static_cast<int>(addresses_
.size()));
461 DCHECK_EQ(0, connect_os_error_
);
463 const IPEndPoint
& endpoint
= addresses_
[current_address_index_
];
465 if (previously_disconnected_
) {
466 use_history_
.Reset();
467 previously_disconnected_
= false;
470 net_log_
.BeginEvent(NetLog::TYPE_TCP_CONNECT_ATTEMPT
,
471 CreateNetLogIPEndPointCallback(&endpoint
));
473 next_connect_state_
= CONNECT_STATE_CONNECT_COMPLETE
;
475 if (bound_socket_
!= INVALID_SOCKET
) {
476 DCHECK(bind_address_
.get());
477 socket_
= bound_socket_
;
478 bound_socket_
= INVALID_SOCKET
;
480 connect_os_error_
= CreateSocket(endpoint
.GetSockAddrFamily(), &socket_
);
481 if (connect_os_error_
!= 0)
482 return MapSystemError(connect_os_error_
);
484 if (bind_address_
.get()) {
485 SockaddrStorage storage
;
486 if (!bind_address_
->ToSockAddr(storage
.addr
, &storage
.addr_len
))
487 return ERR_INVALID_ARGUMENT
;
488 if (bind(socket_
, storage
.addr
, storage
.addr_len
))
// Winsock reports bind() failures through WSAGetLastError(); errno is not
// set by Winsock calls, so mapping errno would yield a stale or unrelated
// error code.
489 return MapSystemError(WSAGetLastError()
);
494 core_
= new Core(this);
495 // WSAEventSelect sets the socket to non-blocking mode as a side effect.
496 // Our connect() and recv() calls require that the socket be non-blocking.
497 WSAEventSelect(socket_
, core_
->read_overlapped_
.hEvent
, FD_CONNECT
);
499 SockaddrStorage storage
;
500 if (!endpoint
.ToSockAddr(storage
.addr
, &storage
.addr_len
))
501 return ERR_INVALID_ARGUMENT
;
502 if (!connect(socket_
, storage
.addr
, storage
.addr_len
)) {
503 // Connected without waiting!
505 // The MSDN page for connect says:
506 // With a nonblocking socket, the connection attempt cannot be completed
507 // immediately. In this case, connect will return SOCKET_ERROR, and
508 // WSAGetLastError will return WSAEWOULDBLOCK.
509 // which implies that for a nonblocking socket, connect never returns 0.
510 // It's not documented whether the event object will be signaled or not
511 // if connect does return 0. So the code below is essentially dead code
512 // and we don't know if it's correct.
515 if (ResetEventIfSignaled(core_
->read_overlapped_
.hEvent
))
518 int os_error
= WSAGetLastError();
// Any error other than WSAEWOULDBLOCK is a real failure: remember the OS
// error for the net log and return the mapped connect error.
519 if (os_error
!= WSAEWOULDBLOCK
) {
520 LOG(ERROR
) << "connect failed: " << os_error
;
521 connect_os_error_
= os_error
;
522 return MapConnectError(os_error
);
// The attempt is still in flight; completion is delivered through the read
// event watched by the Core.
526 core_
->WatchForRead();
527 return ERR_IO_PENDING
;
530 int TCPClientSocketWin::DoConnectComplete(int result
) {
531 // Log the end of this attempt (and any OS error it threw).
532 int os_error
= connect_os_error_
;
533 connect_os_error_
= 0;
535 net_log_
.EndEvent(NetLog::TYPE_TCP_CONNECT_ATTEMPT
,
536 NetLog::IntegerCallback("os_error", os_error
));
538 net_log_
.EndEvent(NetLog::TYPE_TCP_CONNECT_ATTEMPT
);
542 use_history_
.set_was_ever_connected();
546 // Close whatever partially connected socket we currently have.
549 // Try to fall back to the next address in the list.
550 if (current_address_index_
+ 1 < static_cast<int>(addresses_
.size())) {
551 next_connect_state_
= CONNECT_STATE_CONNECT
;
552 ++current_address_index_
;
556 // Otherwise there is nothing to fall back to, so give up.
560 void TCPClientSocketWin::Disconnect() {
561 DCHECK(CalledOnValidThread());
564 current_address_index_
= -1;
565 bind_address_
.reset();
568 void TCPClientSocketWin::DoDisconnect() {
569 DCHECK(CalledOnValidThread());
571 if (socket_
== INVALID_SOCKET
)
574 // Note: don't use CancelIo to cancel pending IO because it doesn't work
575 // when there is a Winsock layered service provider.
577 // In most socket implementations, closing a socket results in a graceful
578 // connection shutdown, but in Winsock we have to call shutdown explicitly.
579 // See the MSDN page "Graceful Shutdown, Linger Options, and Socket Closure"
580 // at http://msdn.microsoft.com/en-us/library/ms738547.aspx
581 shutdown(socket_
, SD_SEND
);
583 // This cancels any pending IO.
584 closesocket(socket_
);
585 socket_
= INVALID_SOCKET
;
587 if (waiting_connect()) {
588 // We closed the socket, so this notification will never come.
589 // From MSDN's WSAEventSelect documentation:
590 // "Closing a socket with closesocket also cancels the association and
591 // selection of network events specified in WSAEventSelect for the socket".
595 waiting_read_
= false;
596 waiting_write_
= false;
601 previously_disconnected_
= true;
604 bool TCPClientSocketWin::IsConnected() const {
605 DCHECK(CalledOnValidThread());
607 if (socket_
== INVALID_SOCKET
|| waiting_connect())
613 // Check if connection is alive.
615 int rv
= recv(socket_
, &c
, 1, MSG_PEEK
);
618 if (rv
== SOCKET_ERROR
&& WSAGetLastError() != WSAEWOULDBLOCK
)
624 bool TCPClientSocketWin::IsConnectedAndIdle() const {
625 DCHECK(CalledOnValidThread());
627 if (socket_
== INVALID_SOCKET
|| waiting_connect())
633 // Check if connection is alive and we haven't received any data
636 int rv
= recv(socket_
, &c
, 1, MSG_PEEK
);
639 if (WSAGetLastError() != WSAEWOULDBLOCK
)
645 int TCPClientSocketWin::GetPeerAddress(IPEndPoint
* address
) const {
646 DCHECK(CalledOnValidThread());
649 return ERR_SOCKET_NOT_CONNECTED
;
650 *address
= addresses_
[current_address_index_
];
654 int TCPClientSocketWin::GetLocalAddress(IPEndPoint
* address
) const {
655 DCHECK(CalledOnValidThread());
657 if (socket_
== INVALID_SOCKET
) {
658 if (bind_address_
.get()) {
659 *address
= *bind_address_
;
662 return ERR_SOCKET_NOT_CONNECTED
;
665 struct sockaddr_storage addr_storage
;
666 socklen_t addr_len
= sizeof(addr_storage
);
667 struct sockaddr
* addr
= reinterpret_cast<struct sockaddr
*>(&addr_storage
);
668 if (getsockname(socket_
, addr
, &addr_len
))
669 return MapSystemError(WSAGetLastError());
670 if (!address
->FromSockAddr(addr
, addr_len
))
675 void TCPClientSocketWin::SetSubresourceSpeculation() {
676 use_history_
.set_subresource_speculation();
679 void TCPClientSocketWin::SetOmniboxSpeculation() {
680 use_history_
.set_omnibox_speculation();
683 bool TCPClientSocketWin::WasEverUsed() const {
684 return use_history_
.was_used_to_convey_data();
687 bool TCPClientSocketWin::UsingTCPFastOpen() const {
688 // Not supported on windows.
692 bool TCPClientSocketWin::WasNpnNegotiated() const {
696 NextProto
TCPClientSocketWin::GetNegotiatedProtocol() const {
697 return kProtoUnknown
;
700 bool TCPClientSocketWin::GetSSLInfo(SSLInfo
* ssl_info
) {
704 int TCPClientSocketWin::Read(IOBuffer
* buf
,
706 const CompletionCallback
& callback
) {
707 DCHECK(CalledOnValidThread());
708 DCHECK_NE(socket_
, INVALID_SOCKET
);
709 DCHECK(!waiting_read_
);
710 DCHECK(read_callback_
.is_null());
711 DCHECK(!core_
->read_iobuffer_
);
713 return DoRead(buf
, buf_len
, callback
);
716 int TCPClientSocketWin::Write(IOBuffer
* buf
,
718 const CompletionCallback
& callback
) {
719 DCHECK(CalledOnValidThread());
720 DCHECK_NE(socket_
, INVALID_SOCKET
);
721 DCHECK(!waiting_write_
);
722 DCHECK(write_callback_
.is_null());
723 DCHECK_GT(buf_len
, 0);
724 DCHECK(!core_
->write_iobuffer_
);
726 base::StatsCounter
writes("tcp.writes");
730 write_buffer
.len
= buf_len
;
731 write_buffer
.buf
= buf
->data();
733 // TODO(wtc): Remove the assertion after enough testing.
734 AssertEventNotSignaled(core_
->write_overlapped_
.hEvent
);
736 int rv
= WSASend(socket_
, &write_buffer
, 1, &num
, 0,
737 &core_
->write_overlapped_
, NULL
);
739 if (ResetEventIfSignaled(core_
->write_overlapped_
.hEvent
)) {
740 rv
= static_cast<int>(num
);
741 if (rv
> buf_len
|| rv
< 0) {
742 // It seems that some winsock interceptors report that more was written
743 // than was available. Treat this as an error. http://crbug.com/27870
744 LOG(ERROR
) << "Detected broken LSP: Asked to write " << buf_len
745 << " bytes, but " << rv
<< " bytes reported.";
746 return ERR_WINSOCK_UNEXPECTED_WRITTEN_BYTES
;
748 base::StatsCounter
write_bytes("tcp.write_bytes");
751 use_history_
.set_was_used_to_convey_data();
752 net_log_
.AddByteTransferEvent(NetLog::TYPE_SOCKET_BYTES_SENT
, rv
,
757 int os_error
= WSAGetLastError();
758 if (os_error
!= WSA_IO_PENDING
) {
759 int net_error
= MapSystemError(os_error
);
760 net_log_
.AddEvent(NetLog::TYPE_SOCKET_WRITE_ERROR
,
761 CreateNetLogSocketErrorCallback(net_error
, os_error
));
765 waiting_write_
= true;
766 write_callback_
= callback
;
767 core_
->write_iobuffer_
= buf
;
768 core_
->write_buffer_length_
= buf_len
;
769 core_
->WatchForWrite();
770 return ERR_IO_PENDING
;
// Forwards |size| to SetSocketReceiveBufferSize() for |socket_| and returns
// that helper's result. Debug-checks that the call is on the valid thread.
773 bool TCPClientSocketWin::SetReceiveBufferSize(int32 size
) {
774 DCHECK(CalledOnValidThread());
775 return SetSocketReceiveBufferSize(socket_
, size
);
// Forwards |size| to SetSocketSendBufferSize() for |socket_| and returns that
// helper's result. Debug-checks that the call is on the valid thread.
778 bool TCPClientSocketWin::SetSendBufferSize(int32 size
) {
779 DCHECK(CalledOnValidThread());
780 return SetSocketSendBufferSize(socket_
, size
);
// Applies keep-alive settings to |socket_| by calling SetTCPKeepAlive().
// |delay| is passed as that helper's |delay_secs| argument, i.e. in seconds.
// Returns the helper's result.
783 bool TCPClientSocketWin::SetKeepAlive(bool enable
, int delay
) {
784 return SetTCPKeepAlive(socket_
, enable
, delay
);
// Passes |no_delay| to DisableNagle() for |socket_|: true asks for Nagle to
// be disabled (TCP_NODELAY set). Returns the helper's result.
787 bool TCPClientSocketWin::SetNoDelay(bool no_delay
) {
788 return DisableNagle(socket_
, no_delay
);
// Sets the file-level |g_disable_overlapped_reads| flag. A Core copies the
// flag in its constructor, so the change applies to Cores created after this
// call.
791 void TCPClientSocketWin::DisableOverlappedReads() {
792 g_disable_overlapped_reads
= true;
// Records the outcome of a connect in the net log. For a non-OK |net_error|
// the TCP_CONNECT event is ended with that error code; otherwise the local
// address is fetched with getsockname() so it can be attached to the event.
795 void TCPClientSocketWin::LogConnectCompletion(int net_error
) {
797 UpdateConnectionTypeHistograms(CONNECTION_ANY
);
799 if (net_error
!= OK
) {
800 net_log_
.EndEventWithNetErrorCode(NetLog::TYPE_TCP_CONNECT
, net_error
);
804 struct sockaddr_storage source_address
;
805 socklen_t addrlen
= sizeof(source_address
);
806 int rv
= getsockname(
807 socket_
, reinterpret_cast<struct sockaddr
*>(&source_address
), &addrlen
);
809 LOG(ERROR
) << "getsockname() [rv: " << rv
810 << "] error: " << WSAGetLastError();
// NOTE(review): |rv| is getsockname()'s raw return value, not a net error
// code. A mapped WSAGetLastError() may be what is intended here -- confirm.
812 net_log_
.EndEventWithNetErrorCode(NetLog::TYPE_TCP_CONNECT
, rv
);
817 NetLog::TYPE_TCP_CONNECT
,
818 CreateNetLogSourceAddressCallback(
819 reinterpret_cast<const struct sockaddr
*>(&source_address
),
// NOTE(review): this passes the full storage size rather than the |addrlen|
// filled in by getsockname() -- confirm that is intended.
820 sizeof(source_address
)));
823 int TCPClientSocketWin::DoRead(IOBuffer
* buf
, int buf_len
,
824 const CompletionCallback
& callback
) {
825 if (core_
->disable_overlapped_reads_
) {
826 if (!core_
->non_blocking_reads_initialized_
) {
827 WSAEventSelect(socket_
, core_
->read_overlapped_
.hEvent
,
829 core_
->non_blocking_reads_initialized_
= true;
831 int rv
= recv(socket_
, buf
->data(), buf_len
, 0);
832 if (rv
== SOCKET_ERROR
) {
833 int os_error
= WSAGetLastError();
834 if (os_error
!= WSAEWOULDBLOCK
) {
835 int net_error
= MapSystemError(os_error
);
836 net_log_
.AddEvent(NetLog::TYPE_SOCKET_READ_ERROR
,
837 CreateNetLogSocketErrorCallback(net_error
, os_error
));
841 base::StatsCounter
read_bytes("tcp.read_bytes");
843 use_history_
.set_was_used_to_convey_data();
846 net_log_
.AddByteTransferEvent(NetLog::TYPE_SOCKET_BYTES_RECEIVED
, rv
,
851 buf_len
= core_
->ThrottleReadSize(buf_len
);
854 read_buffer
.len
= buf_len
;
855 read_buffer
.buf
= buf
->data();
857 // TODO(wtc): Remove the assertion after enough testing.
858 AssertEventNotSignaled(core_
->read_overlapped_
.hEvent
);
861 int rv
= WSARecv(socket_
, &read_buffer
, 1, &num
, &flags
,
862 &core_
->read_overlapped_
, NULL
);
864 if (ResetEventIfSignaled(core_
->read_overlapped_
.hEvent
)) {
865 base::StatsCounter
read_bytes("tcp.read_bytes");
867 use_history_
.set_was_used_to_convey_data();
870 net_log_
.AddByteTransferEvent(NetLog::TYPE_SOCKET_BYTES_RECEIVED
, num
,
872 return static_cast<int>(num
);
875 int os_error
= WSAGetLastError();
876 if (os_error
!= WSA_IO_PENDING
) {
877 int net_error
= MapSystemError(os_error
);
878 net_log_
.AddEvent(NetLog::TYPE_SOCKET_READ_ERROR
,
879 CreateNetLogSocketErrorCallback(net_error
, os_error
));
885 waiting_read_
= true;
886 read_callback_
= callback
;
887 core_
->read_iobuffer_
= buf
;
888 core_
->read_buffer_length_
= buf_len
;
889 core_
->WatchForRead();
890 return ERR_IO_PENDING
;
893 void TCPClientSocketWin::DoReadCallback(int rv
) {
894 DCHECK_NE(rv
, ERR_IO_PENDING
);
895 DCHECK(!read_callback_
.is_null());
897 // Since Run may result in Read being called, clear read_callback_ up front.
898 CompletionCallback c
= read_callback_
;
899 read_callback_
.Reset();
903 void TCPClientSocketWin::DoWriteCallback(int rv
) {
904 DCHECK_NE(rv
, ERR_IO_PENDING
);
905 DCHECK(!write_callback_
.is_null());
907 // Since Run may result in Write being called, clear write_callback_ up front.
908 CompletionCallback c
= write_callback_
;
909 write_callback_
.Reset();
913 void TCPClientSocketWin::DidCompleteConnect() {
914 DCHECK_EQ(next_connect_state_
, CONNECT_STATE_CONNECT_COMPLETE
);
917 WSANETWORKEVENTS events
;
918 int rv
= WSAEnumNetworkEvents(socket_
, core_
->read_overlapped_
.hEvent
,
921 if (rv
== SOCKET_ERROR
) {
923 os_error
= WSAGetLastError();
924 result
= MapSystemError(os_error
);
925 } else if (events
.lNetworkEvents
& FD_CONNECT
) {
926 os_error
= events
.iErrorCode
[FD_CONNECT_BIT
];
927 result
= MapConnectError(os_error
);
930 result
= ERR_UNEXPECTED
;
933 connect_os_error_
= os_error
;
934 rv
= DoConnectLoop(result
);
935 if (rv
!= ERR_IO_PENDING
) {
936 LogConnectCompletion(rv
);
941 void TCPClientSocketWin::DidCompleteRead() {
942 DCHECK(waiting_read_
);
943 DWORD num_bytes
, flags
;
944 BOOL ok
= WSAGetOverlappedResult(socket_
, &core_
->read_overlapped_
,
945 &num_bytes
, FALSE
, &flags
);
946 waiting_read_
= false;
949 base::StatsCounter
read_bytes("tcp.read_bytes");
950 read_bytes
.Add(num_bytes
);
952 use_history_
.set_was_used_to_convey_data();
953 net_log_
.AddByteTransferEvent(NetLog::TYPE_SOCKET_BYTES_RECEIVED
,
954 num_bytes
, core_
->read_iobuffer_
->data());
955 rv
= static_cast<int>(num_bytes
);
957 int os_error
= WSAGetLastError();
958 rv
= MapSystemError(os_error
);
959 net_log_
.AddEvent(NetLog::TYPE_SOCKET_READ_ERROR
,
960 CreateNetLogSocketErrorCallback(rv
, os_error
));
962 WSAResetEvent(core_
->read_overlapped_
.hEvent
);
963 core_
->read_iobuffer_
= NULL
;
964 core_
->read_buffer_length_
= 0;
968 void TCPClientSocketWin::DidCompleteWrite() {
969 DCHECK(waiting_write_
);
971 DWORD num_bytes
, flags
;
972 BOOL ok
= WSAGetOverlappedResult(socket_
, &core_
->write_overlapped_
,
973 &num_bytes
, FALSE
, &flags
);
974 WSAResetEvent(core_
->write_overlapped_
.hEvent
);
975 waiting_write_
= false;
978 int os_error
= WSAGetLastError();
979 rv
= MapSystemError(os_error
);
980 net_log_
.AddEvent(NetLog::TYPE_SOCKET_WRITE_ERROR
,
981 CreateNetLogSocketErrorCallback(rv
, os_error
));
983 rv
= static_cast<int>(num_bytes
);
984 if (rv
> core_
->write_buffer_length_
|| rv
< 0) {
985 // It seems that some winsock interceptors report that more was written
986 // than was available. Treat this as an error. http://crbug.com/27870
987 LOG(ERROR
) << "Detected broken LSP: Asked to write "
988 << core_
->write_buffer_length_
<< " bytes, but " << rv
989 << " bytes reported.";
990 rv
= ERR_WINSOCK_UNEXPECTED_WRITTEN_BYTES
;
992 base::StatsCounter
write_bytes("tcp.write_bytes");
993 write_bytes
.Add(num_bytes
);
995 use_history_
.set_was_used_to_convey_data();
996 net_log_
.AddByteTransferEvent(NetLog::TYPE_SOCKET_BYTES_SENT
, num_bytes
,
997 core_
->write_iobuffer_
->data());
1000 core_
->write_iobuffer_
= NULL
;
1001 DoWriteCallback(rv
);
1004 void TCPClientSocketWin::DidSignalRead() {
1005 DCHECK(waiting_read_
);
1007 WSANETWORKEVENTS network_events
;
1008 int rv
= WSAEnumNetworkEvents(socket_
, core_
->read_overlapped_
.hEvent
,
1010 if (rv
== SOCKET_ERROR
) {
1011 os_error
= WSAGetLastError();
1012 rv
= MapSystemError(os_error
);
1013 } else if (network_events
.lNetworkEvents
) {
1014 DCHECK_EQ(network_events
.lNetworkEvents
& ~(FD_READ
| FD_CLOSE
), 0);
1015 // If network_events.lNetworkEvents is FD_CLOSE and
1016 // network_events.iErrorCode[FD_CLOSE_BIT] is 0, it is a graceful
1017 // connection closure. It is tempting to directly set rv to 0 in
1018 // this case, but the MSDN pages for WSAEventSelect and
1019 // WSAAsyncSelect recommend we still call DoRead():
1020 // FD_CLOSE should only be posted after all data is read from a
1021 // socket, but an application should check for remaining data upon
1022 // receipt of FD_CLOSE to avoid any possibility of losing data.
1024 // If network_events.iErrorCode[FD_READ_BIT] or
1025 // network_events.iErrorCode[FD_CLOSE_BIT] is nonzero, still call
1026 // DoRead() because recv() reports a more accurate error code
1027 // (WSAECONNRESET vs. WSAECONNABORTED) when the connection was
1029 rv
= DoRead(core_
->read_iobuffer_
, core_
->read_buffer_length_
,
1031 if (rv
== ERR_IO_PENDING
)
1034 // This may happen because Read() may succeed synchronously and
1035 // consume all the received data without resetting the event object.
1036 core_
->WatchForRead();
1039 waiting_read_
= false;
1040 core_
->read_iobuffer_
= NULL
;
1041 core_
->read_buffer_length_
= 0;