• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright 2012 The Chromium Authors
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4 
5 #ifndef NET_SOCKET_UDP_SOCKET_WIN_H_
6 #define NET_SOCKET_UDP_SOCKET_WIN_H_
7 
8 #include <winsock2.h>
9 
10 #include <qos2.h>
11 #include <stdint.h>
12 
13 // Must be after winsock2.h:
14 #include <MSWSock.h>
15 
16 #include <atomic>
17 #include <memory>
18 #include <set>
19 
20 #include "base/gtest_prod_util.h"
21 #include "base/memory/raw_ptr.h"
22 #include "base/memory/scoped_refptr.h"
23 #include "base/memory/weak_ptr.h"
24 #include "base/threading/thread_checker.h"
25 #include "base/win/object_watcher.h"
26 #include "base/win/scoped_handle.h"
27 #include "net/base/address_family.h"
28 #include "net/base/completion_once_callback.h"
29 #include "net/base/io_buffer.h"
30 #include "net/base/ip_endpoint.h"
31 #include "net/base/net_export.h"
32 #include "net/base/network_handle.h"
33 #include "net/base/sockaddr_storage.h"
34 #include "net/log/net_log_with_source.h"
35 #include "net/socket/datagram_socket.h"
36 #include "net/socket/diff_serv_code_point.h"
37 #include "net/socket/udp_socket_global_limits.h"
38 #include "net/traffic_annotation/network_traffic_annotation.h"
39 
40 namespace net {
41 
42 class IPAddress;
43 class NetLog;
44 struct NetLogSource;
45 class SocketTag;
46 
47 // QWAVE (Quality Windows Audio/Video Experience) is the latest Windows
48 // library for setting packet priorities (and other things). Unfortunately,
49 // Microsoft has decided that setting the DSCP bits with setsockopt() no
50 // longer works, so we have to use this API instead.
51 // This class is meant to be used as a singleton. It exposes a few dynamically
52 // loaded functions and a bool called "qwave_supported".
   // The accessors and wrappers are virtual; UDPSocketWin::GetQwaveApi() is
   // documented as existing to allow QwaveApi mocking in tests.
   // NOTE(review): no virtual destructor is declared here; confirm instances are
   // never deleted through a base-class pointer.
53 class NET_EXPORT QwaveApi {
     // Pointer types for the dynamically loaded functions. Each one has the same
     // parameter list as the wrapper method of the matching name below.
54   typedef BOOL(WINAPI* CreateHandleFn)(PQOS_VERSION, PHANDLE);
55   typedef BOOL(WINAPI* CloseHandleFn)(HANDLE);
56   typedef BOOL(WINAPI* AddSocketToFlowFn)(HANDLE,
57                                           SOCKET,
58                                           PSOCKADDR,
59                                           QOS_TRAFFIC_TYPE,
60                                           DWORD,
61                                           PQOS_FLOWID);
62   typedef BOOL(WINAPI* RemoveSocketFromFlowFn)(HANDLE,
63                                                SOCKET,
64                                                QOS_FLOWID,
65                                                DWORD);
66   typedef BOOL(WINAPI* SetFlowFn)(HANDLE,
67                                   QOS_FLOWID,
68                                   QOS_SET_FLOW,
69                                   ULONG,
70                                   PVOID,
71                                   DWORD,
72                                   LPOVERLAPPED);
73 
74  public:
     // NOTE(review): presumably loads the QWAVE functions and updates
     // |qwave_supported_|; the definition is not in this header - confirm.
75   QwaveApi();
76 
     // Not copyable or assignable.
77   QwaveApi(const QwaveApi&) = delete;
78   QwaveApi& operator=(const QwaveApi&) = delete;
79 
     // Returns the default QwaveApi instance (see the singleton note above).
80   static QwaveApi* GetDefault();
81 
     // NOTE(review): presumably qwave_supported() reports |qwave_supported_| and
     // OnFatalError() reacts to an unrecoverable QWAVE failure - confirm in the
     // implementation.
82   virtual bool qwave_supported() const;
83   virtual void OnFatalError();
84 
     // Wrappers whose parameter lists match the function-pointer typedefs above.
     // NOTE(review): presumably each forwards to the corresponding *_func_
     // member - confirm.
85   virtual BOOL CreateHandle(PQOS_VERSION version, PHANDLE handle);
86   virtual BOOL CloseHandle(HANDLE handle);
87   virtual BOOL AddSocketToFlow(HANDLE handle,
88                                SOCKET socket,
89                                PSOCKADDR addr,
90                                QOS_TRAFFIC_TYPE traffic_type,
91                                DWORD flags,
92                                PQOS_FLOWID flow_id);
93   virtual BOOL RemoveSocketFromFlow(HANDLE handle,
94                                     SOCKET socket,
95                                     QOS_FLOWID flow_id,
96                                     DWORD reserved);
97   virtual BOOL SetFlow(HANDLE handle,
98                        QOS_FLOWID flow_id,
99                        QOS_SET_FLOW op,
100                        ULONG size,
101                        PVOID data,
102                        DWORD reserved,
103                        LPOVERLAPPED overlapped);
104 
105  private:
      // Atomic flag; starts out false.
106   std::atomic<bool> qwave_supported_{false};
107 
      // Storage for the dynamically loaded functions. No default initializers
      // are given here, so their values depend entirely on the constructor.
      // NOTE(review): confirm they are never invoked while unset.
108   CreateHandleFn create_handle_func_;
109   CloseHandleFn close_handle_func_;
110   AddSocketToFlowFn add_socket_to_flow_func_;
111   RemoveSocketFromFlowFn remove_socket_from_flow_func_;
112   SetFlowFn set_flow_func_;
113 };
114 
115 //-----------------------------------------------------------------------------
116 
117 // Helper for tracking DSCP state on Windows, where (unlike a blanket socket
118 // option) DSCP values are set per remote endpoint rather than per socket.
119 // The implementation creates a single QWAVE 'flow' for the socket, and adds
120 // all encountered remote addresses to that flow.  Flows are the minimum
121 // manageable unit within the QWAVE API.  See
122 // https://docs.microsoft.com/en-us/previous-versions/windows/desktop/api/qos2/
123 // for Microsoft's documentation.
124 class NET_EXPORT DscpManager {
125  public:
      // |api| and |socket| are kept for the lifetime of this object; see the
      // const |api_| and |socket_| members below.
126   DscpManager(QwaveApi* api, SOCKET socket);
127 
      // Not copyable or assignable.
128   DscpManager(const DscpManager&) = delete;
129   DscpManager& operator=(const DscpManager&) = delete;
130 
131   ~DscpManager();
132 
133   // Remembers the latest |dscp| so PrepareForSend can add remote addresses to
134   // the qos flow. Destroys the old flow if it exists and |dscp| changes.
135   void Set(DiffServCodePoint dscp);
136 
137   // Constructs a qos flow for the latest set DSCP value if we don't already
138   // have one. Adds |remote_address| to the qos flow if it hasn't been added
139   // already. Does nothing if no DSCP value has been Set.
      // NOTE(review): the int result is presumably a net error code - confirm.
140   int PrepareForSend(const IPEndPoint& remote_address);
141 
142  private:
      // Helpers for obtaining |qos_handle_|.
      // NOTE(review): presumably RequestHandle() arranges for DoCreateHandle()
      // to run and for its result to reach OnHandleCreated(), which takes a
      // WeakPtr so it can cope with this object having been destroyed - confirm
      // in the implementation.
143   void RequestHandle();
144   static HANDLE DoCreateHandle(QwaveApi* api);
145   static void OnHandleCreated(QwaveApi* api,
146                               base::WeakPtr<DscpManager> dscp_manager,
147                               HANDLE handle);
148 
      // Both are const: fixed at construction and never reassigned.
149   const raw_ptr<QwaveApi> api_;
150   const SOCKET socket_;
151 
      // Starts as DSCP_NO_CHANGE; presumably updated by Set() - confirm.
152   DiffServCodePoint dscp_value_ = DSCP_NO_CHANGE;
153   // The remote addresses currently in the flow.
154   std::set<IPEndPoint> configured_;
155 
      // QWAVE handle; nullptr initially. |handle_is_initializing_| presumably
      // marks a handle request that is still in flight - TODO confirm.
156   HANDLE qos_handle_ = nullptr;
157   bool handle_is_initializing_ = false;
158   // 0 means no flow has been constructed.
159   QOS_FLOWID flow_id_ = 0;
      // Bound to |this|. Presumably the source of the WeakPtr<DscpManager> that
      // OnHandleCreated() receives - confirm.
160   base::WeakPtrFactory<DscpManager> weak_ptr_factory_{this};
161 };
162 
163 //-----------------------------------------------------------------------------
164 
165 class NET_EXPORT UDPSocketWin : public base::win::ObjectWatcher::Delegate {
      // UDP socket for Windows. Derives from base::win::ObjectWatcher::Delegate
      // and overrides OnObjectSignaled(); |read_write_watcher_| watches
      // |read_write_event_|. Uses overlapped IO by default and can be switched to
      // non-blocking IO with UseNonBlockingIO().
166  public:
167   // BindType is ignored. Windows has an option to do random binds, so
168   // UDPSocketWin sets that whenever connecting a socket.
169   UDPSocketWin(DatagramSocket::BindType bind_type,
170                net::NetLog* net_log,
171                const net::NetLogSource& source);
172 
      // Overload taking a NetLogWithSource instead of a NetLog/NetLogSource pair.
173   UDPSocketWin(DatagramSocket::BindType bind_type,
174                NetLogWithSource source_net_log);
175 
      // Not copyable or assignable.
176   UDPSocketWin(const UDPSocketWin&) = delete;
177   UDPSocketWin& operator=(const UDPSocketWin&) = delete;
178 
179   ~UDPSocketWin() override;
180 
181   // Opens the socket.
182   // Returns a net error code.
183   int Open(AddressFamily address_family);
184 
185   // Not implemented. Returns ERR_NOT_IMPLEMENTED.
186   int BindToNetwork(handles::NetworkHandle network);
187 
188   // Connects the socket to |address|.
189   // Should be called after Open().
190   // Returns a net error code.
191   int Connect(const IPEndPoint& address);
192 
193   // Binds the address/port for this socket to |address|.  This is generally
194   // only used on a server. Should be called after Open().
195   // Returns a net error code.
196   int Bind(const IPEndPoint& address);
197 
198   // Closes the socket.
199   void Close();
200 
201   // Copies the remote udp address into |address| and returns a net error code.
202   int GetPeerAddress(IPEndPoint* address) const;
203 
204   // Copies the local udp address into |address| and returns a net error code.
205   // (similar to getsockname)
206   int GetLocalAddress(IPEndPoint* address) const;
207 
208   // IO:
209   // Multiple outstanding read requests are not supported.
210   // Full duplex mode (reading and writing at the same time) is supported.
211 
212   // Reads from the socket.
213   // Only usable from the client-side of a UDP socket, after the socket
214   // has been connected.
215   int Read(IOBuffer* buf, int buf_len, CompletionOnceCallback callback);
216 
217   // Writes to the socket.
218   // Only usable from the client-side of a UDP socket, after the socket
219   // has been connected.
220   int Write(IOBuffer* buf,
221             int buf_len,
222             CompletionOnceCallback callback,
223             const NetworkTrafficAnnotationTag& traffic_annotation);
224 
225   // Reads from a socket and receive sender address information.
226   // |buf| is the buffer to read data into.
227   // |buf_len| is the maximum amount of data to read.
228   // |address| is a buffer provided by the caller for receiving the sender
229   //   address information about the received data.  This buffer must be kept
230   //   alive by the caller until the callback is called.
231   // |callback| is the callback on completion of the RecvFrom.
232   // Returns a net error code, or ERR_IO_PENDING if the IO is in progress.
233   // If ERR_IO_PENDING is returned, this socket takes a ref to |buf| to keep
234   // it alive until the data is received. However, the caller must keep
235   // |address| alive until the callback is called.
236   int RecvFrom(IOBuffer* buf,
237                int buf_len,
238                IPEndPoint* address,
239                CompletionOnceCallback callback);
240 
241   // Sends to a socket with a particular destination.
242   // |buf| is the buffer to send.
243   // |buf_len| is the number of bytes to send.
244   // |address| is the recipient address.
245   // |callback| is the user callback function to call on complete.
246   // Returns a net error code, or ERR_IO_PENDING if the IO is in progress.
247   // If ERR_IO_PENDING is returned, this socket copies |address| for
248   // asynchronous sending, and takes a ref to |buf| to keep it alive until the
249   // data is sent.
250   int SendTo(IOBuffer* buf,
251              int buf_len,
252              const IPEndPoint& address,
253              CompletionOnceCallback callback);
254 
255   // Sets the receive buffer size (in bytes) for the socket.
256   // Returns a net error code.
257   int SetReceiveBufferSize(int32_t size);
258 
259   // Sets the send buffer size (in bytes) for the socket.
260   // Returns a net error code.
261   int SetSendBufferSize(int32_t size);
262 
263   // Requests that packets sent by this socket not be fragmented, either locally
264   // by the host, or by routers (via the DF bit in the IPv4 packet header).
265   // May not be supported by all platforms. Returns a network error code if
266   // there was a problem, but the socket will still be usable. Can not
267   // return ERR_IO_PENDING.
268   int SetDoNotFragment();
269 
270   // Requests that packets received by this socket have the ECN bit set. Returns
271   // a network error code if there was a problem.
272   int SetRecvTos();
273 
274   // This is a no-op on Windows.
275   void SetMsgConfirm(bool confirm);
276 
277   // Returns true if the socket is already connected or bound.
is_connected()278   bool is_connected() const { return is_connected_; }
279 
      // Returns the NetLogWithSource held in |net_log_|.
NetLog()280   const NetLogWithSource& NetLog() const { return net_log_; }
281 
282   // Sets socket options to allow the socket to share the local address to which
283   // the socket will be bound with other processes. If multiple processes are
284   // bound to the same local address at the same time, behavior is undefined;
285   // e.g., it is not guaranteed that incoming messages will be sent to all
286   // listening sockets. Returns a net error code.
287   //
288   // Should be called between Open() and Bind().
289   int AllowAddressReuse();
290 
291   // Sets socket options to allow sending and receiving packets to and from
292   // broadcast addresses.
293   int SetBroadcast(bool broadcast);
294 
295   // Sets socket options to allow the socket to share the local address to which
296   // the socket will be bound with other processes and attempt to allow all such
297   // sockets to receive the same multicast messages. Returns a net error code.
298   //
299   // For Windows, multicast messages should always be shared between sockets
300   // configured thusly as long as the sockets join the same multicast group and
301   // interface.
302   //
303   // Should be called between Open() and Bind().
304   int AllowAddressSharingForMulticast();
305 
306   // Joins the multicast group.
307   // |group_address| is the group address to join, could be either
308   // an IPv4 or IPv6 address.
309   // Returns a net error code.
310   int JoinGroup(const IPAddress& group_address) const;
311 
312   // Leaves the multicast group.
313   // |group_address| is the group address to leave, could be either
314   // an IPv4 or IPv6 address. If the socket hasn't joined the group,
315   // it will be ignored.
316   // It's optional to leave the multicast group before destroying
317   // the socket. It will be done by the OS.
318   // Return a net error code.
319   int LeaveGroup(const IPAddress& group_address) const;
320 
321   // Sets interface to use for multicast. If |interface_index| set to 0,
322   // default interface is used.
323   // Should be called before Bind().
324   // Returns a net error code.
325   int SetMulticastInterface(uint32_t interface_index);
326 
327   // Sets the time-to-live option for UDP packets sent to the multicast
328   // group address. The default value of this option is 1.
329   // Cannot be negative or more than 255.
330   // Should be called before Bind().
331   int SetMulticastTimeToLive(int time_to_live);
332 
333   // Sets the loopback flag for UDP socket. If this flag is true, the host
334   // will receive packets sent to the joined group from itself.
335   // The default value of this option is true.
336   // Should be called before Bind().
337   //
338   // Note: the behavior of |SetMulticastLoopbackMode| is slightly
339   // different between Windows and Unix-like systems. The inconsistency only
340   // happens when there are more than one applications on the same host
341   // joined to the same multicast group while having different settings on
342   // multicast loopback mode. On Windows, the applications with loopback off
343   // will not RECEIVE the loopback packets; while on Unix-like systems, the
344   // applications with loopback off will not SEND the loopback packets to
345   // other applications on the same host. See MSDN: http://goo.gl/6vqbj
346   int SetMulticastLoopbackMode(bool loopback);
347 
348   // Sets the differentiated services flags on outgoing packets. May not do
349   // anything on some platforms. A return value of ERR_INVALID_HANDLE indicates
350   // the value was not set but could succeed on a future call, because
351   // initialization is in progress.
352   int SetDiffServCodePoint(DiffServCodePoint dscp);
353 
354   // Requests that packets sent by this socket have the DSCP and/or ECN
355   // bits set. Returns a network error code if there was a problem. If
356   // DSCP_NO_CHANGE or ECN_NO_CHANGE are set, will preserve those parts of
357   // the original setting.
358   // ECN values other than 0 must not be used outside of tests, without
359   // appropriate congestion control.
360   int SetTos(DiffServCodePoint dscp, EcnCodePoint ecn);
361 
362   // Sets IPV6_V6ONLY on the socket. If this flag is true, the socket will be
363   // restricted to only IPv6; false allows both IPv4 and IPv6 traffic.
364   int SetIPv6Only(bool ipv6_only);
365 
366   // Resets the thread to be used for thread-safety checks.
367   void DetachFromThread();
368 
369   // This class by default uses overlapped IO. Call this method before Open() or
370   // AdoptOpenedSocket() to switch to non-blocking IO.
371   void UseNonBlockingIO();
372 
373   // Apply |tag| to this socket.
374   void ApplySocketTag(const SocketTag& tag);
375 
376   // Takes ownership of `socket`, which should be a socket descriptor opened
377   // with the specified address family. The socket should only be created but
378   // not bound or connected to an address. This method must be called after
379   // UseNonBlockingIO, otherwise the adopted socket will not have the
380   // non-blocking IO flag set.
381   int AdoptOpenedSocket(AddressFamily address_family, SOCKET socket);
382 
      // Test-only accessors returning |multicast_interface_| and
      // |use_non_blocking_io_| respectively.
get_multicast_interface_for_testing()383   uint32_t get_multicast_interface_for_testing() {
384     return multicast_interface_;
385   }
get_use_non_blocking_io_for_testing()386   bool get_use_non_blocking_io_for_testing() { return use_non_blocking_io_; }
387 
388   // Because the windows API separates out DSCP and ECN better than Posix, this
389   // function does not actually return the correct DSCP value, instead always
390   // returning DSCP_DEFAULT rather than the last incoming value.
391   // If a use case arises for reading the incoming DSCP value, only then would
392   // it be worth executing the system call.
393   // However, the ECN member of the return value is correct if SetRecvTos()
394   // was called previously on the socket.
GetLastTos()395   DscpAndEcn GetLastTos() const { return last_tos_; }
396 
397  private:
      // Bit flags that are OR'd together into |socket_options_|.
398   enum SocketOptions {
399     SOCKET_OPTION_MULTICAST_LOOP = 1 << 0
400   };
401 
      // Forward declaration; see |core_| below for its role.
402   class Core;
403 
      // NOTE(review): presumably these hand |rv| to |read_callback_| and
      // |write_callback_| respectively - confirm in the implementation.
404   void DoReadCallback(int rv);
405   void DoWriteCallback(int rv);
406 
      // NOTE(review): presumably invoked when a pending read / write finishes -
      // confirm which IO mode uses them.
407   void DidCompleteRead();
408   void DidCompleteWrite();
409 
410   // base::win::ObjectWatcher::Delegate implementation.
411   void OnObjectSignaled(HANDLE object) override;
412   void OnReadSignaled();
413   void OnWriteSignaled();
414 
415   void WatchForReadWrite();
416 
417   // Handles stats and logging. |result| is the number of bytes transferred, on
418   // success, or the net error code on failure.
419   void LogRead(int result, const char* bytes, const IPEndPoint* address) const;
420   void LogWrite(int result, const char* bytes, const IPEndPoint* address) const;
421   // Reads the last error, maps it, logs it, and returns the mapped result.
422   int LogAndReturnError() const;
423 
424   // Same as SendTo(), except that address is passed by pointer
425   // instead of by reference. It is called from Write() with |address|
426   // set to NULL.
427   int SendToOrWrite(IOBuffer* buf,
428                     int buf_len,
429                     const IPEndPoint* address,
430                     CompletionOnceCallback callback);
431 
432   int InternalConnect(const IPEndPoint& address);
433 
434   // Returns a function pointer to the platform's instantiation of WSARecvMsg()
435   // or WSASendMsg().
436   LPFN_WSARECVMSG GetRecvMsgPointer();
437   LPFN_WSASENDMSG GetSendMsgPointer();
438 
439   // Populates |message| with |storage|, |data_buffer|, and |control_buffer| to
440   // use ECN before calls to either WSASendMsg() (if |send| is true) or
441   // WSARecvMsg().
442   // |data_buffer| is the datagram. |control_buffer| is the storage
443   // space for cmsgs. If |send| is false for an overlapped socket, the caller
444   // must retain a reference to |msghdr|, |storage|, and the buf members of
445   // |data_buffer| and |control_buffer|, in case WSARecvMsg() returns IO_PENDING
446   // and the result is delivered asynchronously.
447   void PopulateWSAMSG(WSAMSG& message,
448                       SockaddrStorage& storage,
449                       WSABUF* data_buffer,
450                       WSABUF& control_buffer,
451                       bool send);
452   // Sets last_tos_ to the last ECN codepoint contained in |message|.
453   void SetLastTosFromWSAMSG(WSAMSG& message);
454 
455   // Version for using overlapped IO.
456   int InternalRecvFromOverlapped(IOBuffer* buf,
457                                  int buf_len,
458                                  IPEndPoint* address);
459   int InternalSendToOverlapped(IOBuffer* buf,
460                                int buf_len,
461                                const IPEndPoint* address);
462 
463   // Version for using non-blocking IO.
464   int InternalRecvFromNonBlocking(IOBuffer* buf,
465                                   int buf_len,
466                                   IPEndPoint* address);
467   int InternalSendToNonBlocking(IOBuffer* buf,
468                                 int buf_len,
469                                 const IPEndPoint* address);
470 
471   // Applies |socket_options_| to |socket_|. Should be called before
472   // Bind().
473   int SetMulticastOptions();
474   int DoBind(const IPEndPoint& address);
475 
476   // Configures opened `socket_` depending on whether it uses nonblocking IO.
477   void ConfigureOpenedSocket();
478 
479   // This is provided to allow QwaveApi mocking in tests. |UDPSocketWin| method
480   // implementations should call |GetQwaveApi()| instead of
481   // |QwaveApi::GetDefault()| directly.
482   virtual QwaveApi* GetQwaveApi() const;
483 
      // The underlying socket. No default initializer is given here.
      // NOTE(review): confirm every constructor initializes it.
484   SOCKET socket_;
485   int addr_family_ = 0;
486   bool is_connected_ = false;
487 
488   // Bitwise-or'd combination of SocketOptions. Specifies the set of
489   // options that should be applied to |socket_| before Bind().
      // No default initializer is given here; NOTE(review): confirm every
      // constructor initializes it.
490   int socket_options_;
491 
492   // Multicast interface.
493   uint32_t multicast_interface_ = 0;
494 
495   // Multicast socket options cached for SetMulticastOptions().
496   // Cannot be used after Bind().
497   int multicast_time_to_live_ = 1;
498 
499   // These are mutable since they're just cached copies to make
500   // GetPeerAddress/GetLocalAddress smarter.
501   mutable std::unique_ptr<IPEndPoint> local_address_;
502   mutable std::unique_ptr<IPEndPoint> remote_address_;
503 
504   // The core of the socket that can live longer than the socket itself. We pass
505   // resources to the Windows async IO functions and we have to make sure that
506   // they are not destroyed while the OS still references them.
507   scoped_refptr<Core> core_;
508 
509   // True if non-blocking IO is used.
510   bool use_non_blocking_io_ = false;
511 
512   // Watches |read_write_event_|.
513   base::win::ObjectWatcher read_write_watcher_;
514 
515   // Events for read and write.
516   base::win::ScopedHandle read_write_event_;
517 
518   // The buffers used in Read() and Write().
519   scoped_refptr<IOBuffer> read_iobuffer_;
520   scoped_refptr<IOBuffer> write_iobuffer_;
521 
522   int read_iobuffer_len_ = 0;
523   int write_iobuffer_len_ = 0;
524 
      // Non-owning. Presumably the caller-provided |address| from RecvFrom(),
      // which the caller must keep alive until the callback runs - confirm.
525   raw_ptr<IPEndPoint> recv_from_address_ = nullptr;
526 
527   // Cached copy of the current address we're sending to, if any.  Used for
528   // logging.
529   std::unique_ptr<IPEndPoint> send_to_address_;
530 
531   // External callback; called when read is complete.
532   CompletionOnceCallback read_callback_;
533 
534   // External callback; called when write is complete.
535   CompletionOnceCallback write_callback_;
536 
537   NetLogWithSource net_log_;
538 
539   // Maintains remote addresses for QWAVE qos management.
540   std::unique_ptr<DscpManager> dscp_manager_;
541 
542   // Manages decrementing the global open UDP socket counter when this
543   // UDPSocket is destroyed.
544   OwnedUDPSocketCount owned_socket_count_;
545 
      // Value returned by GetLastTos(); see the caveats documented there.
546   DscpAndEcn last_tos_ = {DSCP_DEFAULT, ECN_DEFAULT};
547 
548   // If true, the socket has been configured to report ECN on incoming
549   // datagrams.
550   bool report_ecn_ = false;
551 
552   // Function pointers to the platform implementations of WSARecvMsg() and
553   // WSASendMsg().
554   LPFN_WSARECVMSG wsa_recv_msg_ = nullptr;
555   LPFN_WSASENDMSG wsa_send_msg_ = nullptr;
556 
557   // The ECN codepoint to send on outgoing packets.
558   EcnCodePoint send_ecn_ = ECN_NOT_ECT;
559 
      // Used for the thread-safety checks that DetachFromThread() resets.
560   THREAD_CHECKER(thread_checker_);
561 
562   // Used to prevent null dereferences in OnObjectSignaled, when passing an
563   // error to both read and write callbacks. Cleared in Close()
564   base::WeakPtrFactory<UDPSocketWin> event_pending_{this};
565 };
566 
567 //-----------------------------------------------------------------------------
568 
569 
570 
571 }  // namespace net
572 
573 #endif  // NET_SOCKET_UDP_SOCKET_WIN_H_
574