1 /*
2 * Copyright (C) 2021 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 //! Provides a backing task to implement a network
18
19 use crate::boot_time::{timeout, BootTime, Duration};
20 use crate::config::Config;
21 use crate::connection::Connection;
22 use crate::dispatcher::{QueryError, Response};
23 use crate::encoding;
24 use anyhow::{anyhow, bail, Result};
25 use std::sync::Arc;
26 use tokio::sync::{mpsc, watch};
27 use tokio::task;
28
29 use super::{Query, ServerInfo, SocketTagger, ValidationReporter};
30
31 use log::debug;
32
/// State owned by the backing task for a single network.
///
/// A `Driver` holds the connection to one server, receives [`Command`]s over a channel and
/// publishes the network's [`Status`] through a watch channel. It is created with
/// `Driver::new` and run by awaiting `Driver::drive`.
pub struct Driver {
    /// Description of the server this driver talks to (domain, peer address, socket mark,
    /// network id, URL and whether session resumption is enabled).
    info: ServerInfo,
    /// Configuration handed to `Connection::new` whenever a connection is (re)built.
    config: Config,
    /// Current connection to the server; replaced when a reconnect is needed.
    connection: Connection,
    /// Receiving end of the command channel, drained by `drive`.
    command_rx: mpsc::Receiver<Command>,
    /// Publishes the current [`Status`] of the network to observers.
    status_tx: watch::Sender<Status>,
    /// Callback awaited with the server info and a validity flag once a probe has concluded.
    validation: ValidationReporter,
    /// Passed by reference to `Connection::new`; presumably tags the sockets it opens
    /// (TODO confirm against `SocketTagger`'s definition).
    tag_socket: SocketTagger,
}
42
43 #[derive(Debug)]
44 /// Requests the network can handle
45 pub enum Command {
46 /// Send a DNS query to the network
47 Query(Query),
48 /// Run a probe to check the health of the network. Argument is timeout.
49 Probe(Duration),
50 }
51
52 #[derive(Clone, Debug)]
53 /// Current Network Status
54 ///
55 /// (Unprobed or Failed) can go to (Live or Failed) via Probe.
56 /// Currently, there is no way to go from Live to Failed - probing a live network will short-circuit to returning valid, and query failures do not declare the network failed.
57 pub enum Status {
58 /// Network has not been probed, it may or may not work
59 Unprobed,
60 /// Network is believed to be working
61 Live,
62 /// Network is broken, reason as argument
63 Failed(Arc<anyhow::Error>),
64 }
65
66 impl Status {
is_live(&self) -> bool67 pub fn is_live(&self) -> bool {
68 matches!(self, Self::Live)
69 }
is_failed(&self) -> bool70 pub fn is_failed(&self) -> bool {
71 matches!(self, Self::Failed(_))
72 }
73 }
74
build_connection( info: &ServerInfo, tag_socket: &SocketTagger, config: &mut Config, session: Option<Vec<u8>>, ) -> Result<Connection>75 async fn build_connection(
76 info: &ServerInfo,
77 tag_socket: &SocketTagger,
78 config: &mut Config,
79 session: Option<Vec<u8>>,
80 ) -> Result<Connection> {
81 use std::ops::DerefMut;
82 Ok(Connection::new(
83 info.domain.as_deref(),
84 info.peer_addr,
85 info.sk_mark,
86 info.net_id,
87 tag_socket,
88 config.take().await.deref_mut(),
89 session,
90 )
91 .await?)
92 }
93
94 impl Driver {
95 const MAX_BUFFERED_COMMANDS: usize = 50;
96
new( info: ServerInfo, mut config: Config, validation: ValidationReporter, tag_socket: SocketTagger, ) -> Result<(Self, mpsc::Sender<Command>, watch::Receiver<Status>)>97 pub async fn new(
98 info: ServerInfo,
99 mut config: Config,
100 validation: ValidationReporter,
101 tag_socket: SocketTagger,
102 ) -> Result<(Self, mpsc::Sender<Command>, watch::Receiver<Status>)> {
103 let (command_tx, command_rx) = mpsc::channel(Self::MAX_BUFFERED_COMMANDS);
104 let (status_tx, status_rx) = watch::channel(Status::Unprobed);
105 let connection = build_connection(&info, &tag_socket, &mut config, None).await?;
106 Ok((
107 Self { info, config, connection, status_tx, command_rx, validation, tag_socket },
108 command_tx,
109 status_rx,
110 ))
111 }
112
drive(mut self) -> Result<()>113 pub async fn drive(mut self) -> Result<()> {
114 while let Some(cmd) = self.command_rx.recv().await {
115 match cmd {
116 Command::Probe(duration) =>
117 if let Err(e) = self.probe(duration).await { self.status_tx.send(Status::Failed(Arc::new(e)))? },
118 Command::Query(query) =>
119 if let Err(e) = self.send_query(query).await { debug!("Unable to send query: {:?}", e) },
120 };
121 }
122 Ok(())
123 }
124
probe(&mut self, probe_timeout: Duration) -> Result<()>125 async fn probe(&mut self, probe_timeout: Duration) -> Result<()> {
126 if self.status_tx.borrow().is_failed() {
127 debug!("Network is currently failed, reconnecting");
128 // If our network is currently failed, it may be due to issues with the connection.
129 // Re-establish before re-probing
130 self.connection =
131 build_connection(&self.info, &self.tag_socket, &mut self.config, None).await?;
132 self.status_tx.send(Status::Unprobed)?;
133 }
134 if self.status_tx.borrow().is_live() {
135 // If we're already validated, short circuit
136 (self.validation)(&self.info, true).await;
137 return Ok(());
138 }
139 self.force_probe(probe_timeout).await
140 }
141
force_probe(&mut self, probe_timeout: Duration) -> Result<()>142 async fn force_probe(&mut self, probe_timeout: Duration) -> Result<()> {
143 debug!("Sending probe to server {} on Network {}", self.info.peer_addr, self.info.net_id);
144 let probe = encoding::probe_query()?;
145 let dns_request = encoding::dns_request(&probe, &self.info.url)?;
146 let expiry = BootTime::now().checked_add(probe_timeout);
147 let request = async {
148 match self.connection.query(dns_request, expiry).await {
149 Err(e) => self.status_tx.send(Status::Failed(Arc::new(anyhow!(e)))),
150 Ok(rsp) => {
151 if let Some(_stream) = rsp.await {
152 // TODO verify stream contents
153 self.status_tx.send(Status::Live)
154 } else {
155 self.status_tx.send(Status::Failed(Arc::new(anyhow!("Empty response"))))
156 }
157 }
158 }
159 };
160 match timeout(probe_timeout, request).await {
161 // Timed out
162 Err(time) => self.status_tx.send(Status::Failed(Arc::new(anyhow!(
163 "Probe timed out after {:?} (timeout={:?})",
164 time,
165 probe_timeout
166 )))),
167 // Query completed
168 Ok(r) => r,
169 }?;
170 let valid = self.status_tx.borrow().is_live();
171 (self.validation)(&self.info, valid).await;
172 Ok(())
173 }
174
send_query(&mut self, query: Query) -> Result<()>175 async fn send_query(&mut self, query: Query) -> Result<()> {
176 // If the associated receiver has been closed, meaning that the request has already
177 // timed out, just drop it. This check helps drain the channel quickly in the case
178 // where the network is stalled.
179 if query.response.is_closed() {
180 bail!("Abandoning expired DNS request")
181 }
182
183 if !self.connection.wait_for_live().await {
184 let session =
185 if self.info.use_session_resumption { self.connection.session() } else { None };
186 // Try reconnecting
187 self.connection =
188 build_connection(&self.info, &self.tag_socket, &mut self.config, session).await?;
189 }
190 let request = encoding::dns_request(&query.query, &self.info.url)?;
191 let stream_fut = self.connection.query(request, Some(query.expiry)).await?;
192 task::spawn(async move {
193 let stream = match stream_fut.await {
194 Some(stream) => stream,
195 None => {
196 debug!("Connection died while processing request");
197 // We don't care if the response is gone
198 let _ =
199 query.response.send(Response::Error { error: QueryError::ConnectionError });
200 return;
201 }
202 };
203 // We don't care if the response is gone.
204 let _ = if let Some(err) = stream.error {
205 query.response.send(Response::Error { error: QueryError::Reset(err) })
206 } else {
207 query.response.send(Response::Success { answer: stream.data })
208 };
209 });
210 Ok(())
211 }
212 }
213