close connections which violate policy after updates #772

Merged (21 commits) on Feb 5, 2024

Commits:
2f36a49
initial impl for draining connections which are invalid after policy …
ilrudie Jan 16, 2024
eeef8b0
addressing early comments, fixing deadlocks, fixing drain logic
ilrudie Jan 17, 2024
07589b6
separate connection close and proxy drain into different channels
ilrudie Jan 22, 2024
2ac3e7a
fix cargo fmt error
ilrudie Jan 22, 2024
e042654
unit testing for ConnectionManager
ilrudie Jan 23, 2024
b7825f9
sort connections to remove flakiness from indeterminate vec ordering
ilrudie Jan 23, 2024
5080ea8
fix trait impls for Identity per clippy
ilrudie Jan 23, 2024
99dacd9
more clippy fixes
ilrudie Jan 23, 2024
e90bf03
impl closing denied connections for inbound_passthrough, DRY async fn…
ilrudie Jan 23, 2024
fa5dd8a
testing for policy_watcher
ilrudie Jan 24, 2024
59594d3
cleanup extra newline
ilrudie Jan 24, 2024
4808316
use hickory_resolver instead of trust_dns_resolver for connection_man…
ilrudie Jan 24, 2024
0ac3b25
enhancement to stop leaking connection channels in the connection man…
ilrudie Jan 24, 2024
79c12c8
remove unnecessary atomic
ilrudie Jan 30, 2024
55e6afa
use the map.entry... suggestion
ilrudie Jan 30, 2024
e4f4ce6
derive PartialOrd and Ord instead of implement
ilrudie Jan 30, 2024
f6d174b
alert policy subscribers at most once per xds update
ilrudie Jan 31, 2024
aadcc51
remove unneeded clone
ilrudie Jan 31, 2024
a840456
separate beginning to manage a conn from requesting a close receiver
ilrudie Feb 2, 2024
e2468da
register connections in outbound as well
ilrudie Feb 2, 2024
45c243f
switch to borrows for connection_manager, audit clone usage
ilrudie Feb 2, 2024
15 changes: 15 additions & 0 deletions src/identity/manager.rs
@@ -42,6 +42,21 @@ pub enum Identity {
},
}

impl Ord for Identity {
// Not sure this is a super legit compare but I think it should work for POC
Member:
Given this is no longer a POC, should we do a more robust approach?

Contributor Author:
Good call. I do want to consider whether this is adequate.

Contributor Author:
Using something like this would force us to consider how Identity::X should be compared to Identity::Spiffe if/when a new identity format is added.

impl Ord for Identity {
    fn cmp(&self, other: &Self) -> Ordering {
        let s = match self {
            Identity::Spiffe {
                trust_domain,
                namespace,
                service_account,
            } => trust_domain.to_owned() + namespace + service_account,
        };
        let o = match other {
            Identity::Spiffe {
                trust_domain,
                namespace,
                service_account,
            } => trust_domain.to_owned() + namespace + service_account,
        };
        s.cmp(&o)
    }
}

Member:

Why do we actually need Ord?

Contributor Author:

Never mind, they can be derived... that's the play.

Contributor Author:

Ord is required for sorting, which is used in the tests.

    fn cmp(&self, other: &Self) -> Ordering {
        let s = format!("{self}");
        let o = format!("{other}");
        s.cmp(&o)
    }
}

impl PartialOrd for Identity {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl EncodeLabelValue for Identity {
    fn encode(&self, writer: &mut LabelValueEncoder) -> Result<(), std::fmt::Error> {
        writer.write_str(&self.to_string())
1 change: 1 addition & 0 deletions src/proxy.rs
@@ -41,6 +41,7 @@ use crate::state::workload::{network_addr, Workload};
use crate::state::DemandProxyState;
use crate::{config, identity, socket, tls};

mod connection_manager;
mod inbound;
mod inbound_passthrough;
#[allow(non_camel_case_types)]
359 changes: 359 additions & 0 deletions src/proxy/connection_manager.rs
@@ -0,0 +1,359 @@
// Copyright Istio Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use crate::proxy::error;
use crate::rbac::Connection;
use crate::state::DemandProxyState;
use drain;
use std::collections::HashMap;
use std::sync::{atomic::AtomicUsize, Arc};
use tokio::sync::watch;
use tokio::sync::RwLock;
use tracing::{debug, info};

struct ConnectionDrain {
    tx: drain::Signal,
    rx: drain::Watch,
    count: AtomicUsize,
}

impl ConnectionDrain {
    fn new() -> Self {
        let (tx, rx) = drain::channel();
        let count = AtomicUsize::new(1);
        ConnectionDrain { tx, rx, count }
    }

    /// drain drops the internal reference to rx and then signals drain on the tx
    // always inlined; this is for convenience so that we don't forget to drop the rx, but there's really no reason for it to grow the stack
    #[inline(always)]
    async fn drain(self) {
        drop(self.rx); // very important: drain cannot complete if there are outstanding rx
        self.tx.drain().await;
    }
}

#[derive(Clone)]
pub struct ConnectionManager {
Member:
We already have a "pool" tracking connections. It seems like there, ideally, would be a single data structure tracking connections. I guess Pool tracks outer HBONE connections while this tracks inner user connections, though. Also I don't see a feasible way to use 1 structure anyways, so mostly hypothetical.

Contributor Author:
It's a good thought. I couldn't work out how to do it either though.

    drains: Arc<RwLock<HashMap<Connection, ConnectionDrain>>>,
}

impl ConnectionManager {
    pub fn new() -> Self {
        ConnectionManager {
            drains: Arc::new(RwLock::new(HashMap::new())),
        }
    }

    // register a connection with the manager and get a channel to receive on
    pub async fn track(self, c: &Connection) -> drain::Watch {
        let cd = ConnectionDrain::new();
        let rx = cd.rx.clone();
        let mut drains = self.drains.write().await;
        if let Some(w) = drains.remove(c) {
Member:

nit: del+mutate+insert can be done with code like:

map.entry("poneyland")
   .and_modify(|e| { *e += 1 })
   .or_insert(42);

Member:

maybe not with the return rx aspect though

Contributor Author:

modified rust playground example

Seems like it could work. TY

Contributor Author (@ilrudie, Jan 30, 2024):

This could very well be a step too far and difficult to grok, but:

    // register a connection with the manager and get a channel to receive on
    pub async fn track(self, c: &Connection) -> drain::Watch {
        self.drains
            .write()
            .await
            .entry(c.to_owned())
            .and_modify(|cd| cd.count += 1)
            .or_insert(ConnectionDrain::new())
            .rx
            .clone()
    }

            w.count.fetch_add(1, std::sync::atomic::Ordering::SeqCst);
            let rx = w.rx.clone();
            drains.insert(c.clone(), w);
            debug!("there are {} tracked connections", drains.len());
            return rx;
        }
        drains.insert(c.clone(), cd);
        debug!("there are {} tracked connections", drains.len());
        rx
    }

    // releases tracking on a connection
    // uses a counter to determine if there are other tracked connections or not, so it may retain the tx/rx channels when necessary
    pub async fn release(self, c: &Connection) {
        let mut drains = self.drains.write().await;
        if let Some((k, v)) = drains.remove_entry(c) {
            if v.count.fetch_sub(1, std::sync::atomic::Ordering::SeqCst) > 1 {
Member:
nit: why do we need atomic operations if we have a write lock?

Contributor Author:
You're correct. I was going to try something a little fancier and ended up going with this without removing the atomic. A lot of this logic may be removed anyway, though, if we want to switch off the drain crate onto a different type of channel, as Ben suggested elsewhere.

Contributor Author:
Should be better now. Atomic removed

                // something else is tracking this connection, retain
                drains.insert(k, v);
Contributor (@bleggett, Jan 24, 2024):
We talked about this already - but drain-rs is a very light and rather inflexible wrapper around plain old tokio channels, which are considerably more flexible and not that much harder to use, and I suspect there might be other ways to accomplish this by using tokio channels directly (different channel type, or something like WeakSender), without the manual external atomic count.

But the effect would be the same so it is probably not worth it, this will do the job AFAICT - so just FYI if drain-rs gives you trouble and it's easier to drop or replace, I don't have a problem with ditching it.

Contributor Author:

It's a fair idea. I'm not sure we strictly need the bidirectional close functionality the crate offers for this case... in fact we may prefer fire-and-forget, since for our purposes right now we don't actually care whether the receiver gets a signal or an error. We're sending one bit of information which just means: do your thing. At any rate, this is certainly something to consider.

            }
        }
    }

    // signal all connections listening to this channel to take action (typically terminate traffic)
Member:
comment seems confusing, or I don't understand it. Signal all connections? But the input is 1 connection.

Is Connection representing the outer hbone connection, and drain() waits until all inner connects close?

Contributor Author:

Potentially a single rbac::Connection could have multiple connections handling traffic, I think. In that case they all need to be closed, and this code should handle that case if it arises.

    async fn close(&self, c: &Connection) {
        if let Some(cd) = self.drains.clone().write().await.remove(c) {
Member:
remove clone

            cd.drain().await;
        } else {
            // this is bad, possibly drain called twice
            error!("requested drain on a Connection which wasn't initialized");
        }
    }

    // get a list of all connections being tracked
    async fn connections(&self) -> Vec<Connection> {
        // potentially large copy under read lock, could require optimization
        self.drains.read().await.keys().cloned().collect()
    }
}

pub async fn policy_watcher(
    state: DemandProxyState,
    mut stop_rx: watch::Receiver<()>,
    connection_manager: ConnectionManager,
    parent_proxy: &str,
) {
    let mut policies_changed = state.read().policies.subscribe();
    loop {
        tokio::select! {
            _ = stop_rx.changed() => {
                break;
            }
            _ = policies_changed.changed() => {
                let connections = connection_manager.connections().await;
                for conn in connections {
                    if !state.assert_rbac(&conn).await {

Comment:

Sorry, I'm not a Rust expert - does this await individually or globally? Any time there's IO, you probably don't want to stall in a loop in a switch - you may overflow the pending events because IO is slow. It's best to fire-and-forget and then let someone reap the zombies.

Contributor Author:

This will await the individual assertion against the one connection, but await doesn't mean block (there is a specific block function if that's what you want, though). If the Future being awaited is not ready, it relinquishes control and will be polled later by the executor of the task/thread.

Rust's Futures are somewhat unique in that they are lazy. If nothing drives them to completion they will not do any work, so we can't totally fire and forget. We can either await them and let the executor/callback model poll them, or we could collect all the futures and join them later. If we do neither, no work would happen.

Comment:

I feel like you do want to block the loop, or at least debounce it, to avoid edge-triggered event spam in the runtime. But I have no idea how to express that in Rust. Maybe a separate actor that is "fast" in consuming policy events but "slow" in enacting them.

Contributor Author:

Yeah, I think having scoped events would be a solid optimization. IMO it would be better to keep this PR a little smaller and then iterate on some optimizations as we move forward, but if folks strongly disagree we can start optimizing now.

Contributor Author:

The code you are commenting on is sort of that actor (in concept at least). It's being spun up in its own task so it should be (at least somewhat) independent of the tasks which are actually moving data.

Member:

If I understand the event-spam concern, is it that we enqueue multiple times to trigger this code? Like, while we are looping here, we get changed() multiple times stacked up?

If so, I think it will have at most one pending. That being said, you could still hit some spam, I guess.

Contributor Author:

I've changed the implementation so that sends to policy subscribers are less frequent in cases where we've got batched updates. Should help.

Member:

There can be a race between a connection being tracked and a policy update, like:

t0: a connection is established with the old rbac
t1: the rbac is updated
t2: the policy watcher runs drain here
t3: the connection established at t0 gets tracked

The connection actually should be closed.

                        connection_manager.close(&conn).await;
                        info!("{parent_proxy} connection {conn} closed because it's no longer allowed after a policy update");
                    }
                }
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use drain::Watch;
    use hickory_resolver::config::{ResolverConfig, ResolverOpts};
    use std::net::{Ipv4Addr, SocketAddrV4};
    use std::sync::{Arc, RwLock};
    use std::time::Duration;
    use tokio::sync::watch;

    use crate::rbac::Connection;
    use crate::state::{DemandProxyState, ProxyState};
    use crate::xds::istio::security::{Action, Authorization, Scope};
    use crate::xds::ProxyStateUpdateMutator;

    use super::ConnectionManager;

    #[tokio::test]
    async fn test_connection_manager_close() {
        // setup a new ConnectionManager
        let connection_manager = ConnectionManager::new();
        // ensure drains is empty
        assert_eq!(connection_manager.drains.read().await.len(), 0);
        assert_eq!(connection_manager.connections().await.len(), 0);

        // track a new connection
        let conn1 = Connection {
            src_identity: None,
            src_ip: std::net::IpAddr::V4(Ipv4Addr::new(192, 168, 0, 1)),
            dst_network: "".to_string(),
            dst: std::net::SocketAddr::V4(SocketAddrV4::new(Ipv4Addr::new(192, 168, 0, 2), 8080)),
        };
        let close1 = connection_manager.clone().track(&conn1).await;
        // ensure drains contains exactly 1 item
        assert_eq!(connection_manager.drains.read().await.len(), 1);
        assert_eq!(connection_manager.connections().await.len(), 1);
        assert_eq!(connection_manager.connections().await, vec!(conn1.clone()));

        // setup a second track on the same connection
        let another_conn1 = conn1.clone();
        let another_close1 = connection_manager.clone().track(&another_conn1).await;
        // ensure drains still contains exactly 1 item
        assert_eq!(connection_manager.drains.read().await.len(), 1);
        assert_eq!(connection_manager.connections().await.len(), 1);
        assert_eq!(connection_manager.connections().await, vec!(conn1.clone()));

        // track a second connection
        let conn2 = Connection {
            src_identity: None,
            src_ip: std::net::IpAddr::V4(Ipv4Addr::new(192, 168, 0, 3)),
            dst_network: "".to_string(),
            dst: std::net::SocketAddr::V4(SocketAddrV4::new(Ipv4Addr::new(192, 168, 0, 2), 8080)),
        };
        let close2 = connection_manager.clone().track(&conn2).await;
        // ensure drains contains exactly 2 items
        assert_eq!(connection_manager.drains.read().await.len(), 2);
        assert_eq!(connection_manager.connections().await.len(), 2);
        let mut connections = connection_manager.connections().await;
        connections.sort(); // ordering cannot be guaranteed without sorting
        assert_eq!(connections, vec![conn1.clone(), conn2.clone()]);

        // spawn tasks to assert that we close in a timely manner for conn1
        tokio::spawn(assert_close(close1));
        tokio::spawn(assert_close(another_close1));
        // close conn1
        connection_manager.close(&conn1).await;
        // ensure drains contains exactly 1 item
        assert_eq!(connection_manager.drains.read().await.len(), 1);
        assert_eq!(connection_manager.connections().await.len(), 1);
        assert_eq!(connection_manager.connections().await, vec!(conn2.clone()));

        // spawn a task to assert that we close in a timely manner for conn2
        tokio::spawn(assert_close(close2));
        // close conn2
        connection_manager.close(&conn2).await;
        // assert that drains is empty again
        assert_eq!(connection_manager.drains.read().await.len(), 0);
        assert_eq!(connection_manager.connections().await.len(), 0);
    }

    #[tokio::test]
    async fn test_connection_manager_release() {
        // setup a new ConnectionManager
        let connection_manager = ConnectionManager::new();
        // ensure drains is empty
        assert_eq!(connection_manager.drains.read().await.len(), 0);
        assert_eq!(connection_manager.connections().await.len(), 0);

        // create a new connection
        let conn1 = Connection {
            src_identity: None,
            src_ip: std::net::IpAddr::V4(Ipv4Addr::new(192, 168, 0, 1)),
            dst_network: "".to_string(),
            dst: std::net::SocketAddr::V4(SocketAddrV4::new(Ipv4Addr::new(192, 168, 0, 2), 8080)),
        };

        // create a second connection
        let conn2 = Connection {
            src_identity: None,
            src_ip: std::net::IpAddr::V4(Ipv4Addr::new(192, 168, 0, 3)),
            dst_network: "".to_string(),
            dst: std::net::SocketAddr::V4(SocketAddrV4::new(Ipv4Addr::new(192, 168, 0, 2), 8080)),
        };

        let another_conn1 = conn1.clone();

        // watch the connections
        let close1 = connection_manager.clone().track(&conn1).await;
        let another_close1 = connection_manager.clone().track(&another_conn1).await;
        // ensure drains contains exactly 1 item
        assert_eq!(connection_manager.drains.read().await.len(), 1);
        assert_eq!(connection_manager.connections().await.len(), 1);
        assert_eq!(connection_manager.connections().await, vec!(conn1.clone()));

        // release conn1's clone
        drop(another_close1);
        connection_manager.clone().release(&another_conn1).await;
        // ensure drains still contains exactly 1 item
        assert_eq!(connection_manager.drains.read().await.len(), 1);
        assert_eq!(connection_manager.connections().await.len(), 1);
        assert_eq!(connection_manager.connections().await, vec!(conn1.clone()));

        // track conn2
        let close2 = connection_manager.clone().track(&conn2).await;
        // ensure drains contains exactly 2 items
        assert_eq!(connection_manager.drains.read().await.len(), 2);
        assert_eq!(connection_manager.connections().await.len(), 2);
        let mut connections = connection_manager.connections().await;
        connections.sort(); // ordering cannot be guaranteed without sorting
        assert_eq!(connections, vec![conn1.clone(), conn2.clone()]);

        // release conn1
        drop(close1);
        connection_manager.clone().release(&conn1).await;
        // ensure drains contains exactly 1 item
        assert_eq!(connection_manager.drains.read().await.len(), 1);
        assert_eq!(connection_manager.connections().await.len(), 1);
        assert_eq!(connection_manager.connections().await, vec!(conn2.clone()));

        // clone conn2 and track it
        let another_conn2 = conn2.clone();
        let another_close2 = connection_manager.clone().track(&another_conn2).await;
        drop(close2);
        // release tracking on conn2
        connection_manager.clone().release(&conn2).await;
        // ensure drains still contains exactly 1 item
        assert_eq!(connection_manager.drains.read().await.len(), 1);
        assert_eq!(connection_manager.connections().await.len(), 1);
        assert_eq!(
            connection_manager.connections().await,
            vec!(another_conn2.clone())
        );

        // release tracking on conn2's clone
        drop(another_close2);
        connection_manager.clone().release(&another_conn2).await;
        // ensure drains contains exactly 0 items
        assert_eq!(connection_manager.drains.read().await.len(), 0);
        assert_eq!(connection_manager.connections().await.len(), 0);
    }

    #[tokio::test]
    async fn test_policy_watcher_lifecycle() {
        // preamble: setup an environment
        let state = Arc::new(RwLock::new(ProxyState::default()));
        let dstate = DemandProxyState::new(
            state.clone(),
            None,
            ResolverConfig::default(),
            ResolverOpts::default(),
        );
        let connection_manager = ConnectionManager::new();
        let parent_proxy = "test";
        let (stop_tx, stop_rx) = watch::channel(());
        let state_mutator = ProxyStateUpdateMutator::new_no_fetch();

        // clones to move into the spawned task
        let ds = dstate.clone();
        let cm = connection_manager.clone();
        // spawn a task which watches policy and asserts that the policy watcher stops correctly
        tokio::spawn(async move {
            let res = tokio::time::timeout(
                Duration::from_secs(1),
                super::policy_watcher(ds, stop_rx, cm, parent_proxy),
            )
            .await;
            assert!(res.is_ok())
        });

        // create a test connection
        let conn1 = Connection {
            src_identity: None,
            src_ip: std::net::IpAddr::V4(Ipv4Addr::new(192, 168, 0, 1)),
            dst_network: "".to_string(),
            dst: std::net::SocketAddr::V4(SocketAddrV4::new(Ipv4Addr::new(192, 168, 0, 2), 8080)),
        };
        // watch the connection
        let close1 = connection_manager.clone().track(&conn1).await;

        // generate a policy which denies everything
        let auth = Authorization {
            name: "allow-nothing".to_string(),
            action: Action::Deny as i32,
            scope: Scope::Global as i32,
            namespace: "default".to_string(),
            rules: vec![],
        };

        // spawn an assertion that our connection close is received
        tokio::spawn(assert_close(close1));

        // update our state
        let mut s = state
            .write()
            .expect("test fails if we're unable to get a write lock on state");
        let res = state_mutator.insert_authorization(&mut s, auth);
        // assert that the update was OK
        assert!(res.is_ok());
        // release lock
        drop(s);

        // send the signal which stops the policy watcher
        stop_tx.send_replace(());
    }

    // small helper to assert that the Watches are working in a timely manner
    async fn assert_close(c: Watch) {
        let result = tokio::time::timeout(Duration::from_secs(1), c.signaled()).await;
        assert!(result.is_ok())
    }
}
}
Loading