From 6e771c7d8c0d000aeffc93d1698db2f4b66b5140 Mon Sep 17 00:00:00 2001 From: Damien Date: Thu, 20 Oct 2022 09:53:38 +0100 Subject: [PATCH] feat: gateway admin revive (#412) * feat: gateway admin command (revive) * fmt * clippy * refactor: revive deployers using GatewayService * tests: add ContextArgs * refactor: simplify passing around of fqdn * tests: update test archive * refactor: remove stray exec.rs file * refactor: unused is_error() Co-authored-by: chesedo --- gateway/src/api/latest.rs | 9 ++--- gateway/src/args.rs | 46 ++++++++++++++++++------- gateway/src/lib.rs | 38 ++++++++++---------- gateway/src/main.rs | 20 +++++++++-- gateway/src/project.rs | 56 ++++++++++++++++++++++++++++++ gateway/src/service.rs | 59 +++++++++++++++++++++++--------- gateway/src/worker.rs | 52 +++++++++++++++++----------- gateway/tests/hello_world.crate | Bin 933 -> 934 bytes 8 files changed, 203 insertions(+), 77 deletions(-) diff --git a/gateway/src/api/latest.rs b/gateway/src/api/latest.rs index 69ca3cfdb..524bb42a2 100644 --- a/gateway/src/api/latest.rs +++ b/gateway/src/api/latest.rs @@ -190,8 +190,7 @@ pub mod tests { #[tokio::test] async fn api_create_get_delete_projects() -> anyhow::Result<()> { let world = World::new().await; - let service = - Arc::new(GatewayService::init(world.args(), world.fqdn(), world.pool()).await); + let service = Arc::new(GatewayService::init(world.args(), world.pool()).await); let (sender, mut receiver) = channel::(256); tokio::spawn(async move { @@ -326,8 +325,7 @@ pub mod tests { #[tokio::test] async fn api_create_get_users() -> anyhow::Result<()> { let world = World::new().await; - let service = - Arc::new(GatewayService::init(world.args(), world.fqdn(), world.pool()).await); + let service = Arc::new(GatewayService::init(world.args(), world.pool()).await); let (sender, mut receiver) = channel::(256); tokio::spawn(async move { @@ -416,8 +414,7 @@ pub mod tests { #[tokio::test(flavor = "multi_thread")] async fn status() { let world = World::new().await; - let service = - Arc::new(GatewayService::init(world.args(), world.fqdn(), world.pool()).await); + let service = Arc::new(GatewayService::init(world.args(), world.pool()).await); let (sender, mut receiver) = channel::(1); let (ctl_send, ctl_recv) = oneshot::channel(); diff --git a/gateway/src/args.rs b/gateway/src/args.rs index 5f65a7480..ae0b1bced 100644 --- a/gateway/src/args.rs +++ b/gateway/src/args.rs @@ -19,6 +19,7 @@ pub struct Args { pub enum Commands { Start(StartArgs), Init(InitArgs), + Exec(ExecCmds), } #[derive(clap::Args, Debug, Clone)] @@ -29,6 +30,35 @@ pub struct StartArgs { /// Address to bind the user plane to #[arg(long, default_value = "127.0.0.1:8000")] pub user: SocketAddr, + #[command(flatten)] + pub context: ContextArgs, +} + +#[derive(clap::Args, Debug, Clone)] +pub struct InitArgs { + /// Name of initial account to create + #[arg(long)] + pub name: String, + /// Key to assign to initial account + #[arg(long)] + pub key: Option, +} + +#[derive(clap::Args, Debug, Clone)] +pub struct ExecCmds { + #[command(flatten)] + pub context: ContextArgs, + #[command(subcommand)] + pub command: ExecCmd, +} + +#[derive(Subcommand, Debug, Clone)] +pub enum ExecCmd { + Revive, +} + +#[derive(clap::Args, Debug, Clone)] +pub struct ContextArgs { /// Default image to deploy user runtimes into #[arg(long, default_value = "public.ecr.aws/shuttle/deployer:latest")] pub image: String, @@ -40,23 +70,13 @@ pub struct StartArgs { /// the provisioner service #[arg(long, default_value = "provisioner")] pub provisioner_host: String, - /// The path to the docker daemon socket - #[arg(long, default_value = "/var/run/docker.sock")] - pub docker_host: String, /// The Docker Network name in which to deploy user runtimes #[arg(long, default_value = "shuttle_default")] pub network_name: String, /// FQDN where the proxy can be reached at #[arg(long)] pub proxy_fqdn: FQDN, -} - -#[derive(clap::Args, Debug, Clone)] -pub struct InitArgs { - /// Name of initial account to create - #[arg(long)] - pub name: String, - /// Key to assign to initial account - #[arg(long)] - pub key: Option, + /// The path to the docker daemon socket + #[arg(long, default_value = "/var/run/docker.sock")] + pub docker_host: String, } diff --git a/gateway/src/lib.rs b/gateway/src/lib.rs index d5d2980bd..6a99be184 100644 --- a/gateway/src/lib.rs +++ b/gateway/src/lib.rs @@ -287,7 +287,7 @@ pub mod tests { use tracing::info; use crate::api::make_api; - use crate::args::StartArgs; + use crate::args::{ContextArgs, StartArgs}; use crate::auth::User; use crate::proxy::make_proxy; use crate::service::{ContainerSettings, GatewayService, MIGRATIONS}; @@ -485,7 +485,6 @@ pub mod tests { args: StartArgs, hyper: HyperClient, pool: SqlitePool, - fqdn: String, } #[derive(Clone, Copy)] @@ -493,13 +492,11 @@ pub mod tests { pub docker: &'c Docker, pub container_settings: &'c ContainerSettings, pub hyper: &'c HyperClient, - pub fqdn: &'c str, } impl World { pub async fn new() -> Self { let docker = Docker::connect_with_local_defaults().unwrap(); - let fqdn = "test.shuttleapp.rs".to_string(); docker .list_images::<&str>(None) @@ -529,17 +526,19 @@ pub mod tests { let args = StartArgs { control, - docker_host, user, - image, - prefix, - provisioner_host, - network_name, - proxy_fqdn: FQDN::from_str(&fqdn).unwrap(), + context: ContextArgs { + docker_host, + image, + prefix, + provisioner_host, + network_name, + proxy_fqdn: FQDN::from_str("test.shuttleapp.rs").unwrap(), + }, }; - let settings = ContainerSettings::builder(&docker, fqdn.clone()) - .from_args(&args) + let settings = ContainerSettings::builder(&docker) + .from_args(&args.context) .await; let hyper = HyperClient::builder().build(HttpConnector::new()); @@ -553,12 +552,11 @@ pub mod tests { args, hyper, pool, - fqdn, } } - pub fn args(&self) -> StartArgs { - self.args.clone() + pub fn args(&self) -> ContextArgs { + self.args.context.clone() } pub fn pool(&self) -> SqlitePool { @@ -570,7 +568,11 @@ pub mod tests { } pub fn fqdn(&self) -> String { - self.fqdn.clone() + self.args() + .proxy_fqdn + .to_string() + .trim_end_matches('.') + .to_string() } } @@ -580,7 +582,6 @@ pub mod tests { docker: &self.docker, container_settings: &self.settings, hyper: &self.hyper, - fqdn: &self.fqdn, } } } @@ -598,8 +599,7 @@ pub mod tests { #[tokio::test] async fn end_to_end() { let world = World::new().await; - let service = - Arc::new(GatewayService::init(world.args(), world.fqdn(), world.pool()).await); + let service = Arc::new(GatewayService::init(world.args(), world.pool()).await); let worker = Worker::new(Arc::clone(&service)); let (log_out, mut log_in) = channel(256); diff --git a/gateway/src/main.rs b/gateway/src/main.rs index 5a01f5e48..24df027fc 100644 --- a/gateway/src/main.rs +++ b/gateway/src/main.rs @@ -1,12 +1,12 @@ use clap::Parser; use futures::prelude::*; -use shuttle_gateway::args::{Args, Commands, InitArgs}; +use shuttle_gateway::args::{Args, Commands, ExecCmd, ExecCmds, InitArgs}; use shuttle_gateway::auth::Key; use shuttle_gateway::proxy::make_proxy; use shuttle_gateway::service::{GatewayService, MIGRATIONS}; use shuttle_gateway::worker::{Work, Worker}; use shuttle_gateway::{api::make_api, args::StartArgs}; -use shuttle_gateway::{Refresh, Service}; +use shuttle_gateway::{project, Refresh, Service}; use sqlx::migrate::MigrateDatabase; use sqlx::{query, Sqlite, SqlitePool}; use std::io; @@ -55,16 +55,18 @@ async fn main() -> io::Result<()> { match args.command { Commands::Start(start_args) => start(db, start_args).await, Commands::Init(init_args) => init(db, init_args).await, + Commands::Exec(exec_cmd) => exec(db, exec_cmd).await, } } async fn start(db: SqlitePool, args: StartArgs) -> io::Result<()> { let fqdn = args + .context .proxy_fqdn .to_string() .trim_end_matches('.') .to_string(); - let gateway = Arc::new(GatewayService::init(args.clone(), fqdn.clone(), db).await); + let gateway = Arc::new(GatewayService::init(args.context.clone(), db).await); let worker = Worker::new(Arc::clone(&gateway)); @@ -146,3 +148,15 @@ async fn init(db: SqlitePool, args: InitArgs) -> io::Result<()> { println!("`{}` created as super user with key: {key}", args.name); Ok(()) } + +async fn exec(db: SqlitePool, exec_cmd: ExecCmds) -> io::Result<()> { + let gateway = GatewayService::init(exec_cmd.context.clone(), db).await; + + match exec_cmd.command { + ExecCmd::Revive => project::exec::revive(gateway) + .await + .map_err(|e| io::Error::new(io::ErrorKind::Other, e))?, + }; + + Ok(()) +} diff --git a/gateway/src/project.rs b/gateway/src/project.rs index 7f5d983ec..4e80925c3 100644 --- a/gateway/src/project.rs +++ b/gateway/src/project.rs @@ -703,6 +703,62 @@ impl<'c> State<'c> for ProjectError { } } +pub mod exec { + use bollard::service::ContainerState; + + use crate::{ + service::GatewayService, + worker::{do_work, Work}, + }; + + use super::*; + + pub async fn revive(gateway: GatewayService) -> Result<(), ProjectError> { + let mut mutations = Vec::new(); + + for Work { + project_name, + account_name, + work, + } in gateway + .iter_projects() + .await + .expect("could not list projects") + { + if let Project::Errored(ProjectError { ctx: Some(ctx), .. }) = work { + if let Some(container) = ctx.container() { + if let Ok(container) = gateway + .context() + .docker() + .inspect_container(safe_unwrap!(container.id), None) + .await + { + if let Some(ContainerState { + status: Some(ContainerStateStatusEnum::EXITED), + .. + }) = container.state + { + mutations.push(Work { + project_name, + account_name, + work: Project::Stopped(ProjectStopped { container }), + }); + } + } + } + } + } + + for work in mutations { + debug!(?work, "project will be revived"); + + do_work(work, &gateway).await; + } + + Ok(()) + } +} + #[cfg(test)] pub mod tests { diff --git a/gateway/src/service.rs b/gateway/src/service.rs index 2cae0e7bf..d8a84f712 100644 --- a/gateway/src/service.rs +++ b/gateway/src/service.rs @@ -20,7 +20,7 @@ use sqlx::types::Json as SqlxJson; use sqlx::{query, Error as SqlxError, Row}; use tracing::debug; -use crate::args::StartArgs; +use crate::args::ContextArgs; use crate::auth::{Key, User}; use crate::project::{self, Project}; use crate::worker::Work; @@ -43,33 +43,35 @@ pub struct ContainerSettingsBuilder<'d> { image: Option, provisioner: Option, network_name: Option, - fqdn: String, + fqdn: Option, } impl<'d> ContainerSettingsBuilder<'d> { - pub fn new(docker: &'d Docker, fqdn: String) -> Self { + pub fn new(docker: &'d Docker) -> Self { Self { docker, prefix: None, image: None, provisioner: None, network_name: None, - fqdn, + fqdn: None, } } - pub async fn from_args(self, args: &StartArgs) -> ContainerSettings { - let StartArgs { + pub async fn from_args(self, args: &ContextArgs) -> ContainerSettings { + let ContextArgs { prefix, network_name, provisioner_host, image, + proxy_fqdn, .. } = args; self.prefix(prefix) .image(image) .provisioner_host(provisioner_host) .network_name(network_name) + .fqdn(proxy_fqdn) .build() .await } @@ -94,6 +96,11 @@ impl<'d> ContainerSettingsBuilder<'d> { self } + pub fn fqdn(mut self, fqdn: S) -> Self { + self.fqdn = Some(fqdn.to_string().trim_end_matches('.').to_string()); + self + } + /// Resolves the Docker network ID for the given network name. /// /// # Panics @@ -125,7 +132,7 @@ impl<'d> ContainerSettingsBuilder<'d> { let network_name = self.network_name.take().unwrap(); let network_id = self.resolve_network_id(&network_name).await; - let fqdn = self.fqdn; + let fqdn = self.fqdn.take().unwrap(); ContainerSettings { prefix, @@ -148,8 +155,8 @@ pub struct ContainerSettings { } impl ContainerSettings { - pub fn builder(docker: &Docker, fqdn: String) -> ContainerSettingsBuilder { - ContainerSettingsBuilder::new(docker, fqdn) + pub fn builder(docker: &Docker) -> ContainerSettingsBuilder { + ContainerSettingsBuilder::new(docker) } } @@ -181,12 +188,10 @@ impl GatewayService { /// /// * `args` - The [`Args`] with which the service was /// started. Will be passed as [`Context`] to workers and state. - pub async fn init(args: StartArgs, fqdn: String, db: SqlitePool) -> Self { + pub async fn init(args: ContextArgs, db: SqlitePool) -> Self { let docker = Docker::connect_with_unix(&args.docker_host, 60, API_DEFAULT_VERSION).unwrap(); - let container_settings = ContainerSettings::builder(&docker, fqdn) - .from_args(&args) - .await; + let container_settings = ContainerSettings::builder(&docker).from_args(&args).await; let provider = GatewayContextProvider::new(docker, container_settings); @@ -439,11 +444,33 @@ impl GatewayService { }) } - fn context(&self) -> GatewayContext { + pub fn context(&self) -> GatewayContext { self.provider.context() } } +#[async_trait] +impl<'c> Service<'c> for GatewayService { + type Context = GatewayContext<'c>; + + type State = Work; + + type Error = Error; + + fn context(&'c self) -> Self::Context { + GatewayService::context(self) + } + + async fn update( + &self, + Work { + project_name, work, .. + }: &Self::State, + ) -> Result<(), Self::Error> { + self.update_project(project_name, work).await + } +} + #[async_trait] impl<'c> Service<'c> for Arc { type Context = GatewayContext<'c>; @@ -492,7 +519,7 @@ pub mod tests { #[tokio::test] async fn service_create_find_user() -> anyhow::Result<()> { let world = World::new().await; - let svc = GatewayService::init(world.args(), world.fqdn(), world.pool()).await; + let svc = GatewayService::init(world.args(), world.pool()).await; let account_name: AccountName = "test_user_123".parse()?; @@ -543,7 +570,7 @@ pub mod tests { #[tokio::test] async fn service_create_find_delete_project() -> anyhow::Result<()> { let world = World::new().await; - let svc = Arc::new(GatewayService::init(world.args(), world.fqdn(), world.pool()).await); + let svc = Arc::new(GatewayService::init(world.args(), world.pool()).await); let neo: AccountName = "neo".parse().unwrap(); let matrix: ProjectName = "matrix".parse().unwrap(); diff --git a/gateway/src/worker.rs b/gateway/src/worker.rs index ee71dfd8a..d371bdb66 100644 --- a/gateway/src/worker.rs +++ b/gateway/src/worker.rs @@ -115,33 +115,45 @@ where let _ = self.send.take().unwrap(); debug!("starting worker"); - while let Some(mut work) = self.recv.recv().await { + while let Some(work) = self.recv.recv().await { debug!(?work, "received work"); - loop { - work = { - let context = self.service.context(); - - // Safety: EndState's transitions are Infallible - work.next(&context).await.unwrap() - }; - - match self.service.update(&work).await { - Ok(_) => {} - Err(err) => info!("failed to update a state: {}\nstate: {:?}", err, work), - }; - - if work.is_done() { - break; - } else { - debug!(?work, "work not done yet"); - } - } + do_work(work, &self.service).await; } Ok(self) } } +pub async fn do_work< + 'c, + E: std::fmt::Display, + S: Service<'c, State = W, Error = E>, + W: EndState<'c> + Debug, +>( + mut work: W, + service: &'c S, +) { + loop { + work = { + let context = service.context(); + + // Safety: EndState's transitions are Infallible + work.next(&context).await.unwrap() + }; + + match service.update(&work).await { + Ok(_) => {} + Err(err) => info!("failed to update a state: {}\nstate: {:?}", err, work), + }; + + if work.is_done() { + break; + } else { + debug!(?work, "work not done yet"); + } + } +} + #[cfg(test)] pub mod tests { use std::convert::Infallible; diff --git a/gateway/tests/hello_world.crate b/gateway/tests/hello_world.crate index d4f72b6be50d084966e3c273d72c05b33e353b61..038d4d03e2fe22bcf8b7b13dc48ffc2b2ad057f9 100644 GIT binary patch delta 895 zcmV-_1AzRc2c`#*G=D7HnTHMV(zFebEkKfCC=4T|<&(vk5)G1y;}!YuJ4#+X+bLS0 zS+*j&FMJX2h4eiSc}`IX*;+~^rY+wKJiqP5OwHuYZLDv2o=EQxE%Sq~5}%|OMGwwf z3HrguK8>g!biy9B2Tve{HcSB=JX87L0Jt-5+yU4w4Rp!^8h^P_5GCE?{4Z^l68gtUf?ae;?f%G`Sum4Q&e+tk2Jnt$3xT?=WIRXHPB*FMI`;>) z{2wIU!~cnezh`779?QpP@E?RxcNhOb*b8g?KY<*=_1m*6czt$$3e*mNyT15kczt#< zJU@R2Z%%(by?-2DpT2^h-@(c7^38>F=p4fDDdtctgk)2m&mdOJpavtsqzDRUTpP85 zGLK-%g#cDiIx)jzCd7&ixVcmr6Z}tfVUuo$%2ua2pj0lyrXse9+%Cn z#a_ABvjkSM0H*BDs{NXj>oQiDAh4zVWKw3z-Al!1Jg3Mv+bYARkOiNkSb>moZo^-} zloNj{%ndYb@L3V3kjcss-MMTcut`C{72-e4dDcaFNL&75nHw@iQ9Gjri|1^HV+W_) z&?&)>;D3gG7`RT(GPI*DDqf$Zoi7={brfnTXu4E%$)ezsF*RGqQ?dGZTfOV~EfssE z($;F77RCr{X;im7#vQf3^_n0v1-YiFk-Nl6tMcHEotmcq6aFt#?GgEZP4K&|Z@E73 zqh8=smUirX5cQ*P?ESa9xo<=^WbuXEu*WG6vVX(asldC-3Oh7FpFhAJ6CA-OsQ~V4 zGWeJAe^vcNkN5)o9RB^t-@|{WU*rEN->2{& z`Mq8IclzCKjsK^p|3(>$mAommtrzYLs=O+Qpkjd^9OrN}L(_2EZgcD;IdHn;?;1^L z{dff5y`;mVvJR-6`up#rw>F`Upv3bgXoT3o2wUkQ4E#C_~zwJd#&E(B(q;GhhNbe6V^MijRKFOfhdvM-L zFbqERX+-^?+Zj-M@B~t5!xX^5GnJ1HfIH*H9f9rAK&LFAk$;;EV%ASy4F;^!4TIxh zr#BoXaTMb5Fhu%^j-yv`=*PZGYWGLh%z~Mea>k~PHGp?4TL{!`C8If-cDhM5*SSBa z<^Le*9{x`({5>Nx@mM~-fd8P=>+j+}=nOhF{+~b&;rh+l75s8`ehSo%f4{!?b$oqx zGCn_l2d__mJAb_#U!VRAKfQyK@#X6a=g>KXw<+dOEQDk+&u0)RW>ABXU{VByGp>zV zL77LeB%Ig+5~(0#cbpbLBr_rv9&*8rRa|nD z0vUl@RGQ0NgG|dt5fR z7JKDh&k|V40+_NptM+SBuFF^v9G+=jn` zm?sG;%ndYb@L3V1kjcss-MK6j*rXuf3h{5|JnN!7q%D7u%ng~MsGZ4zMRPX8se>^$ zbV~38xPKkL6Sz*!GPI*DDqf$Zoi7={brfnTXu4E%$)e!ll$x#MsaSowt={+imWsSm zX=}Ak3u6SfG^$%3;hq|4B*;ubu4!uGE-`FX9^9!@)AWDB|7EH@BLA-mez)~4*9U%Y z5crg(T{|E2hP`j>{kOZhZ$vg^@s-@L$0-l8!++GNz`M%|J2XI_Kf)dp9KmO)0Pbrt z_?Pj2RsBSd_yYVA{{5c6hyU)d#{W~u1E^nvt;H4#w?^Bu!@pKhn;6|w`myW3&*8u4 z4|eh29rpV*{-2`$n`A6f@}|(XUbr);@~R+$iUq!RoWscsO~Y-w&8d^*!0C>^Yc!$t zBX@lFk`9l`I-qjuufLDp*n~QQGNWF&&b`%N-}*P}TYogl7|*8;)2loJGFiE*Z0@aH z-$$3#d!q6psQ2lCQFTV6u;3zYG`&m~xsA6>ZF)>7Sx|lVVp0Y^ZPJdciHmuoQfxZ) Uo1&IlYI%OV