main.rs

  1use anyhow::{Context as _, anyhow};
  2use axum::headers::HeaderMapExt;
  3use axum::{
  4    Extension, Router,
  5    extract::MatchedPath,
  6    http::{Request, Response},
  7    routing::get,
  8};
  9
 10use collab::api::CloudflareIpCountryHeader;
 11use collab::llm::db::LlmDatabase;
 12use collab::migrations::run_database_migrations;
 13use collab::user_backfiller::spawn_user_backfiller;
 14use collab::{
 15    AppState, Config, Result, api::fetch_extensions_from_blob_store_periodically, db, env,
 16    executor::Executor, rpc::ResultExt,
 17};
 18use collab::{ServiceMode, api::billing::poll_stripe_events_periodically};
 19use db::Database;
 20use std::{
 21    env::args,
 22    net::{SocketAddr, TcpListener},
 23    path::Path,
 24    sync::Arc,
 25    time::Duration,
 26};
 27#[cfg(unix)]
 28use tokio::signal::unix::SignalKind;
 29use tower_http::trace::TraceLayer;
 30use tracing_subscriber::{
 31    Layer, filter::EnvFilter, fmt::format::JsonFields, util::SubscriberInitExt,
 32};
 33use util::ResultExt as _;
 34
 35const VERSION: &str = env!("CARGO_PKG_VERSION");
 36const REVISION: Option<&'static str> = option_env!("GITHUB_SHA");
 37
 38#[expect(clippy::result_large_err)]
 39#[tokio::main]
 40async fn main() -> Result<()> {
 41    if let Err(error) = env::load_dotenv() {
 42        eprintln!(
 43            "error loading .env.toml (this is expected in production): {}",
 44            error
 45        );
 46    }
 47
 48    let mut args = args().skip(1);
 49    match args.next().as_deref() {
 50        Some("version") => {
 51            println!("collab v{} ({})", VERSION, REVISION.unwrap_or("unknown"));
 52        }
 53        Some("migrate") => {
 54            let config = envy::from_env::<Config>().expect("error loading config");
 55            setup_app_database(&config).await?;
 56        }
 57        Some("seed") => {
 58            let config = envy::from_env::<Config>().expect("error loading config");
 59            let db_options = db::ConnectOptions::new(config.database_url.clone());
 60
 61            let mut db = Database::new(db_options).await?;
 62            db.initialize_notification_kinds().await?;
 63
 64            collab::seed::seed(&config, &db, false).await?;
 65
 66            if let Some(llm_database_url) = config.llm_database_url.clone() {
 67                let db_options = db::ConnectOptions::new(llm_database_url);
 68                let mut db = LlmDatabase::new(db_options.clone(), Executor::Production).await?;
 69                db.initialize().await?;
 70                collab::llm::db::seed_database(&config, &mut db, true).await?;
 71            }
 72        }
 73        Some("serve") => {
 74            let mode = match args.next().as_deref() {
 75                Some("collab") => ServiceMode::Collab,
 76                Some("api") => ServiceMode::Api,
 77                Some("all") => ServiceMode::All,
 78                _ => {
 79                    return Err(anyhow!(
 80                        "usage: collab <version | migrate | seed | serve <api|collab|all>>"
 81                    ))?;
 82                }
 83            };
 84
 85            let config = envy::from_env::<Config>().expect("error loading config");
 86            init_tracing(&config);
 87            init_panic_hook();
 88
 89            let mut app = Router::new()
 90                .route("/", get(handle_root))
 91                .route("/healthz", get(handle_liveness_probe))
 92                .layer(Extension(mode));
 93
 94            let listener = TcpListener::bind(format!("0.0.0.0:{}", config.http_port))
 95                .expect("failed to bind TCP listener");
 96
 97            let mut on_shutdown = None;
 98
 99            if mode.is_collab() || mode.is_api() {
100                setup_app_database(&config).await?;
101                setup_llm_database(&config).await?;
102
103                let state = AppState::new(config, Executor::Production).await?;
104
105                if let Some(stripe_billing) = state.stripe_billing.clone() {
106                    let executor = state.executor.clone();
107                    executor.spawn_detached(async move {
108                        stripe_billing.initialize().await.trace_err();
109                    });
110                }
111
112                if mode.is_collab() {
113                    state.db.purge_old_embeddings().await.trace_err();
114
115                    let epoch = state
116                        .db
117                        .create_server(&state.config.zed_environment)
118                        .await?;
119                    let rpc_server = collab::rpc::Server::new(epoch, state.clone());
120                    rpc_server.start().await?;
121
122                    poll_stripe_events_periodically(state.clone(), rpc_server.clone());
123
124                    app = app
125                        .merge(collab::api::routes(rpc_server.clone()))
126                        .merge(collab::rpc::routes(rpc_server.clone()));
127
128                    on_shutdown = Some(Box::new(move || rpc_server.teardown()));
129                }
130
131                if mode.is_api() {
132                    fetch_extensions_from_blob_store_periodically(state.clone());
133                    spawn_user_backfiller(state.clone());
134
135                    app = app
136                        .merge(collab::api::events::router())
137                        .merge(collab::api::extensions::router())
138                }
139
140                app = app.layer(Extension(state.clone()));
141            }
142
143            app = app.layer(
144                TraceLayer::new_for_http()
145                    .make_span_with(|request: &Request<_>| {
146                        let matched_path = request
147                            .extensions()
148                            .get::<MatchedPath>()
149                            .map(MatchedPath::as_str);
150
151                        let geoip_country_code = request
152                            .headers()
153                            .typed_get::<CloudflareIpCountryHeader>()
154                            .map(|header| header.to_string());
155
156                        tracing::info_span!(
157                            "http_request",
158                            method = ?request.method(),
159                            matched_path,
160                            geoip_country_code,
161                            user_id = tracing::field::Empty,
162                            login = tracing::field::Empty,
163                            authn.jti = tracing::field::Empty,
164                            is_staff = tracing::field::Empty
165                        )
166                    })
167                    .on_response(
168                        |response: &Response<_>, latency: Duration, _: &tracing::Span| {
169                            let duration_ms = latency.as_micros() as f64 / 1000.;
170                            tracing::info!(
171                                duration_ms,
172                                status = response.status().as_u16(),
173                                "finished processing request"
174                            );
175                        },
176                    ),
177            );
178
179            #[cfg(unix)]
180            let signal = async move {
181                let mut sigterm = tokio::signal::unix::signal(SignalKind::terminate())
182                    .expect("failed to listen for interrupt signal");
183                let mut sigint = tokio::signal::unix::signal(SignalKind::interrupt())
184                    .expect("failed to listen for interrupt signal");
185                let sigterm = sigterm.recv();
186                let sigint = sigint.recv();
187                futures::pin_mut!(sigterm, sigint);
188                futures::future::select(sigterm, sigint).await;
189            };
190
191            #[cfg(windows)]
192            let signal = async move {
193                // todo(windows):
194                // `ctrl_close` does not work well, because tokio's signal handler always returns soon,
195                // but system terminates the application soon after returning CTRL+CLOSE handler.
196                // So we should implement blocking handler to treat CTRL+CLOSE signal.
197                let mut ctrl_break = tokio::signal::windows::ctrl_break()
198                    .expect("failed to listen for interrupt signal");
199                let mut ctrl_c = tokio::signal::windows::ctrl_c()
200                    .expect("failed to listen for interrupt signal");
201                let ctrl_break = ctrl_break.recv();
202                let ctrl_c = ctrl_c.recv();
203                futures::pin_mut!(ctrl_break, ctrl_c);
204                futures::future::select(ctrl_break, ctrl_c).await;
205            };
206
207            axum::Server::from_tcp(listener)
208                .map_err(|e| anyhow!(e))?
209                .serve(app.into_make_service_with_connect_info::<SocketAddr>())
210                .with_graceful_shutdown(async move {
211                    signal.await;
212                    tracing::info!("Received interrupt signal");
213
214                    if let Some(on_shutdown) = on_shutdown {
215                        on_shutdown();
216                    }
217                })
218                .await
219                .map_err(|e| anyhow!(e))?;
220        }
221        _ => {
222            Err(anyhow!(
223                "usage: collab <version | migrate | seed | serve <api|collab|llm|all>>"
224            ))?;
225        }
226    }
227    Ok(())
228}
229
230async fn setup_app_database(config: &Config) -> Result<()> {
231    let db_options = db::ConnectOptions::new(config.database_url.clone());
232    let mut db = Database::new(db_options).await?;
233
234    let migrations_path = config.migrations_path.as_deref().unwrap_or_else(|| {
235        #[cfg(feature = "sqlite")]
236        let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations.sqlite");
237        #[cfg(not(feature = "sqlite"))]
238        let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations");
239
240        Path::new(default_migrations)
241    });
242
243    let migrations = run_database_migrations(db.options(), migrations_path).await?;
244    for (migration, duration) in migrations {
245        log::info!(
246            "Migrated {} {} {:?}",
247            migration.version,
248            migration.description,
249            duration
250        );
251    }
252
253    db.initialize_notification_kinds().await?;
254
255    if config.seed_path.is_some() {
256        collab::seed::seed(config, &db, false).await?;
257    }
258
259    Ok(())
260}
261
262async fn setup_llm_database(config: &Config) -> Result<()> {
263    let database_url = config
264        .llm_database_url
265        .as_ref()
266        .context("missing LLM_DATABASE_URL")?;
267
268    let db_options = db::ConnectOptions::new(database_url.clone());
269    let db = LlmDatabase::new(db_options, Executor::Production).await?;
270
271    let migrations_path = config
272        .llm_database_migrations_path
273        .as_deref()
274        .unwrap_or_else(|| {
275            #[cfg(feature = "sqlite")]
276            let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations_llm.sqlite");
277            #[cfg(not(feature = "sqlite"))]
278            let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations_llm");
279
280            Path::new(default_migrations)
281        });
282
283    let migrations = run_database_migrations(db.options(), migrations_path).await?;
284    for (migration, duration) in migrations {
285        log::info!(
286            "Migrated {} {} {:?}",
287            migration.version,
288            migration.description,
289            duration
290        );
291    }
292
293    Ok(())
294}
295
296async fn handle_root(Extension(mode): Extension<ServiceMode>) -> String {
297    format!("zed:{mode} v{VERSION} ({})", REVISION.unwrap_or("unknown"))
298}
299
300async fn handle_liveness_probe(app_state: Option<Extension<Arc<AppState>>>) -> Result<String> {
301    if let Some(state) = app_state {
302        state.db.get_all_users(0, 1).await?;
303    }
304
305    Ok("ok".to_string())
306}
307
308pub fn init_tracing(config: &Config) -> Option<()> {
309    use std::str::FromStr;
310    use tracing_subscriber::layer::SubscriberExt;
311
312    let filter = EnvFilter::from_str(config.rust_log.as_deref()?).log_err()?;
313
314    tracing_subscriber::registry()
315        .with(if config.log_json.unwrap_or(false) {
316            Box::new(
317                tracing_subscriber::fmt::layer()
318                    .fmt_fields(JsonFields::default())
319                    .event_format(
320                        tracing_subscriber::fmt::format()
321                            .json()
322                            .flatten_event(true)
323                            .with_span_list(false),
324                    )
325                    .with_filter(filter),
326            ) as Box<dyn Layer<_> + Send + Sync>
327        } else {
328            Box::new(
329                tracing_subscriber::fmt::layer()
330                    .event_format(tracing_subscriber::fmt::format().pretty())
331                    .with_filter(filter),
332            )
333        })
334        .init();
335
336    None
337}
338
339fn init_panic_hook() {
340    std::panic::set_hook(Box::new(move |panic_info| {
341        let panic_message = match panic_info.payload().downcast_ref::<&'static str>() {
342            Some(message) => *message,
343            None => match panic_info.payload().downcast_ref::<String>() {
344                Some(message) => message.as_str(),
345                None => "Box<Any>",
346            },
347        };
348        let backtrace = std::backtrace::Backtrace::force_capture();
349        let location = panic_info
350            .location()
351            .map(|loc| format!("{}:{}", loc.file(), loc.line()));
352        tracing::error!(panic = true, ?location, %panic_message, %backtrace, "Server Panic");
353    }));
354}