main.rs

  1use anyhow::anyhow;
  2use axum::headers::HeaderMapExt;
  3use axum::{
  4    Extension, Router,
  5    extract::MatchedPath,
  6    http::{Request, Response},
  7    routing::get,
  8};
  9
 10use collab::api::CloudflareIpCountryHeader;
 11use collab::api::billing::sync_llm_usage_with_stripe_periodically;
 12use collab::llm::db::LlmDatabase;
 13use collab::migrations::run_database_migrations;
 14use collab::user_backfiller::spawn_user_backfiller;
 15use collab::{
 16    AppState, Config, RateLimiter, Result, api::fetch_extensions_from_blob_store_periodically, db,
 17    env, executor::Executor, rpc::ResultExt,
 18};
 19use collab::{ServiceMode, api::billing::poll_stripe_events_periodically};
 20use db::Database;
 21use std::{
 22    env::args,
 23    net::{SocketAddr, TcpListener},
 24    path::Path,
 25    sync::Arc,
 26    time::Duration,
 27};
 28#[cfg(unix)]
 29use tokio::signal::unix::SignalKind;
 30use tower_http::trace::TraceLayer;
 31use tracing_subscriber::{
 32    Layer, filter::EnvFilter, fmt::format::JsonFields, util::SubscriberInitExt,
 33};
 34use util::{ResultExt as _, maybe};
 35
/// Crate version, read from `CARGO_PKG_VERSION` at compile time.
const VERSION: &str = env!("CARGO_PKG_VERSION");
/// Value of the `GITHUB_SHA` environment variable at compile time, or `None` if it was not set.
const REVISION: Option<&'static str> = option_env!("GITHUB_SHA");
 38
 39#[tokio::main]
 40async fn main() -> Result<()> {
 41    if let Err(error) = env::load_dotenv() {
 42        eprintln!(
 43            "error loading .env.toml (this is expected in production): {}",
 44            error
 45        );
 46    }
 47
 48    let mut args = args().skip(1);
 49    match args.next().as_deref() {
 50        Some("version") => {
 51            println!("collab v{} ({})", VERSION, REVISION.unwrap_or("unknown"));
 52        }
 53        Some("migrate") => {
 54            let config = envy::from_env::<Config>().expect("error loading config");
 55            setup_app_database(&config).await?;
 56        }
 57        Some("seed") => {
 58            let config = envy::from_env::<Config>().expect("error loading config");
 59            let db_options = db::ConnectOptions::new(config.database_url.clone());
 60
 61            let mut db = Database::new(db_options, Executor::Production).await?;
 62            db.initialize_notification_kinds().await?;
 63
 64            collab::seed::seed(&config, &db, false).await?;
 65
 66            if let Some(llm_database_url) = config.llm_database_url.clone() {
 67                let db_options = db::ConnectOptions::new(llm_database_url);
 68                let mut db = LlmDatabase::new(db_options.clone(), Executor::Production).await?;
 69                db.initialize().await?;
 70                collab::llm::db::seed_database(&config, &mut db, true).await?;
 71            }
 72        }
 73        Some("serve") => {
 74            let mode = match args.next().as_deref() {
 75                Some("collab") => ServiceMode::Collab,
 76                Some("api") => ServiceMode::Api,
 77                Some("all") => ServiceMode::All,
 78                _ => {
 79                    return Err(anyhow!(
 80                        "usage: collab <version | migrate | seed | serve <api|collab|all>>"
 81                    ))?;
 82                }
 83            };
 84
 85            let config = envy::from_env::<Config>().expect("error loading config");
 86            init_tracing(&config);
 87            init_panic_hook();
 88
 89            let mut app = Router::new()
 90                .route("/", get(handle_root))
 91                .route("/healthz", get(handle_liveness_probe))
 92                .layer(Extension(mode));
 93
 94            let listener = TcpListener::bind(format!("0.0.0.0:{}", config.http_port))
 95                .expect("failed to bind TCP listener");
 96
 97            let mut on_shutdown = None;
 98
 99            if mode.is_collab() || mode.is_api() {
100                setup_app_database(&config).await?;
101                setup_llm_database(&config).await?;
102
103                let state = AppState::new(config, Executor::Production).await?;
104
105                if let Some(stripe_billing) = state.stripe_billing.clone() {
106                    let executor = state.executor.clone();
107                    executor.spawn_detached(async move {
108                        stripe_billing.initialize().await.trace_err();
109                    });
110                }
111
112                if mode.is_collab() {
113                    state.db.purge_old_embeddings().await.trace_err();
114                    RateLimiter::save_periodically(
115                        state.rate_limiter.clone(),
116                        state.executor.clone(),
117                    );
118
119                    let epoch = state
120                        .db
121                        .create_server(&state.config.zed_environment)
122                        .await?;
123                    let rpc_server = collab::rpc::Server::new(epoch, state.clone());
124                    rpc_server.start().await?;
125
126                    poll_stripe_events_periodically(state.clone(), rpc_server.clone());
127
128                    app = app
129                        .merge(collab::api::routes(rpc_server.clone()))
130                        .merge(collab::rpc::routes(rpc_server.clone()));
131
132                    on_shutdown = Some(Box::new(move || rpc_server.teardown()));
133                }
134
135                if mode.is_api() {
136                    fetch_extensions_from_blob_store_periodically(state.clone());
137                    spawn_user_backfiller(state.clone());
138
139                    let llm_db = maybe!(async {
140                        let database_url = state
141                            .config
142                            .llm_database_url
143                            .as_ref()
144                            .ok_or_else(|| anyhow!("missing LLM_DATABASE_URL"))?;
145                        let max_connections = state
146                            .config
147                            .llm_database_max_connections
148                            .ok_or_else(|| anyhow!("missing LLM_DATABASE_MAX_CONNECTIONS"))?;
149
150                        let mut db_options = db::ConnectOptions::new(database_url);
151                        db_options.max_connections(max_connections);
152                        LlmDatabase::new(db_options, state.executor.clone()).await
153                    })
154                    .await
155                    .trace_err();
156
157                    if let Some(mut llm_db) = llm_db {
158                        llm_db.initialize().await?;
159                        sync_llm_usage_with_stripe_periodically(state.clone());
160                    }
161
162                    app = app
163                        .merge(collab::api::events::router())
164                        .merge(collab::api::extensions::router())
165                }
166
167                app = app.layer(Extension(state.clone()));
168            }
169
170            app = app.layer(
171                TraceLayer::new_for_http()
172                    .make_span_with(|request: &Request<_>| {
173                        let matched_path = request
174                            .extensions()
175                            .get::<MatchedPath>()
176                            .map(MatchedPath::as_str);
177
178                        let geoip_country_code = request
179                            .headers()
180                            .typed_get::<CloudflareIpCountryHeader>()
181                            .map(|header| header.to_string());
182
183                        tracing::info_span!(
184                            "http_request",
185                            method = ?request.method(),
186                            matched_path,
187                            geoip_country_code,
188                            user_id = tracing::field::Empty,
189                            login = tracing::field::Empty,
190                            authn.jti = tracing::field::Empty,
191                            is_staff = tracing::field::Empty
192                        )
193                    })
194                    .on_response(
195                        |response: &Response<_>, latency: Duration, _: &tracing::Span| {
196                            let duration_ms = latency.as_micros() as f64 / 1000.;
197                            tracing::info!(
198                                duration_ms,
199                                status = response.status().as_u16(),
200                                "finished processing request"
201                            );
202                        },
203                    ),
204            );
205
206            #[cfg(unix)]
207            let signal = async move {
208                let mut sigterm = tokio::signal::unix::signal(SignalKind::terminate())
209                    .expect("failed to listen for interrupt signal");
210                let mut sigint = tokio::signal::unix::signal(SignalKind::interrupt())
211                    .expect("failed to listen for interrupt signal");
212                let sigterm = sigterm.recv();
213                let sigint = sigint.recv();
214                futures::pin_mut!(sigterm, sigint);
215                futures::future::select(sigterm, sigint).await;
216            };
217
218            #[cfg(windows)]
219            let signal = async move {
220                // todo(windows):
221                // `ctrl_close` does not work well, because tokio's signal handler always returns soon,
222                // but system terminates the application soon after returning CTRL+CLOSE handler.
223                // So we should implement blocking handler to treat CTRL+CLOSE signal.
224                let mut ctrl_break = tokio::signal::windows::ctrl_break()
225                    .expect("failed to listen for interrupt signal");
226                let mut ctrl_c = tokio::signal::windows::ctrl_c()
227                    .expect("failed to listen for interrupt signal");
228                let ctrl_break = ctrl_break.recv();
229                let ctrl_c = ctrl_c.recv();
230                futures::pin_mut!(ctrl_break, ctrl_c);
231                futures::future::select(ctrl_break, ctrl_c).await;
232            };
233
234            axum::Server::from_tcp(listener)
235                .map_err(|e| anyhow!(e))?
236                .serve(app.into_make_service_with_connect_info::<SocketAddr>())
237                .with_graceful_shutdown(async move {
238                    signal.await;
239                    tracing::info!("Received interrupt signal");
240
241                    if let Some(on_shutdown) = on_shutdown {
242                        on_shutdown();
243                    }
244                })
245                .await
246                .map_err(|e| anyhow!(e))?;
247        }
248        _ => {
249            Err(anyhow!(
250                "usage: collab <version | migrate | seed | serve <api|collab|llm|all>>"
251            ))?;
252        }
253    }
254    Ok(())
255}
256
257async fn setup_app_database(config: &Config) -> Result<()> {
258    let db_options = db::ConnectOptions::new(config.database_url.clone());
259    let mut db = Database::new(db_options, Executor::Production).await?;
260
261    let migrations_path = config.migrations_path.as_deref().unwrap_or_else(|| {
262        #[cfg(feature = "sqlite")]
263        let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations.sqlite");
264        #[cfg(not(feature = "sqlite"))]
265        let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations");
266
267        Path::new(default_migrations)
268    });
269
270    let migrations = run_database_migrations(db.options(), migrations_path).await?;
271    for (migration, duration) in migrations {
272        log::info!(
273            "Migrated {} {} {:?}",
274            migration.version,
275            migration.description,
276            duration
277        );
278    }
279
280    db.initialize_notification_kinds().await?;
281
282    if config.seed_path.is_some() {
283        collab::seed::seed(config, &db, false).await?;
284    }
285
286    Ok(())
287}
288
289async fn setup_llm_database(config: &Config) -> Result<()> {
290    let database_url = config
291        .llm_database_url
292        .as_ref()
293        .ok_or_else(|| anyhow!("missing LLM_DATABASE_URL"))?;
294
295    let db_options = db::ConnectOptions::new(database_url.clone());
296    let db = LlmDatabase::new(db_options, Executor::Production).await?;
297
298    let migrations_path = config
299        .llm_database_migrations_path
300        .as_deref()
301        .unwrap_or_else(|| {
302            #[cfg(feature = "sqlite")]
303            let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations_llm.sqlite");
304            #[cfg(not(feature = "sqlite"))]
305            let default_migrations = concat!(env!("CARGO_MANIFEST_DIR"), "/migrations_llm");
306
307            Path::new(default_migrations)
308        });
309
310    let migrations = run_database_migrations(db.options(), migrations_path).await?;
311    for (migration, duration) in migrations {
312        log::info!(
313            "Migrated {} {} {:?}",
314            migration.version,
315            migration.description,
316            duration
317        );
318    }
319
320    Ok(())
321}
322
323async fn handle_root(Extension(mode): Extension<ServiceMode>) -> String {
324    format!("zed:{mode} v{VERSION} ({})", REVISION.unwrap_or("unknown"))
325}
326
327async fn handle_liveness_probe(app_state: Option<Extension<Arc<AppState>>>) -> Result<String> {
328    if let Some(state) = app_state {
329        state.db.get_all_users(0, 1).await?;
330    }
331
332    Ok("ok".to_string())
333}
334
335pub fn init_tracing(config: &Config) -> Option<()> {
336    use std::str::FromStr;
337    use tracing_subscriber::layer::SubscriberExt;
338
339    let filter = EnvFilter::from_str(config.rust_log.as_deref()?).log_err()?;
340
341    tracing_subscriber::registry()
342        .with(if config.log_json.unwrap_or(false) {
343            Box::new(
344                tracing_subscriber::fmt::layer()
345                    .fmt_fields(JsonFields::default())
346                    .event_format(
347                        tracing_subscriber::fmt::format()
348                            .json()
349                            .flatten_event(true)
350                            .with_span_list(false),
351                    )
352                    .with_filter(filter),
353            ) as Box<dyn Layer<_> + Send + Sync>
354        } else {
355            Box::new(
356                tracing_subscriber::fmt::layer()
357                    .event_format(tracing_subscriber::fmt::format().pretty())
358                    .with_filter(filter),
359            )
360        })
361        .init();
362
363    None
364}
365
366fn init_panic_hook() {
367    std::panic::set_hook(Box::new(move |panic_info| {
368        let panic_message = match panic_info.payload().downcast_ref::<&'static str>() {
369            Some(message) => *message,
370            None => match panic_info.payload().downcast_ref::<String>() {
371                Some(message) => message.as_str(),
372                None => "Box<Any>",
373            },
374        };
375        let backtrace = std::backtrace::Backtrace::force_capture();
376        let location = panic_info
377            .location()
378            .map(|loc| format!("{}:{}", loc.file(), loc.line()));
379        tracing::error!(panic = true, ?location, %panic_message, %backtrace, "Server Panic");
380    }));
381}