git.proxmox.com Git - proxmox-backup.git/blob - src/bin/proxmox-backup-proxy.rs
proxmox-rest-server: pass owned RestEnvironment to get_index
[proxmox-backup.git] / src / bin / proxmox-backup-proxy.rs
1 use std::sync::{Mutex, Arc};
2 use std::path::{Path, PathBuf};
3 use std::os::unix::io::AsRawFd;
4 use std::future::Future;
5 use std::pin::Pin;
6
7 use anyhow::{bail, format_err, Error};
8 use futures::*;
9 use http::request::Parts;
10 use http::Response;
11 use hyper::{Body, StatusCode};
12 use hyper::header;
13 use url::form_urlencoded;
14
15 use openssl::ssl::{SslMethod, SslAcceptor, SslFiletype};
16 use tokio_stream::wrappers::ReceiverStream;
17 use serde_json::{json, Value};
18
19 use proxmox::try_block;
20 use proxmox::api::{RpcEnvironment, RpcEnvironmentType};
21 use proxmox::sys::linux::socket::set_tcp_keepalive;
22 use proxmox::tools::fs::CreateOptions;
23
24 use pbs_tools::task_log;
25 use pbs_datastore::DataStore;
26 use proxmox_rest_server::{
27 rotate_task_log_archive, extract_cookie , ApiConfig, RestServer, RestEnvironment, WorkerTask,
28 };
29
30 use proxmox_backup::{
31 server::{
32 auth::default_api_auth,
33 jobstate::{
34 self,
35 Job,
36 },
37 },
38 };
39
40 use pbs_buildcfg::configdir;
41 use proxmox_systemd::time::{compute_next_event, parse_calendar_event};
42 use pbs_tools::logrotate::LogRotate;
43
44 use pbs_api_types::{
45 Authid, TapeBackupJobConfig, VerificationJobConfig, SyncJobConfig, DataStoreConfig,
46 PruneOptions,
47 };
48
49 use proxmox_rest_server::daemon;
50
51 use proxmox_backup::server;
52 use proxmox_backup::auth_helpers::*;
53 use proxmox_backup::tools::{
54 PROXMOX_BACKUP_TCP_KEEPALIVE_TIME,
55 disks::{
56 DiskManage,
57 zfs_pool_stats,
58 get_pool_from_dataset,
59 },
60 };
61
62
63 use proxmox_backup::api2::pull::do_sync_job;
64 use proxmox_backup::api2::tape::backup::do_tape_backup_job;
65 use proxmox_backup::server::do_verification_job;
66 use proxmox_backup::server::do_prune_job;
67
68 fn main() -> Result<(), Error> {
69 proxmox_backup::tools::setup_safe_path_env();
70
71 let backup_uid = pbs_config::backup_user()?.uid;
72 let backup_gid = pbs_config::backup_group()?.gid;
73 let running_uid = nix::unistd::Uid::effective();
74 let running_gid = nix::unistd::Gid::effective();
75
76 if running_uid != backup_uid || running_gid != backup_gid {
77 bail!("proxy not running as backup user or group (got uid {} gid {})", running_uid, running_gid);
78 }
79
80 pbs_runtime::main(run())
81 }
82
83
84 fn extract_lang_header(headers: &http::HeaderMap) -> Option<String> {
85 if let Some(Ok(cookie)) = headers.get("COOKIE").map(|v| v.to_str()) {
86 return extract_cookie(cookie, "PBSLangCookie");
87 }
88 None
89 }
90
91 fn get_index<'a>(
92 env: RestEnvironment,
93 parts: Parts,
94 ) -> Pin<Box<dyn Future<Output = Response<Body>> + Send + 'a>> {
95 Box::pin(get_index_future(env, parts))
96 }
97
98 async fn get_index_future(
99 env: RestEnvironment,
100 parts: Parts,
101 ) -> Response<Body> {
102
103 let auth_id = env.get_auth_id();
104 let api = env.api_config();
105 let language = extract_lang_header(&parts.headers);
106
107 // fixme: make all IO async
108
109 let (userid, csrf_token) = match auth_id {
110 Some(auth_id) => {
111 let auth_id = auth_id.parse::<Authid>();
112 match auth_id {
113 Ok(auth_id) if !auth_id.is_token() => {
114 let userid = auth_id.user().clone();
115 let new_csrf_token = assemble_csrf_prevention_token(csrf_secret(), &userid);
116 (Some(userid), Some(new_csrf_token))
117 }
118 _ => (None, None)
119 }
120 }
121 None => (None, None),
122 };
123
124 let nodename = proxmox::tools::nodename();
125 let user = userid.as_ref().map(|u| u.as_str()).unwrap_or("");
126
127 let csrf_token = csrf_token.unwrap_or_else(|| String::from(""));
128
129 let mut debug = false;
130 let mut template_file = "index";
131
132 if let Some(query_str) = parts.uri.query() {
133 for (k, v) in form_urlencoded::parse(query_str.as_bytes()).into_owned() {
134 if k == "debug" && v != "0" && v != "false" {
135 debug = true;
136 } else if k == "console" {
137 template_file = "console";
138 }
139 }
140 }
141
142 let mut lang = String::from("");
143 if let Some(language) = language {
144 if Path::new(&format!("/usr/share/pbs-i18n/pbs-lang-{}.js", language)).exists() {
145 lang = language;
146 }
147 }
148
149 let data = json!({
150 "NodeName": nodename,
151 "UserName": user,
152 "CSRFPreventionToken": csrf_token,
153 "language": lang,
154 "debug": debug,
155 });
156
157 let (ct, index) = match api.render_template(template_file, &data) {
158 Ok(index) => ("text/html", index),
159 Err(err) => ("text/plain", format!("Error rendering template: {}", err)),
160 };
161
162 let mut resp = Response::builder()
163 .status(StatusCode::OK)
164 .header(header::CONTENT_TYPE, ct)
165 .body(index.into())
166 .unwrap();
167
168 if let Some(userid) = userid {
169 resp.extensions_mut().insert(Authid::from((userid, None)));
170 }
171
172 resp
173 }
174
175 async fn run() -> Result<(), Error> {
176 if let Err(err) = syslog::init(
177 syslog::Facility::LOG_DAEMON,
178 log::LevelFilter::Info,
179 Some("proxmox-backup-proxy")) {
180 bail!("unable to inititialize syslog - {}", err);
181 }
182
183 // Note: To debug early connection error use
184 // PROXMOX_DEBUG=1 ./target/release/proxmox-backup-proxy
185 let debug = std::env::var("PROXMOX_DEBUG").is_ok();
186
187 let _ = public_auth_key(); // load with lazy_static
188 let _ = csrf_secret(); // load with lazy_static
189
190 let mut config = ApiConfig::new(
191 pbs_buildcfg::JS_DIR,
192 &proxmox_backup::api2::ROUTER,
193 RpcEnvironmentType::PUBLIC,
194 default_api_auth(),
195 &get_index,
196 )?;
197
198 config.add_alias("novnc", "/usr/share/novnc-pve");
199 config.add_alias("extjs", "/usr/share/javascript/extjs");
200 config.add_alias("qrcodejs", "/usr/share/javascript/qrcodejs");
201 config.add_alias("fontawesome", "/usr/share/fonts-font-awesome");
202 config.add_alias("xtermjs", "/usr/share/pve-xtermjs");
203 config.add_alias("locale", "/usr/share/pbs-i18n");
204 config.add_alias("widgettoolkit", "/usr/share/javascript/proxmox-widget-toolkit");
205 config.add_alias("docs", "/usr/share/doc/proxmox-backup/html");
206
207 let mut indexpath = PathBuf::from(pbs_buildcfg::JS_DIR);
208 indexpath.push("index.hbs");
209 config.register_template("index", &indexpath)?;
210 config.register_template("console", "/usr/share/pve-xtermjs/index.html.hbs")?;
211
212 let backup_user = pbs_config::backup_user()?;
213 let mut commando_sock = proxmox_rest_server::CommandSocket::new(proxmox_rest_server::our_ctrl_sock(), backup_user.gid);
214
215 let dir_opts = CreateOptions::new().owner(backup_user.uid).group(backup_user.gid);
216 let file_opts = CreateOptions::new().owner(backup_user.uid).group(backup_user.gid);
217
218 config.enable_access_log(
219 pbs_buildcfg::API_ACCESS_LOG_FN,
220 Some(dir_opts.clone()),
221 Some(file_opts.clone()),
222 &mut commando_sock,
223 )?;
224
225 config.enable_auth_log(
226 pbs_buildcfg::API_AUTH_LOG_FN,
227 Some(dir_opts.clone()),
228 Some(file_opts.clone()),
229 &mut commando_sock,
230 )?;
231
232 let rest_server = RestServer::new(config);
233 proxmox_rest_server::init_worker_tasks(pbs_buildcfg::PROXMOX_BACKUP_LOG_DIR_M!().into(), file_opts.clone())?;
234
235 //openssl req -x509 -newkey rsa:4096 -keyout /etc/proxmox-backup/proxy.key -out /etc/proxmox-backup/proxy.pem -nodes
236
237 // we build the initial acceptor here as we cannot start if this fails
238 let acceptor = make_tls_acceptor()?;
239 let acceptor = Arc::new(Mutex::new(acceptor));
240
241 // to renew the acceptor we just add a command-socket handler
242 commando_sock.register_command(
243 "reload-certificate".to_string(),
244 {
245 let acceptor = Arc::clone(&acceptor);
246 move |_value| -> Result<_, Error> {
247 log::info!("reloading certificate");
248 match make_tls_acceptor() {
249 Err(err) => log::error!("error reloading certificate: {}", err),
250 Ok(new_acceptor) => {
251 let mut guard = acceptor.lock().unwrap();
252 *guard = new_acceptor;
253 }
254 }
255 Ok(Value::Null)
256 }
257 },
258 )?;
259
260 // to remove references for not configured datastores
261 commando_sock.register_command(
262 "datastore-removed".to_string(),
263 |_value| {
264 if let Err(err) = DataStore::remove_unused_datastores() {
265 log::error!("could not refresh datastores: {}", err);
266 }
267 Ok(Value::Null)
268 }
269 )?;
270
271 let server = daemon::create_daemon(
272 ([0,0,0,0,0,0,0,0], 8007).into(),
273 move |listener| {
274
275 let connections = accept_connections(listener, acceptor, debug);
276 let connections = hyper::server::accept::from_stream(ReceiverStream::new(connections));
277
278 Ok(async {
279 daemon::systemd_notify(daemon::SystemdNotify::Ready)?;
280
281 hyper::Server::builder(connections)
282 .serve(rest_server)
283 .with_graceful_shutdown(proxmox_rest_server::shutdown_future())
284 .map_err(Error::from)
285 .await
286 })
287 },
288 );
289
290 proxmox_rest_server::write_pid(pbs_buildcfg::PROXMOX_BACKUP_PROXY_PID_FN)?;
291
292 let init_result: Result<(), Error> = try_block!({
293 proxmox_rest_server::register_task_control_commands(&mut commando_sock)?;
294 commando_sock.spawn()?;
295 proxmox_rest_server::catch_shutdown_signal()?;
296 proxmox_rest_server::catch_reload_signal()?;
297 Ok(())
298 });
299
300 if let Err(err) = init_result {
301 bail!("unable to start daemon - {}", err);
302 }
303
304 start_task_scheduler();
305 start_stat_generator();
306
307 server.await?;
308 log::info!("server shutting down, waiting for active workers to complete");
309 proxmox_rest_server::last_worker_future().await?;
310 log::info!("done - exit server");
311
312 Ok(())
313 }
314
315 fn make_tls_acceptor() -> Result<SslAcceptor, Error> {
316 let key_path = configdir!("/proxy.key");
317 let cert_path = configdir!("/proxy.pem");
318
319 let mut acceptor = SslAcceptor::mozilla_intermediate_v5(SslMethod::tls()).unwrap();
320 acceptor.set_private_key_file(key_path, SslFiletype::PEM)
321 .map_err(|err| format_err!("unable to read proxy key {} - {}", key_path, err))?;
322 acceptor.set_certificate_chain_file(cert_path)
323 .map_err(|err| format_err!("unable to read proxy cert {} - {}", cert_path, err))?;
324 acceptor.check_private_key().unwrap();
325
326 Ok(acceptor.build())
327 }
328
329 type ClientStreamResult =
330 Result<std::pin::Pin<Box<tokio_openssl::SslStream<tokio::net::TcpStream>>>, Error>;
331 const MAX_PENDING_ACCEPTS: usize = 1024;
332
333 fn accept_connections(
334 listener: tokio::net::TcpListener,
335 acceptor: Arc<Mutex<openssl::ssl::SslAcceptor>>,
336 debug: bool,
337 ) -> tokio::sync::mpsc::Receiver<ClientStreamResult> {
338
339 let (sender, receiver) = tokio::sync::mpsc::channel(MAX_PENDING_ACCEPTS);
340
341 tokio::spawn(accept_connection(listener, acceptor, debug, sender));
342
343 receiver
344 }
345
346 async fn accept_connection(
347 listener: tokio::net::TcpListener,
348 acceptor: Arc<Mutex<openssl::ssl::SslAcceptor>>,
349 debug: bool,
350 sender: tokio::sync::mpsc::Sender<ClientStreamResult>,
351 ) {
352 let accept_counter = Arc::new(());
353
354 loop {
355 let (sock, _addr) = match listener.accept().await {
356 Ok(conn) => conn,
357 Err(err) => {
358 eprintln!("error accepting tcp connection: {}", err);
359 continue;
360 }
361 };
362
363 sock.set_nodelay(true).unwrap();
364 let _ = set_tcp_keepalive(sock.as_raw_fd(), PROXMOX_BACKUP_TCP_KEEPALIVE_TIME);
365
366 let ssl = { // limit acceptor_guard scope
367 // Acceptor can be reloaded using the command socket "reload-certificate" command
368 let acceptor_guard = acceptor.lock().unwrap();
369
370 match openssl::ssl::Ssl::new(acceptor_guard.context()) {
371 Ok(ssl) => ssl,
372 Err(err) => {
373 eprintln!("failed to create Ssl object from Acceptor context - {}", err);
374 continue;
375 },
376 }
377 };
378
379 let stream = match tokio_openssl::SslStream::new(ssl, sock) {
380 Ok(stream) => stream,
381 Err(err) => {
382 eprintln!("failed to create SslStream using ssl and connection socket - {}", err);
383 continue;
384 },
385 };
386
387 let mut stream = Box::pin(stream);
388 let sender = sender.clone();
389
390 if Arc::strong_count(&accept_counter) > MAX_PENDING_ACCEPTS {
391 eprintln!("connection rejected - to many open connections");
392 continue;
393 }
394
395 let accept_counter = Arc::clone(&accept_counter);
396 tokio::spawn(async move {
397 let accept_future = tokio::time::timeout(
398 Duration::new(10, 0), stream.as_mut().accept());
399
400 let result = accept_future.await;
401
402 match result {
403 Ok(Ok(())) => {
404 if sender.send(Ok(stream)).await.is_err() && debug {
405 eprintln!("detect closed connection channel");
406 }
407 }
408 Ok(Err(err)) => {
409 if debug {
410 eprintln!("https handshake failed - {}", err);
411 }
412 }
413 Err(_) => {
414 if debug {
415 eprintln!("https handshake timeout");
416 }
417 }
418 }
419
420 drop(accept_counter); // decrease reference count
421 });
422 }
423 }
424
425 fn start_stat_generator() {
426 let abort_future = proxmox_rest_server::shutdown_future();
427 let future = Box::pin(run_stat_generator());
428 let task = futures::future::select(future, abort_future);
429 tokio::spawn(task.map(|_| ()));
430 }
431
432 fn start_task_scheduler() {
433 let abort_future = proxmox_rest_server::shutdown_future();
434 let future = Box::pin(run_task_scheduler());
435 let task = futures::future::select(future, abort_future);
436 tokio::spawn(task.map(|_| ()));
437 }
438
439 use std::time::{SystemTime, Instant, Duration, UNIX_EPOCH};
440
441 fn next_minute() -> Result<Instant, Error> {
442 let now = SystemTime::now();
443 let epoch_now = now.duration_since(UNIX_EPOCH)?;
444 let epoch_next = Duration::from_secs((epoch_now.as_secs()/60 + 1)*60);
445 Ok(Instant::now() + epoch_next - epoch_now)
446 }
447
448 async fn run_task_scheduler() {
449
450 let mut count: usize = 0;
451
452 loop {
453 count += 1;
454
455 let delay_target = match next_minute() { // try to run very minute
456 Ok(d) => d,
457 Err(err) => {
458 eprintln!("task scheduler: compute next minute failed - {}", err);
459 tokio::time::sleep_until(tokio::time::Instant::from_std(Instant::now() + Duration::from_secs(60))).await;
460 continue;
461 }
462 };
463
464 if count > 2 { // wait 1..2 minutes before starting
465 match schedule_tasks().catch_unwind().await {
466 Err(panic) => {
467 match panic.downcast::<&str>() {
468 Ok(msg) => {
469 eprintln!("task scheduler panic: {}", msg);
470 }
471 Err(_) => {
472 eprintln!("task scheduler panic - unknown type");
473 }
474 }
475 }
476 Ok(Err(err)) => {
477 eprintln!("task scheduler failed - {:?}", err);
478 }
479 Ok(Ok(_)) => {}
480 }
481 }
482
483 tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await;
484 }
485 }
486
487 async fn schedule_tasks() -> Result<(), Error> {
488
489 schedule_datastore_garbage_collection().await;
490 schedule_datastore_prune().await;
491 schedule_datastore_sync_jobs().await;
492 schedule_datastore_verify_jobs().await;
493 schedule_tape_backup_jobs().await;
494 schedule_task_log_rotate().await;
495
496 Ok(())
497 }
498
499 async fn schedule_datastore_garbage_collection() {
500
501 let config = match pbs_config::datastore::config() {
502 Err(err) => {
503 eprintln!("unable to read datastore config - {}", err);
504 return;
505 }
506 Ok((config, _digest)) => config,
507 };
508
509 for (store, (_, store_config)) in config.sections {
510 let datastore = match DataStore::lookup_datastore(&store) {
511 Ok(datastore) => datastore,
512 Err(err) => {
513 eprintln!("lookup_datastore failed - {}", err);
514 continue;
515 }
516 };
517
518 let store_config: DataStoreConfig = match serde_json::from_value(store_config) {
519 Ok(c) => c,
520 Err(err) => {
521 eprintln!("datastore config from_value failed - {}", err);
522 continue;
523 }
524 };
525
526 let event_str = match store_config.gc_schedule {
527 Some(event_str) => event_str,
528 None => continue,
529 };
530
531 let event = match parse_calendar_event(&event_str) {
532 Ok(event) => event,
533 Err(err) => {
534 eprintln!("unable to parse schedule '{}' - {}", event_str, err);
535 continue;
536 }
537 };
538
539 if datastore.garbage_collection_running() { continue; }
540
541 let worker_type = "garbage_collection";
542
543 let last = match jobstate::last_run_time(worker_type, &store) {
544 Ok(time) => time,
545 Err(err) => {
546 eprintln!("could not get last run time of {} {}: {}", worker_type, store, err);
547 continue;
548 }
549 };
550
551 let next = match compute_next_event(&event, last, false) {
552 Ok(Some(next)) => next,
553 Ok(None) => continue,
554 Err(err) => {
555 eprintln!("compute_next_event for '{}' failed - {}", event_str, err);
556 continue;
557 }
558 };
559
560 let now = proxmox::tools::time::epoch_i64();
561
562 if next > now { continue; }
563
564 let job = match Job::new(worker_type, &store) {
565 Ok(job) => job,
566 Err(_) => continue, // could not get lock
567 };
568
569 let auth_id = Authid::root_auth_id();
570
571 if let Err(err) = crate::server::do_garbage_collection_job(job, datastore, auth_id, Some(event_str), false) {
572 eprintln!("unable to start garbage collection job on datastore {} - {}", store, err);
573 }
574 }
575 }
576
577 async fn schedule_datastore_prune() {
578
579 let config = match pbs_config::datastore::config() {
580 Err(err) => {
581 eprintln!("unable to read datastore config - {}", err);
582 return;
583 }
584 Ok((config, _digest)) => config,
585 };
586
587 for (store, (_, store_config)) in config.sections {
588
589 let store_config: DataStoreConfig = match serde_json::from_value(store_config) {
590 Ok(c) => c,
591 Err(err) => {
592 eprintln!("datastore '{}' config from_value failed - {}", store, err);
593 continue;
594 }
595 };
596
597 let event_str = match store_config.prune_schedule {
598 Some(event_str) => event_str,
599 None => continue,
600 };
601
602 let prune_options = PruneOptions {
603 keep_last: store_config.keep_last,
604 keep_hourly: store_config.keep_hourly,
605 keep_daily: store_config.keep_daily,
606 keep_weekly: store_config.keep_weekly,
607 keep_monthly: store_config.keep_monthly,
608 keep_yearly: store_config.keep_yearly,
609 };
610
611 if !pbs_datastore::prune::keeps_something(&prune_options) { // no prune settings - keep all
612 continue;
613 }
614
615 let worker_type = "prune";
616 if check_schedule(worker_type, &event_str, &store) {
617 let job = match Job::new(worker_type, &store) {
618 Ok(job) => job,
619 Err(_) => continue, // could not get lock
620 };
621
622 let auth_id = Authid::root_auth_id().clone();
623 if let Err(err) = do_prune_job(job, prune_options, store.clone(), &auth_id, Some(event_str)) {
624 eprintln!("unable to start datastore prune job {} - {}", &store, err);
625 }
626 };
627 }
628 }
629
630 async fn schedule_datastore_sync_jobs() {
631
632
633 let config = match pbs_config::sync::config() {
634 Err(err) => {
635 eprintln!("unable to read sync job config - {}", err);
636 return;
637 }
638 Ok((config, _digest)) => config,
639 };
640
641 for (job_id, (_, job_config)) in config.sections {
642 let job_config: SyncJobConfig = match serde_json::from_value(job_config) {
643 Ok(c) => c,
644 Err(err) => {
645 eprintln!("sync job config from_value failed - {}", err);
646 continue;
647 }
648 };
649
650 let event_str = match job_config.schedule {
651 Some(ref event_str) => event_str.clone(),
652 None => continue,
653 };
654
655 let worker_type = "syncjob";
656 if check_schedule(worker_type, &event_str, &job_id) {
657 let job = match Job::new(worker_type, &job_id) {
658 Ok(job) => job,
659 Err(_) => continue, // could not get lock
660 };
661
662 let auth_id = Authid::root_auth_id().clone();
663 if let Err(err) = do_sync_job(job, job_config, &auth_id, Some(event_str), false) {
664 eprintln!("unable to start datastore sync job {} - {}", &job_id, err);
665 }
666 };
667 }
668 }
669
670 async fn schedule_datastore_verify_jobs() {
671
672 let config = match pbs_config::verify::config() {
673 Err(err) => {
674 eprintln!("unable to read verification job config - {}", err);
675 return;
676 }
677 Ok((config, _digest)) => config,
678 };
679 for (job_id, (_, job_config)) in config.sections {
680 let job_config: VerificationJobConfig = match serde_json::from_value(job_config) {
681 Ok(c) => c,
682 Err(err) => {
683 eprintln!("verification job config from_value failed - {}", err);
684 continue;
685 }
686 };
687 let event_str = match job_config.schedule {
688 Some(ref event_str) => event_str.clone(),
689 None => continue,
690 };
691
692 let worker_type = "verificationjob";
693 let auth_id = Authid::root_auth_id().clone();
694 if check_schedule(worker_type, &event_str, &job_id) {
695 let job = match Job::new(&worker_type, &job_id) {
696 Ok(job) => job,
697 Err(_) => continue, // could not get lock
698 };
699 if let Err(err) = do_verification_job(job, job_config, &auth_id, Some(event_str), false) {
700 eprintln!("unable to start datastore verification job {} - {}", &job_id, err);
701 }
702 };
703 }
704 }
705
706 async fn schedule_tape_backup_jobs() {
707
708 let config = match pbs_config::tape_job::config() {
709 Err(err) => {
710 eprintln!("unable to read tape job config - {}", err);
711 return;
712 }
713 Ok((config, _digest)) => config,
714 };
715 for (job_id, (_, job_config)) in config.sections {
716 let job_config: TapeBackupJobConfig = match serde_json::from_value(job_config) {
717 Ok(c) => c,
718 Err(err) => {
719 eprintln!("tape backup job config from_value failed - {}", err);
720 continue;
721 }
722 };
723 let event_str = match job_config.schedule {
724 Some(ref event_str) => event_str.clone(),
725 None => continue,
726 };
727
728 let worker_type = "tape-backup-job";
729 let auth_id = Authid::root_auth_id().clone();
730 if check_schedule(worker_type, &event_str, &job_id) {
731 let job = match Job::new(&worker_type, &job_id) {
732 Ok(job) => job,
733 Err(_) => continue, // could not get lock
734 };
735 if let Err(err) = do_tape_backup_job(job, job_config.setup, &auth_id, Some(event_str), false) {
736 eprintln!("unable to start tape backup job {} - {}", &job_id, err);
737 }
738 };
739 }
740 }
741
742
743 async fn schedule_task_log_rotate() {
744
745 let worker_type = "logrotate";
746 let job_id = "access-log_and_task-archive";
747
748 // schedule daily at 00:00 like normal logrotate
749 let schedule = "00:00";
750
751 if !check_schedule(worker_type, schedule, job_id) {
752 // if we never ran the rotation, schedule instantly
753 match jobstate::JobState::load(worker_type, job_id) {
754 Ok(state) => match state {
755 jobstate::JobState::Created { .. } => {},
756 _ => return,
757 },
758 _ => return,
759 }
760 }
761
762 let mut job = match Job::new(worker_type, job_id) {
763 Ok(job) => job,
764 Err(_) => return, // could not get lock
765 };
766
767 if let Err(err) = WorkerTask::new_thread(
768 worker_type,
769 None,
770 Authid::root_auth_id().to_string(),
771 false,
772 move |worker| {
773 job.start(&worker.upid().to_string())?;
774 task_log!(worker, "starting task log rotation");
775
776 let result = try_block!({
777 let max_size = 512 * 1024 - 1; // an entry has ~ 100b, so > 5000 entries/file
778 let max_files = 20; // times twenty files gives > 100000 task entries
779 let has_rotated = rotate_task_log_archive(max_size, true, Some(max_files))?;
780 if has_rotated {
781 task_log!(worker, "task log archive was rotated");
782 } else {
783 task_log!(worker, "task log archive was not rotated");
784 }
785
786 let max_size = 32 * 1024 * 1024 - 1;
787 let max_files = 14;
788 let mut logrotate = LogRotate::new(pbs_buildcfg::API_ACCESS_LOG_FN, true)
789 .ok_or_else(|| format_err!("could not get API access log file names"))?;
790
791 if logrotate.rotate(max_size, None, Some(max_files))? {
792 println!("rotated access log, telling daemons to re-open log file");
793 pbs_runtime::block_on(command_reopen_access_logfiles())?;
794 task_log!(worker, "API access log was rotated");
795 } else {
796 task_log!(worker, "API access log was not rotated");
797 }
798
799 let mut logrotate = LogRotate::new(pbs_buildcfg::API_AUTH_LOG_FN, true)
800 .ok_or_else(|| format_err!("could not get API auth log file names"))?;
801
802 if logrotate.rotate(max_size, None, Some(max_files))? {
803 println!("rotated auth log, telling daemons to re-open log file");
804 pbs_runtime::block_on(command_reopen_auth_logfiles())?;
805 task_log!(worker, "API authentication log was rotated");
806 } else {
807 task_log!(worker, "API authentication log was not rotated");
808 }
809
810 Ok(())
811 });
812
813 let status = worker.create_state(&result);
814
815 if let Err(err) = job.finish(status) {
816 eprintln!("could not finish job state for {}: {}", worker_type, err);
817 }
818
819 result
820 },
821 ) {
822 eprintln!("unable to start task log rotation: {}", err);
823 }
824
825 }
826
827 async fn command_reopen_access_logfiles() -> Result<(), Error> {
828 // only care about the most recent daemon instance for each, proxy & api, as other older ones
829 // should not respond to new requests anyway, but only finish their current one and then exit.
830 let sock = proxmox_rest_server::our_ctrl_sock();
831 let f1 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n");
832
833 let pid = proxmox_rest_server::read_pid(pbs_buildcfg::PROXMOX_BACKUP_API_PID_FN)?;
834 let sock = proxmox_rest_server::ctrl_sock_from_pid(pid);
835 let f2 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-access-log-reopen\"}\n");
836
837 match futures::join!(f1, f2) {
838 (Err(e1), Err(e2)) => Err(format_err!("reopen commands failed, proxy: {}; api: {}", e1, e2)),
839 (Err(e1), Ok(_)) => Err(format_err!("reopen commands failed, proxy: {}", e1)),
840 (Ok(_), Err(e2)) => Err(format_err!("reopen commands failed, api: {}", e2)),
841 _ => Ok(()),
842 }
843 }
844
845 async fn command_reopen_auth_logfiles() -> Result<(), Error> {
846 // only care about the most recent daemon instance for each, proxy & api, as other older ones
847 // should not respond to new requests anyway, but only finish their current one and then exit.
848 let sock = proxmox_rest_server::our_ctrl_sock();
849 let f1 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-auth-log-reopen\"}\n");
850
851 let pid = proxmox_rest_server::read_pid(pbs_buildcfg::PROXMOX_BACKUP_API_PID_FN)?;
852 let sock = proxmox_rest_server::ctrl_sock_from_pid(pid);
853 let f2 = proxmox_rest_server::send_command(sock, "{\"command\":\"api-auth-log-reopen\"}\n");
854
855 match futures::join!(f1, f2) {
856 (Err(e1), Err(e2)) => Err(format_err!("reopen commands failed, proxy: {}; api: {}", e1, e2)),
857 (Err(e1), Ok(_)) => Err(format_err!("reopen commands failed, proxy: {}", e1)),
858 (Ok(_), Err(e2)) => Err(format_err!("reopen commands failed, api: {}", e2)),
859 _ => Ok(()),
860 }
861 }
862
863 async fn run_stat_generator() {
864
865 let mut count = 0;
866 loop {
867 count += 1;
868 let save = if count >= 6 { count = 0; true } else { false };
869
870 let delay_target = Instant::now() + Duration::from_secs(10);
871
872 generate_host_stats(save).await;
873
874 tokio::time::sleep_until(tokio::time::Instant::from_std(delay_target)).await;
875
876 }
877
878 }
879
880 fn rrd_update_gauge(name: &str, value: f64, save: bool) {
881 use proxmox_backup::rrd;
882 if let Err(err) = rrd::update_value(name, value, rrd::DST::Gauge, save) {
883 eprintln!("rrd::update_value '{}' failed - {}", name, err);
884 }
885 }
886
887 fn rrd_update_derive(name: &str, value: f64, save: bool) {
888 use proxmox_backup::rrd;
889 if let Err(err) = rrd::update_value(name, value, rrd::DST::Derive, save) {
890 eprintln!("rrd::update_value '{}' failed - {}", name, err);
891 }
892 }
893
894 async fn generate_host_stats(save: bool) {
895 use proxmox::sys::linux::procfs::{
896 read_meminfo, read_proc_stat, read_proc_net_dev, read_loadavg};
897
898 pbs_runtime::block_in_place(move || {
899
900 match read_proc_stat() {
901 Ok(stat) => {
902 rrd_update_gauge("host/cpu", stat.cpu, save);
903 rrd_update_gauge("host/iowait", stat.iowait_percent, save);
904 }
905 Err(err) => {
906 eprintln!("read_proc_stat failed - {}", err);
907 }
908 }
909
910 match read_meminfo() {
911 Ok(meminfo) => {
912 rrd_update_gauge("host/memtotal", meminfo.memtotal as f64, save);
913 rrd_update_gauge("host/memused", meminfo.memused as f64, save);
914 rrd_update_gauge("host/swaptotal", meminfo.swaptotal as f64, save);
915 rrd_update_gauge("host/swapused", meminfo.swapused as f64, save);
916 }
917 Err(err) => {
918 eprintln!("read_meminfo failed - {}", err);
919 }
920 }
921
922 match read_proc_net_dev() {
923 Ok(netdev) => {
924 use pbs_config::network::is_physical_nic;
925 let mut netin = 0;
926 let mut netout = 0;
927 for item in netdev {
928 if !is_physical_nic(&item.device) { continue; }
929 netin += item.receive;
930 netout += item.send;
931 }
932 rrd_update_derive("host/netin", netin as f64, save);
933 rrd_update_derive("host/netout", netout as f64, save);
934 }
935 Err(err) => {
936 eprintln!("read_prox_net_dev failed - {}", err);
937 }
938 }
939
940 match read_loadavg() {
941 Ok(loadavg) => {
942 rrd_update_gauge("host/loadavg", loadavg.0 as f64, save);
943 }
944 Err(err) => {
945 eprintln!("read_loadavg failed - {}", err);
946 }
947 }
948
949 let disk_manager = DiskManage::new();
950
951 gather_disk_stats(disk_manager.clone(), Path::new("/"), "host", save);
952
953 match pbs_config::datastore::config() {
954 Ok((config, _)) => {
955 let datastore_list: Vec<DataStoreConfig> =
956 config.convert_to_typed_array("datastore").unwrap_or_default();
957
958 for config in datastore_list {
959
960 let rrd_prefix = format!("datastore/{}", config.name);
961 let path = std::path::Path::new(&config.path);
962 gather_disk_stats(disk_manager.clone(), path, &rrd_prefix, save);
963 }
964 }
965 Err(err) => {
966 eprintln!("read datastore config failed - {}", err);
967 }
968 }
969
970 });
971 }
972
973 fn check_schedule(worker_type: &str, event_str: &str, id: &str) -> bool {
974 let event = match parse_calendar_event(event_str) {
975 Ok(event) => event,
976 Err(err) => {
977 eprintln!("unable to parse schedule '{}' - {}", event_str, err);
978 return false;
979 }
980 };
981
982 let last = match jobstate::last_run_time(worker_type, &id) {
983 Ok(time) => time,
984 Err(err) => {
985 eprintln!("could not get last run time of {} {}: {}", worker_type, id, err);
986 return false;
987 }
988 };
989
990 let next = match compute_next_event(&event, last, false) {
991 Ok(Some(next)) => next,
992 Ok(None) => return false,
993 Err(err) => {
994 eprintln!("compute_next_event for '{}' failed - {}", event_str, err);
995 return false;
996 }
997 };
998
999 let now = proxmox::tools::time::epoch_i64();
1000 next <= now
1001 }
1002
1003 fn gather_disk_stats(disk_manager: Arc<DiskManage>, path: &Path, rrd_prefix: &str, save: bool) {
1004
1005 match proxmox_backup::tools::disks::disk_usage(path) {
1006 Ok(status) => {
1007 let rrd_key = format!("{}/total", rrd_prefix);
1008 rrd_update_gauge(&rrd_key, status.total as f64, save);
1009 let rrd_key = format!("{}/used", rrd_prefix);
1010 rrd_update_gauge(&rrd_key, status.used as f64, save);
1011 }
1012 Err(err) => {
1013 eprintln!("read disk_usage on {:?} failed - {}", path, err);
1014 }
1015 }
1016
1017 match disk_manager.find_mounted_device(path) {
1018 Ok(None) => {},
1019 Ok(Some((fs_type, device, source))) => {
1020 let mut device_stat = None;
1021 match fs_type.as_str() {
1022 "zfs" => {
1023 if let Some(source) = source {
1024 let pool = get_pool_from_dataset(&source).unwrap_or(&source);
1025 match zfs_pool_stats(pool) {
1026 Ok(stat) => device_stat = stat,
1027 Err(err) => eprintln!("zfs_pool_stats({:?}) failed - {}", pool, err),
1028 }
1029 }
1030 }
1031 _ => {
1032 if let Ok(disk) = disk_manager.clone().disk_by_dev_num(device.into_dev_t()) {
1033 match disk.read_stat() {
1034 Ok(stat) => device_stat = stat,
1035 Err(err) => eprintln!("disk.read_stat {:?} failed - {}", path, err),
1036 }
1037 }
1038 }
1039 }
1040 if let Some(stat) = device_stat {
1041 let rrd_key = format!("{}/read_ios", rrd_prefix);
1042 rrd_update_derive(&rrd_key, stat.read_ios as f64, save);
1043 let rrd_key = format!("{}/read_bytes", rrd_prefix);
1044 rrd_update_derive(&rrd_key, (stat.read_sectors*512) as f64, save);
1045
1046 let rrd_key = format!("{}/write_ios", rrd_prefix);
1047 rrd_update_derive(&rrd_key, stat.write_ios as f64, save);
1048 let rrd_key = format!("{}/write_bytes", rrd_prefix);
1049 rrd_update_derive(&rrd_key, (stat.write_sectors*512) as f64, save);
1050
1051 let rrd_key = format!("{}/io_ticks", rrd_prefix);
1052 rrd_update_derive(&rrd_key, (stat.io_ticks as f64)/1000.0, save);
1053 }
1054 }
1055 Err(err) => {
1056 eprintln!("find_mounted_device failed - {}", err);
1057 }
1058 }
1059 }