bootc-dev · cgwalters · Jul 28, 2025 · Jul 10, 2025 · Jul 24, 2025 · cgwalters
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/crates/blockdev/Cargo.toml b/crates/blockdev/Cargo.toml
@@ -11,9 +11,13 @@ anyhow = { workspace = true }
 bootc-utils = { package = "bootc-internal-utils", path = "../utils", version = "0.0.0" }
 camino = { workspace = true, features = ["serde1"] }
 fn-error-context = { workspace = true }
+libc = { workspace = true }
 regex = "1.10.4"
+rustix = { workspace = true }
 serde = { workspace = true, features = ["derive"] }
 serde_json = { workspace = true }
+tempfile = { workspace = true }
+tokio = { workspace = true, features = ["signal"] }
 tracing = { workspace = true }
 
 [dev-dependencies]

diff --git a/crates/blockdev/src/blockdev.rs b/crates/blockdev/src/blockdev.rs
@@ -1,12 +1,12 @@
 use std::collections::HashMap;
 use std::env;
 use std::path::Path;
-use std::process::Command;
+use std::path::PathBuf;
+use std::process::{Command, Stdio};
 use std::sync::OnceLock;
 
 use anyhow::{anyhow, Context, Result};
-use camino::Utf8Path;
-use camino::Utf8PathBuf;
+use camino::{Utf8Path, Utf8PathBuf};
 use fn_error_context::context;
 use regex::Regex;
 use serde::Deserialize;
@@ -181,6 +181,14 @@ pub fn partitions_of(dev: &Utf8Path) -> Result<PartitionTable> {
 
 pub struct LoopbackDevice {
     pub dev: Option<Utf8PathBuf>,
+    // Handle to the cleanup helper process
+    cleanup_handle: Option<LoopbackCleanupHandle>,
+}
+
+/// Handle to manage the cleanup helper process for loopback devices
+struct LoopbackCleanupHandle {
+    /// Child process handle
+    child: std::process::Child,
 }
 
 impl LoopbackDevice {
@@ -208,7 +216,25 @@ impl LoopbackDevice {
             .run_get_string()?;
         let dev = Utf8PathBuf::from(dev.trim());
         tracing::debug!("Allocated loopback {dev}");
-        Ok(Self { dev: Some(dev) })
+
+        // Try to spawn cleanup helper, but don't fail if it doesn't work
+        let cleanup_handle = match Self::spawn_cleanup_helper(dev.as_str()) {
+            Ok(handle) => Some(handle),
+            Err(e) => {
+                tracing::warn!(
+                    "Failed to spawn loopback cleanup helper for {}: {}. \
+                     Loopback device may not be cleaned up if process is interrupted.",
+                    dev,
+                    e
+                );
+                None
+            }
+        };
+
+        Ok(Self {
+            dev: Some(dev),
+            cleanup_handle,
+        })
     }
 
     // Access the path to the loopback block device.
@@ -217,13 +243,85 @@ impl LoopbackDevice {
         self.dev.as_deref().unwrap()
     }
 
+    /// Spawn a cleanup helper process that will clean up the loopback device
+    /// if the parent process dies unexpectedly
+    fn spawn_cleanup_helper(device_path: &str) -> Result<LoopbackCleanupHandle> {
+        // Try multiple strategies to find the bootc binary
+        let bootc_path = Self::find_bootc_binary()
+            .context("Failed to locate bootc binary for cleanup helper")?;
+
+        // Create the helper process
+        let mut cmd = Command::new(bootc_path);
+        cmd.args(["loopback-cleanup-helper", "--device", device_path]);
+
+        // Set environment variable to indicate this is a cleanup helper
+        cmd.env("BOOTC_LOOPBACK_CLEANUP_HELPER", "1");
+
+        // Set up stdio to redirect to /dev/null
+        cmd.stdin(Stdio::null());
+        cmd.stdout(Stdio::null());
+        // Don't redirect stderr so we can see error messages
+
+        // Spawn the process
+        let child = cmd
+            .spawn()
+            .context("Failed to spawn loopback cleanup helper")?;
+
+        Ok(LoopbackCleanupHandle { child })
+    }
+
+    /// Find the bootc binary using multiple strategies
+    fn find_bootc_binary() -> Result<PathBuf> {
+        // Strategy 1: Try /proc/self/exe (works in most cases)
+        if let Ok(exe_path) = std::fs::read_link("/proc/self/exe") {
 // OK now, we always copy our binary to a tempfile, set its security context 
 // OK now, we always copy our binary to a tempfile, set its security context 
+            if exe_path.exists() {
+                return Ok(exe_path);
+            } else {
+                tracing::warn!("/proc/self/exe points to non-existent path: {:?}", exe_path);
+            }
+        } else {
+            tracing::warn!("Failed to read /proc/self/exe");
+        }
+
+        // Strategy 2: Try argv[0] from std::env
+        if let Some(argv0) = std::env::args().next() {
+            let argv0_path = PathBuf::from(argv0);
+            if argv0_path.is_absolute() && argv0_path.exists() {
+                return Ok(argv0_path);
+            }
+            // If it's relative, try to resolve it
+            if let Ok(canonical) = argv0_path.canonicalize() {
+                return Ok(canonical);
+            }
+        }
+
+        // Strategy 3: Try common installation paths
+        let common_paths = ["/usr/bin/bootc", "/usr/local/bin/bootc"];
+
+        for path in &common_paths {
+            let path_buf = PathBuf::from(path);
+            if path_buf.exists() {
+                return Ok(path_buf);
+            }
+        }
+
+        anyhow::bail!("Could not locate bootc binary using any available strategy")
+    }
+
     // Shared backend for our `close` and `drop` implementations.
     fn impl_close(&mut self) -> Result<()> {
         // SAFETY: This is the only place we take the option
         let Some(dev) = self.dev.take() else {
             tracing::trace!("loopback device already deallocated");
             return Ok(());
         };
+
+        // Kill the cleanup helper since we're cleaning up normally
+        if let Some(mut cleanup_handle) = self.cleanup_handle.take() {
+            // Send SIGTERM to the child process and let it do the cleanup
+            let _ = cleanup_handle.child.kill();
+        }
+
         Command::new("losetup").args(["-d", dev.as_str()]).run()
     }
 
@@ -240,6 +338,56 @@ impl Drop for LoopbackDevice {
     }
 }
 
+/// Main function for the loopback cleanup helper process
+/// This function does not return - it either exits normally or via signal
+pub async fn run_loopback_cleanup_helper(device_path: &str) -> Result<()> {
+    // Check if we're running as a cleanup helper
+    if std::env::var("BOOTC_LOOPBACK_CLEANUP_HELPER").is_err() {
+        anyhow::bail!("This function should only be called as a cleanup helper");
+    }
+
+    // Set up death signal notification - we want to be notified when parent dies
+    rustix::process::set_parent_process_death_signal(Some(rustix::process::Signal::TERM))
+        .context("Failed to set parent death signal")?;
+
+    // Wait for SIGTERM (either from parent death or normal cleanup)
+    tokio::signal::unix::signal(tokio::signal::unix::SignalKind::terminate())
+        .expect("Failed to create signal stream")
+        .recv()
+        .await;
+
+    // Clean up the loopback device
+    let output = std::process::Command::new("losetup")
+        .args(["-d", device_path])
+        .output();
+
+    match output {
+        Ok(output) if output.status.success() => {
+            // Log to systemd journal instead of stderr
+            tracing::info!("Cleaned up leaked loopback device {}", device_path);
+            std::process::exit(0);
+        }
+        Ok(output) => {
+            let stderr = String::from_utf8_lossy(&output.stderr);
+            tracing::error!(
+                "Failed to clean up loopback device {}: {}. Stderr: {}",
+                device_path,
+                output.status,
+                stderr.trim()
+            );
+            std::process::exit(1);
+        }
+        Err(e) => {
+            tracing::error!(
+                "Error executing losetup to clean up loopback device {}: {}",
+                device_path,
+                e
+            );
+            std::process::exit(1);
+        }
+    }
+}
+
 /// Parse key-value pairs from lsblk --pairs.
 /// Newer versions of lsblk support JSON but the one in CentOS 7 doesn't.
 fn split_lsblk_line(line: &str) -> HashMap<String, String> {

diff --git a/crates/lib/src/cli.rs b/crates/lib/src/cli.rs
@@ -462,6 +462,18 @@ pub(crate) enum InternalsOpts {
         #[clap(allow_hyphen_values = true)]
         args: Vec<OsString>,
     },
+    /// Loopback device cleanup helper (internal use only)
+    LoopbackCleanupHelper {
+        /// Device path to clean up
+        #[clap(long)]
+        device: String,
+    },
+    /// Test loopback device allocation and cleanup (internal use only)
+    AllocateCleanupLoopback {
+        /// File path to create loopback device for
+        #[clap(long)]
+        file_path: Utf8PathBuf,
+    },
     /// Invoked from ostree-ext to complete an installation.
     BootcInstallCompletion {
         /// Path to the sysroot
@@ -1263,6 +1275,29 @@ async fn run_from_opt(opt: Opt) -> Result<()> {
                 let rootfs = &Dir::open_ambient_dir("/", cap_std::ambient_authority())?;
                 crate::install::completion::run_from_ostree(rootfs, &sysroot, &stateroot).await
             }
+            InternalsOpts::LoopbackCleanupHelper { device } => {
+                crate::blockdev::run_loopback_cleanup_helper(&device).await
+            }
+            InternalsOpts::AllocateCleanupLoopback { file_path: _ } => {
+                // Create a temporary file for testing
+                let temp_file =
+                    tempfile::NamedTempFile::new().context("Failed to create temporary file")?;
+                let temp_path = temp_file.path();
+
+                // Create a loopback device
+                let loopback = crate::blockdev::LoopbackDevice::new(temp_path)
+                    .context("Failed to create loopback device")?;
+
+                println!("Created loopback device: {}", loopback.path());
+
+                // Close the device to test cleanup
+                loopback
+                    .close()
+                    .context("Failed to close loopback device")?;
+
+                println!("Successfully closed loopback device");
+                Ok(())
+            }
             #[cfg(feature = "rhsm")]
             InternalsOpts::PublishRhsmFacts => crate::rhsm::publish_facts(&root).await,
         },

diff --git a/crates/lib/src/lib.rs b/crates/lib/src/lib.rs
@@ -38,3 +38,6 @@ mod kernel;
 
 #[cfg(feature = "rhsm")]
 mod rhsm;
+
+// Re-export blockdev crate for internal use
+pub(crate) use bootc_blockdev as blockdev;