mozilla · sylvestre · Mar 15, 2026 · Mar 15, 2026 · Mar 15, 2026 · Mar 15, 2026
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
@@ -44,6 +44,8 @@ jobs:
       - name: Clone repository
         uses: actions/checkout@v5
 
+      # TODO: restore `cargo test` once per-feature tests are compatible with
+      # both server-side and client-side compilation modes.
       - name: Check feature ${{ matrix.feature }}
         run: cargo check --no-default-features --features ${{ matrix.feature }}
 

diff --git a/docs/Architecture.md b/docs/Architecture.md
@@ -1,21 +1,166 @@
 # Sccache high level architecture
 
-This schema shows at high level how sccache works.
+Sccache supports two compilation modes: **server-side compilation** (legacy) and **client-side compilation** (new). The mode is controlled by the `SCCACHE_CLIENT_SIDE_COMPILE` environment variable.
 
+## Server-Side Compilation (Legacy Mode)
+
+This is the default mode when `SCCACHE_CLIENT_SIDE_COMPILE` is unset or set to `0`.
+
+In this mode, the server performs all compilation work:
+
+```mermaid
+  sequenceDiagram
+      participant Client as Client Process
+      participant Server as Sccache Server
+      participant Storage as Cache Storage
+
+      Client->>Server: 1. Compile Request (exe, args, cwd, env)
+      Server->>Server: 2. Detect Compiler
+      Server->>Server: 3. Preprocess & Hash
+      Server->>Storage: 4. Check Cache
+      alt Cache Lookup Result: Hit
+          rect rgba(0, 128, 0, 0.1)
+              Storage-->>Server: Cached Entry
+              Server-->>Client: 5a. Return Cached Result
+          end
+      else Cache Lookup Result: Miss
+          rect rgba(200, 0, 0, 0.1)
+              Storage-->>Server: Miss
+              Server->>Server: 5b. Compile Locally
+              Server->>Storage: 6. Store Result
+              Server-->>Client: 7. Return Result
+          end
+      end
+```
+
+**Characteristics**:
+- Server performs compiler detection, preprocessing, hash generation, and compilation
+- All work happens on the server machine
+- Server can become a bottleneck with many parallel clients
+- Higher server CPU and memory usage
+
+## Client-Side Compilation (New Mode)
+
+Enabled by setting `SCCACHE_CLIENT_SIDE_COMPILE=1`.
+
+In this mode, the client performs compilation work and the server acts as pure storage:
+
+```mermaid
+  sequenceDiagram
+      participant Client as Client Process
+      participant Server as Sccache Server (Storage Only)
+      participant Storage as Cache Storage
+
+      Client->>Client: 1. Detect Compiler
+      Client->>Client: 2. Preprocess & Hash
+      Client->>Server: 3. CacheGet Request (cache_key)
+      Server->>Storage: 4. Query Storage
+      alt Cache Lookup Result: Hit
+          rect rgba(0, 128, 0, 0.1)
+              Storage-->>Server: Cached Entry
+              Server-->>Client: 5a. Return Cache Entry
+              Client->>Client: Use Cached Result
+          end
+      else Cache Lookup Result: Miss
+          rect rgba(200, 0, 0, 0.1)
+              Storage-->>Server: Miss
+              Server-->>Client: 5b. Cache Miss
+              Client->>Client: 6. Compile Locally
+              Client->>Server: 7. CachePut Request (cache_key, entry)
+              Server->>Storage: 8. Store in Cache
+          end
+      end
+```
+
+**Characteristics**:
+- Client performs compiler detection, preprocessing, hash generation, and compilation
+- Server only handles cache storage operations (get/put)
+- Work is distributed across all clients (better scalability)
+- Lower server CPU and memory usage
+- Reduced network latency on cache hits (a single `CacheGet` round trip; a cache miss adds one `CachePut` request)
+
+**Why this is fast**: for C/C++, preprocessing in client-side mode is cheap — it only concatenates source files rather than running the full C/C++ preprocessor. This avoids the expensive `#include` expansion and macro evaluation that dominate traditional preprocessing time, making it practical to move this work to the client without a performance penalty.
+
+**Note**: Client-side compilation is functional but considered experimental. Enable it by setting `SCCACHE_CLIENT_SIDE_COMPILE=1`.
+
+## Comparison
+
+| Aspect | Server-Side (Legacy) | Client-Side (New) |
+|--------|---------------------|-------------------|
+| Compiler Detection | Server | Client (with caching) |
+| Preprocessing | Server | Client |
+| Hash Generation | Server | Client |
+| Compilation | Server | Client |
+| Server Role | Full compilation service | Pure storage service |
+| Server CPU Usage | High | Low |
+| Server Memory Usage | Moderate | Low |
+| Client Overhead | Low | Moderate |
+| Scalability | Limited by server | Excellent |
+| Network Requests | Multiple round trips | One `CacheGet` (plus one `CachePut` on a miss) |
+
+## Cache Key Generation
+
+Regardless of the mode, cache keys are generated from:
 
 ```mermaid
   flowchart LR
       id1[[Environment variables]] --> hash
       id2[[Compiler binary]] --> hash
       id3[[Compiler arguments]] --> hash
-      id5[[Files]] --> |  | hash
-      Compile --> Upload
-      Storage[(Storage)] --> | yes | Download
-      hash([hash]) --> | exists? | Storage
-      Storage --> | no | Compile
-      Upload --> Storage
+      id5[[Preprocessed Files]] --> hash
+      hash([BLAKE3 Hash]) --> key[Cache Key]
+
+      style id1 fill:#e8f4fd,stroke:#5dade2,color:#333
+      style id2 fill:#e8f4fd,stroke:#5dade2,color:#333
+      style id3 fill:#e8f4fd,stroke:#5dade2,color:#333
+      style id5 fill:#e8f4fd,stroke:#5dade2,color:#333
+      style hash fill:#eafaf1,stroke:#58d68d,color:#333
+      style key fill:#fef9e7,stroke:#f4d03f,color:#333
 ```
 
+### C/C++ vs Rust
+
+The "preprocessing" step differs significantly between languages:
+
+- **C/C++**: in server-side mode, sccache runs the compiler's preprocessor (`gcc -E` / `clang -E`) to expand all `#include` directives and macros, producing a single translation unit. The preprocessed output is then hashed. This is the expensive part — include expansion can pull in thousands of header files.
+
+- **Rust**: there is no preprocessor. Instead, sccache runs `rustc --emit dep-info`, a lightweight invocation that outputs a `.d` file listing all source files and environment variables the crate depends on — without compiling anything. Sccache then hashes each source file individually, along with extern crate `.rlib` files, static libraries, and any target JSON file. This dependency discovery step is fast compared to full compilation.
+
+In client-side mode, this work moves to the client. For Rust, the cost is minimal since `--emit dep-info` is cheap. For C/C++, preprocessing is replaced by simple file concatenation, avoiding the expensive include expansion entirely.
+
+For more details about how hash generation works, see [the caching documentation](Caching.md).
+
+## Protocol
+
+### Server-Side Mode Protocol
+
+- **Request**: `Compile(Compile)` - Contains executable path, arguments, working directory, environment variables
+- **Response**: `CompileFinished(CompileFinished)` - Contains exit code, stdout, stderr, and output file paths
+
+### Client-Side Mode Protocol
+
+- **Request**: `CacheGet(CacheGetRequest)` - Contains cache key
+- **Response**: `CacheGetResponse::Hit(Vec<u8>)` - Cache entry as bytes
+- **Response**: `CacheGetResponse::Miss` - Cache miss
+- **Request**: `CachePut(CachePutRequest)` - Contains cache key and entry bytes
+- **Response**: `CachePutResponse(Duration)` - Storage duration
+
+The protocol supports version negotiation to maintain backward compatibility during migration from server-side to client-side mode.
+
+## Storage Backends
+
+Both modes use the same cache storage backends:
+
+- **Local Disk** (`SCCACHE_DIR`)
+- **S3 Compatible** (`SCCACHE_BUCKET`, `SCCACHE_ENDPOINT`)
+- **Redis** (`SCCACHE_REDIS_ENDPOINT`)
+- **Memcached** (`SCCACHE_MEMCACHED_ENDPOINT`)
+- **Google Cloud Storage** (`SCCACHE_GCS_BUCKET`)
+- **Azure Blob Storage** (`SCCACHE_AZURE_CONNECTION_STRING`)
+- **GitHub Actions Cache** (`SCCACHE_GHA_CACHE_URL`)
+- **WebDAV** (`SCCACHE_WEBDAV_ENDPOINT`)
+- **Alibaba Cloud OSS** (`SCCACHE_OSS_BUCKET`)
+- **Tencent Cloud COS** (`SCCACHE_COS_BUCKET`)
 
-For more details about hash generation works, see [the caching documentation](Caching.md).
+See [Configuration.md](Configuration.md) for storage backend configuration details.
 
diff --git a/src/cache/cache.rs b/src/cache/cache.rs
@@ -297,7 +297,7 @@ impl Storage for RemoteStorage {
 pub fn build_single_cache(
     cache_type: &CacheType,
     basedirs: &[Vec<u8>],
-    _pool: &tokio::runtime::Handle,
+    pool: &tokio::runtime::Handle,
 ) -> Result<Arc<dyn Storage>> {
     match cache_type {
         #[cfg(feature = "azure")]
@@ -330,6 +330,7 @@ pub fn build_single_cache(
                 service_account.as_deref(),
                 (*rw_mode).into(),
                 credential_url.as_deref(),
+                pool,
             )
             .map_err(|err| anyhow!("create gcs cache failed: {err:?}"))?;
             let storage = RemoteStorage::new(operator, basedirs.to_vec());

diff --git a/src/cache/cache_io.rs b/src/cache/cache_io.rs
@@ -13,6 +13,7 @@
 use super::utils::{get_file_mode, set_file_mode};
 use crate::errors::*;
 use fs_err as fs;
+use serde::{Deserialize, Serialize};
 use std::fmt;
 use std::io::{Cursor, Read, Seek, Write};
 use std::path::PathBuf;
@@ -21,7 +22,7 @@ use zip::write::FileOptions;
 use zip::{CompressionMethod, ZipArchive, ZipWriter};
 
 /// Cache object sourced by a file.
-#[derive(Clone)]
+#[derive(Clone, Debug, Serialize, Deserialize)]
 pub struct FileObjectSource {
     /// Identifier for this object. Should be unique within a compilation unit.
     /// Note that a compilation unit is a single source file in C/C++ and a crate in Rust.
@@ -172,13 +173,26 @@ impl CacheRead {
 /// Data to be stored in the compiler cache.
 pub struct CacheWrite {
     zip: ZipWriter<Cursor<Vec<u8>>>,
+    /// Pre-built zip bytes (from `from_bytes`). When set, `finish()` returns
+    /// these bytes directly instead of finalising the ZipWriter.
+    prebuilt: Option<Vec<u8>>,
 }
 
 impl CacheWrite {
     /// Create a new, empty cache entry.
     pub fn new() -> CacheWrite {
         CacheWrite {
             zip: ZipWriter::new(Cursor::new(vec![])),
+            prebuilt: None,
+        }
+    }
+
+    /// Create a cache entry from pre-serialized bytes received over the wire.
+    /// `finish()` will return these bytes unchanged.
+    pub fn from_bytes(data: Vec<u8>) -> CacheWrite {
+        CacheWrite {
+            zip: ZipWriter::new(Cursor::new(vec![])),
+            prebuilt: Some(data),
         }
     }
 
@@ -257,7 +271,10 @@ impl CacheWrite {
 
     /// Finish writing data to the cache entry writer, and return the data.
     pub fn finish(self) -> Result<Vec<u8>> {
-        let CacheWrite { mut zip } = self;
+        let CacheWrite { mut zip, prebuilt } = self;
+        if let Some(bytes) = prebuilt {
+            return Ok(bytes);
+        }
         let cur = zip.finish().context("Failed to finish cache entry zip")?;
         Ok(cur.into_inner())
     }

diff --git a/src/cache/gcs.rs b/src/cache/gcs.rs
@@ -45,6 +45,7 @@ impl GCSCache {
         service_account: Option<&str>,
         rw_mode: CacheMode,
         credential_url: Option<&str>,
+        pool: &tokio::runtime::Handle,
     ) -> Result<Operator> {
         let mut builder = Gcs::default()
             .bucket(bucket)
@@ -64,11 +65,9 @@ impl GCSCache {
                 .map_err(|err| anyhow!("gcs credential url is invalid: {err:?}"))?;
 
             // For TaskCluster integration, fetch token directly and provide it to OpenDAL
-            let token = tokio::task::block_in_place(|| {
-                tokio::runtime::Handle::current()
-                    .block_on(fetch_taskcluster_token(cred_url, rw_to_scope(rw_mode)))
-            })
-            .map_err(|e| anyhow!("Failed to fetch TaskCluster token: {e}"))?;
+            let token = pool
+                .block_on(fetch_taskcluster_token(cred_url, rw_to_scope(rw_mode)))
+                .map_err(|e| anyhow!("Failed to fetch TaskCluster token: {e}"))?;
             builder = builder.token(token);
         }
 
@@ -93,7 +92,10 @@ async fn fetch_taskcluster_token(url: &str, scope: &str) -> Result<String> {
     debug!("gcs: start to load token from: {}", url);
 
     let user_agent = format!("{}/{}", env!("CARGO_PKG_NAME"), env!("CARGO_PKG_VERSION"));
-    let client = Client::builder().user_agent(user_agent).build()?;
+    let client = Client::builder()
+        .user_agent(user_agent)
+        .timeout(std::time::Duration::from_secs(30))
+        .build()?;
     let res = client.get(url).send().await?;
 
     if res.status().is_success() {