diff --git a/daw-backend/Fade.wav b/daw-backend/Fade.wav
deleted file mode 100644
index 23475eb..0000000
Binary files a/daw-backend/Fade.wav and /dev/null differ
diff --git a/daw-backend/audio.flac b/daw-backend/audio.flac
deleted file mode 100644
index b2d146f..0000000
Binary files a/daw-backend/audio.flac and /dev/null differ
diff --git a/daw-backend/src/audio/disk_reader.rs b/daw-backend/src/audio/disk_reader.rs
index c288128..5c264f7 100644
--- a/daw-backend/src/audio/disk_reader.rs
+++ b/daw-backend/src/audio/disk_reader.rs
@@ -69,6 +69,11 @@ pub struct ReadAheadBuffer {
     channels: u32,
     /// Source file sample rate.
     sample_rate: u32,
+    /// Last file-local frame requested by the audio callback.
+    /// Written by the consumer (render_from_file), read by the disk reader.
+    /// The disk reader uses this instead of the global playhead to know
+    /// where in the file to buffer around.
+    target_frame: AtomicU64,
 }
 
 // SAFETY: See the doc comment on ReadAheadBuffer for the full safety argument.
@@ -102,6 +107,7 @@ impl ReadAheadBuffer {
             capacity_frames,
             channels,
             sample_rate,
+            target_frame: AtomicU64::new(0),
         }
     }
 
@@ -158,6 +164,20 @@ impl ReadAheadBuffer {
         self.valid_frames.load(Ordering::Acquire)
     }
 
+    /// Update the target frame — the file-local frame the audio callback
+    /// is currently reading from. Called by `render_from_file` (consumer).
+    #[inline]
+    pub fn set_target_frame(&self, frame: u64) {
+        self.target_frame.store(frame, Ordering::Relaxed);
+    }
+
+    /// Get the target frame set by the audio callback.
+    /// Called by the disk reader thread (producer).
+    #[inline]
+    pub fn target_frame(&self) -> u64 {
+        self.target_frame.load(Ordering::Relaxed)
+    }
+
     /// Reset the buffer to start at `new_start` with zero valid frames.
     /// Called by the **disk reader thread** (producer) after a seek.
     pub fn reset(&self, new_start: u64) {
@@ -431,20 +451,16 @@ pub struct DiskReader {
 
 impl DiskReader {
     /// Create a new disk reader with a background thread.
-    ///
-    /// `playhead_frame` should be the same `Arc<AtomicU64>` used by the engine
-    /// so the disk reader knows where to fill ahead.
     pub fn new(playhead_frame: Arc<AtomicU64>, _sample_rate: u32) -> Self {
         let (command_tx, command_rx) = rtrb::RingBuffer::new(64);
         let running = Arc::new(AtomicBool::new(true));
 
         let thread_running = running.clone();
-        let thread_playhead = playhead_frame.clone();
 
         let thread_handle = std::thread::Builder::new()
             .name("disk-reader".into())
             .spawn(move || {
-                Self::reader_thread(command_rx, thread_playhead, thread_running);
+                Self::reader_thread(command_rx, thread_running);
             })
             .expect("Failed to spawn disk reader thread");
 
@@ -473,7 +489,6 @@ impl DiskReader {
     /// The disk reader background thread.
     fn reader_thread(
         mut command_rx: rtrb::Consumer<DiskReaderCommand>,
-        playhead_frame: Arc<AtomicU64>,
         running: Arc<AtomicBool>,
     ) {
         let mut active_files: HashMap<usize, (CompressedReader, Arc<ReadAheadBuffer>)> =
@@ -506,6 +521,7 @@ impl DiskReader {
                     }
                     DiskReaderCommand::Seek { frame } => {
                         for (_, (reader, buffer)) in active_files.iter_mut() {
+                            buffer.set_target_frame(frame);
                             buffer.reset(frame);
                             if let Err(e) = reader.seek(frame) {
                                 eprintln!("[DiskReader] Seek error: {}", e);
@@ -518,26 +534,28 @@ impl DiskReader {
                 }
             }
 
-            let playhead = playhead_frame.load(Ordering::Relaxed);
-
-            // Fill each active file's buffer ahead of the playhead.
+            // Fill each active file's buffer ahead of its target frame.
+            // Each file's target_frame is set by the audio callback in
+            // render_from_file, giving the file-local frame being read.
+            // This is independent of the global engine playhead.
             for (_pool_index, (reader, buffer)) in active_files.iter_mut() {
+                let target = buffer.target_frame();
                 let buf_start = buffer.start_frame();
                 let buf_valid = buffer.valid_frames_count();
                 let buf_end = buf_start + buf_valid;
 
-                // If the playhead has jumped behind or far ahead of the buffer,
+                // If the target has jumped behind or far ahead of the buffer,
                 // seek the decoder and reset.
-                if playhead < buf_start || playhead > buf_end + reader.sample_rate as u64 {
-                    buffer.reset(playhead);
-                    let _ = reader.seek(playhead);
+                if target < buf_start || target > buf_end + reader.sample_rate as u64 {
+                    buffer.reset(target);
+                    let _ = reader.seek(target);
                     continue;
                 }
 
-                // Advance the buffer start to reclaim space behind the playhead.
+                // Advance the buffer start to reclaim space behind the target.
                 // Keep a small lookback for sinc interpolation (~32 frames).
                 let lookback = 64u64;
-                let advance_to = playhead.saturating_sub(lookback);
+                let advance_to = target.saturating_sub(lookback);
                 if advance_to > buf_start {
                     buffer.advance_start(advance_to);
                 }
@@ -547,7 +565,7 @@ impl DiskReader {
                 let buf_valid = buffer.valid_frames_count();
                 let buf_end = buf_start + buf_valid;
                 let prefetch_target =
-                    playhead + (PREFETCH_SECONDS * reader.sample_rate as f64) as u64;
+                    target + (PREFETCH_SECONDS * reader.sample_rate as f64) as u64;
 
                 if buf_end >= prefetch_target {
                     continue; // Already filled far enough ahead.
diff --git a/daw-backend/src/audio/engine.rs b/daw-backend/src/audio/engine.rs
index cde4b96..94f1b13 100644
--- a/daw-backend/src/audio/engine.rs
+++ b/daw-backend/src/audio/engine.rs
@@ -489,6 +489,10 @@ impl Engine {
                 self.playhead_atomic.store(0, Ordering::Relaxed);
                 // Stop all MIDI notes when stopping playback
                 self.project.stop_all_notes();
+                // Reset disk reader buffers to the new playhead position
+                if let Some(ref mut dr) = self.disk_reader {
+                    dr.send(crate::audio::disk_reader::DiskReaderCommand::Seek { frame: 0 });
+                }
             }
             Command::Pause => {
                 self.playing = false;
@@ -1686,165 +1690,144 @@ impl Engine {
             }
 
             Command::ImportAudio(path) => {
-                let path_str = path.to_string_lossy().to_string();
-
-                // Step 1: Read metadata (fast — no decoding)
-                let metadata = match crate::io::read_metadata(&path) {
-                    Ok(m) => m,
-                    Err(e) => {
-                        eprintln!("[ENGINE] ImportAudio failed to read metadata for {:?}: {}", path, e);
-                        return;
-                    }
-                };
-
-                let pool_index;
-
-                eprintln!("[ENGINE] ImportAudio: format={:?}, ch={}, sr={}, n_frames={:?}, duration={:.2}s, path={}",
-                    metadata.format, metadata.channels, metadata.sample_rate, metadata.n_frames, metadata.duration, path_str);
-
-                match metadata.format {
-                    crate::io::AudioFormat::Pcm => {
-                        // WAV/AIFF: memory-map the file for instant availability
-                        let file = match std::fs::File::open(&path) {
-                            Ok(f) => f,
-                            Err(e) => {
-                                eprintln!("[ENGINE] ImportAudio failed to open {:?}: {}", path, e);
-                                return;
-                            }
-                        };
-
-                        // SAFETY: The file is opened read-only. The mmap is shared
-                        // immutably. We never write to it.
-                        let mmap = match unsafe { memmap2::Mmap::map(&file) } {
-                            Ok(m) => m,
-                            Err(e) => {
-                                eprintln!("[ENGINE] ImportAudio mmap failed for {:?}: {}", path, e);
-                                return;
-                            }
-                        };
-
-                        // Parse WAV header to find PCM data offset and format
-                        let header = match crate::io::parse_wav_header(&mmap) {
-                            Ok(h) => h,
-                            Err(e) => {
-                                eprintln!("[ENGINE] ImportAudio WAV parse failed for {:?}: {}", path, e);
-                                return;
-                            }
-                        };
-
-                        let audio_file = crate::audio::pool::AudioFile::from_mmap(
-                            path.clone(),
-                            mmap,
-                            header.data_offset,
-                            header.sample_format,
-                            header.channels,
-                            header.sample_rate,
-                            header.total_frames,
-                        );
-
-                        pool_index = self.audio_pool.add_file(audio_file);
-                    }
-                    crate::io::AudioFormat::Compressed => {
-                        let sync_decode = std::env::var("DAW_SYNC_DECODE").is_ok();
-
-                        if sync_decode {
-                            // Diagnostic: full synchronous decode to InMemory (bypasses ring buffer)
-                            eprintln!("[ENGINE] DAW_SYNC_DECODE: doing full decode of {:?}", path);
-                            match crate::io::AudioFile::load(&path) {
-                                Ok(loaded) => {
-                                    let ext = path.extension()
-                                        .and_then(|e| e.to_str())
-                                        .map(|s| s.to_lowercase());
-                                    let audio_file = crate::audio::pool::AudioFile::with_format(
-                                        path.clone(),
-                                        loaded.data,
-                                        loaded.channels,
-                                        loaded.sample_rate,
-                                        ext,
-                                    );
-                                    pool_index = self.audio_pool.add_file(audio_file);
-                                    eprintln!("[ENGINE] DAW_SYNC_DECODE: pool_index={}, frames={}", pool_index, loaded.frames);
-                                }
-                                Err(e) => {
-                                    eprintln!("[ENGINE] DAW_SYNC_DECODE failed: {}", e);
-                                    return;
-                                }
-                            }
-                        } else {
-                            // Normal path: stream decode via disk reader
-                            let ext = path.extension()
-                                .and_then(|e| e.to_str())
-                                .map(|s| s.to_lowercase());
-
-                            let total_frames = metadata.n_frames.unwrap_or_else(|| {
-                                (metadata.duration * metadata.sample_rate as f64).ceil() as u64
-                            });
-
-                            let mut audio_file = crate::audio::pool::AudioFile::from_compressed(
-                                path.clone(),
-                                metadata.channels,
-                                metadata.sample_rate,
-                                total_frames,
-                                ext,
-                            );
-
-                            let buffer = crate::audio::disk_reader::DiskReader::create_buffer(
-                                metadata.sample_rate,
-                                metadata.channels,
-                            );
-                            audio_file.read_ahead = Some(buffer.clone());
-
-                            pool_index = self.audio_pool.add_file(audio_file);
-
-                            eprintln!("[ENGINE] Compressed: total_frames={}, pool_index={}, has_disk_reader={}",
-                                total_frames, pool_index, self.disk_reader.is_some());
-
-                            if let Some(ref mut dr) = self.disk_reader {
-                                dr.send(crate::audio::disk_reader::DiskReaderCommand::ActivateFile {
-                                    pool_index,
-                                    path: path.clone(),
-                                    buffer,
-                                });
-                            }
-
-                            // Spawn background thread to decode full file for waveform display
-                            let bg_tx = self.chunk_generation_tx.clone();
-                            let bg_path = path.clone();
-                            let _ = std::thread::Builder::new()
-                                .name(format!("waveform-decode-{}", pool_index))
-                                .spawn(move || {
-                                    eprintln!("[WAVEFORM DECODE] Starting full decode of {:?}", bg_path);
-                                    match crate::io::AudioFile::load(&bg_path) {
-                                        Ok(loaded) => {
-                                            eprintln!("[WAVEFORM DECODE] Complete: {} frames, {} channels",
-                                                loaded.frames, loaded.channels);
-                                            let _ = bg_tx.send(AudioEvent::WaveformDecodeComplete {
-                                                pool_index,
-                                                samples: loaded.data,
-                                            });
-                                        }
-                                        Err(e) => {
-                                            eprintln!("[WAVEFORM DECODE] Failed to decode {:?}: {}", bg_path, e);
-                                        }
-                                    }
-                                });
-                        }
-                    }
+                if let Err(e) = self.do_import_audio(&path) {
+                    eprintln!("[ENGINE] ImportAudio failed for {:?}: {}", path, e);
                 }
-
-                // Emit AudioFileReady event
-                let _ = self.event_tx.push(AudioEvent::AudioFileReady {
-                    pool_index,
-                    path: path_str,
-                    channels: metadata.channels,
-                    sample_rate: metadata.sample_rate,
-                    duration: metadata.duration,
-                    format: metadata.format,
-                });
             }
         }
     }
 
+    /// Import an audio file into the pool: mmap for PCM, streaming for compressed.
+    /// Returns the pool index on success. Emits AudioFileReady event.
+    fn do_import_audio(&mut self, path: &std::path::Path) -> Result<usize, String> {
+        let path_str = path.to_string_lossy().to_string();
+
+        let metadata = crate::io::read_metadata(path)
+            .map_err(|e| format!("Failed to read metadata for {:?}: {}", path, e))?;
+
+        eprintln!("[ENGINE] ImportAudio: format={:?}, ch={}, sr={}, n_frames={:?}, duration={:.2}s, path={}",
+            metadata.format, metadata.channels, metadata.sample_rate, metadata.n_frames, metadata.duration, path_str);
+
+        let pool_index = match metadata.format {
+            crate::io::AudioFormat::Pcm => {
+                let file = std::fs::File::open(path)
+                    .map_err(|e| format!("Failed to open {:?}: {}", path, e))?;
+
+                // SAFETY: The file is opened read-only. The mmap is shared
+                // immutably. We never write to it.
+                let mmap = unsafe { memmap2::Mmap::map(&file) }
+                    .map_err(|e| format!("mmap failed for {:?}: {}", path, e))?;
+
+                let header = crate::io::parse_wav_header(&mmap)
+                    .map_err(|e| format!("WAV parse failed for {:?}: {}", path, e))?;
+
+                let audio_file = crate::audio::pool::AudioFile::from_mmap(
+                    path.to_path_buf(),
+                    mmap,
+                    header.data_offset,
+                    header.sample_format,
+                    header.channels,
+                    header.sample_rate,
+                    header.total_frames,
+                );
+
+                self.audio_pool.add_file(audio_file)
+            }
+            crate::io::AudioFormat::Compressed => {
+                let sync_decode = std::env::var("DAW_SYNC_DECODE").is_ok();
+
+                if sync_decode {
+                    eprintln!("[ENGINE] DAW_SYNC_DECODE: doing full decode of {:?}", path);
+                    let loaded = crate::io::AudioFile::load(path)
+                        .map_err(|e| format!("DAW_SYNC_DECODE failed: {}", e))?;
+                    let ext = path.extension()
+                        .and_then(|e| e.to_str())
+                        .map(|s| s.to_lowercase());
+                    let audio_file = crate::audio::pool::AudioFile::with_format(
+                        path.to_path_buf(),
+                        loaded.data,
+                        loaded.channels,
+                        loaded.sample_rate,
+                        ext,
+                    );
+                    let idx = self.audio_pool.add_file(audio_file);
+                    eprintln!("[ENGINE] DAW_SYNC_DECODE: pool_index={}, frames={}", idx, loaded.frames);
+                    idx
+                } else {
+                    let ext = path.extension()
+                        .and_then(|e| e.to_str())
+                        .map(|s| s.to_lowercase());
+
+                    let total_frames = metadata.n_frames.unwrap_or_else(|| {
+                        (metadata.duration * metadata.sample_rate as f64).ceil() as u64
+                    });
+
+                    let mut audio_file = crate::audio::pool::AudioFile::from_compressed(
+                        path.to_path_buf(),
+                        metadata.channels,
+                        metadata.sample_rate,
+                        total_frames,
+                        ext,
+                    );
+
+                    let buffer = crate::audio::disk_reader::DiskReader::create_buffer(
+                        metadata.sample_rate,
+                        metadata.channels,
+                    );
+                    audio_file.read_ahead = Some(buffer.clone());
+
+                    let idx = self.audio_pool.add_file(audio_file);
+
+                    eprintln!("[ENGINE] Compressed: total_frames={}, pool_index={}, has_disk_reader={}",
+                        total_frames, idx, self.disk_reader.is_some());
+
+                    if let Some(ref mut dr) = self.disk_reader {
+                        dr.send(crate::audio::disk_reader::DiskReaderCommand::ActivateFile {
+                            pool_index: idx,
+                            path: path.to_path_buf(),
+                            buffer,
+                        });
+                    }
+
+                    // Spawn background thread to decode full file for waveform display
+                    let bg_tx = self.chunk_generation_tx.clone();
+                    let bg_path = path.to_path_buf();
+                    let _ = std::thread::Builder::new()
+                        .name(format!("waveform-decode-{}", idx))
+                        .spawn(move || {
+                            eprintln!("[WAVEFORM DECODE] Starting full decode of {:?}", bg_path);
+                            match crate::io::AudioFile::load(&bg_path) {
+                                Ok(loaded) => {
+                                    eprintln!("[WAVEFORM DECODE] Complete: {} frames, {} channels",
+                                        loaded.frames, loaded.channels);
+                                    let _ = bg_tx.send(AudioEvent::WaveformDecodeComplete {
+                                        pool_index: idx,
+                                        samples: loaded.data,
+                                    });
+                                }
+                                Err(e) => {
+                                    eprintln!("[WAVEFORM DECODE] Failed to decode {:?}: {}", bg_path, e);
+                                }
+                            }
+                        });
+                    idx
+                }
+            }
+        };
+
+        // Emit AudioFileReady event
+        let _ = self.event_tx.push(AudioEvent::AudioFileReady {
+            pool_index,
+            path: path_str,
+            channels: metadata.channels,
+            sample_rate: metadata.sample_rate,
+            duration: metadata.duration,
+            format: metadata.format,
+        });
+
+        Ok(pool_index)
+    }
+
     /// Handle synchronous queries from the UI thread
     fn handle_query(&mut self, query: Query) {
         let response = match query {
@@ -2231,6 +2214,9 @@ impl Engine {
 
                 QueryResponse::AudioFileAddedSync(Ok(pool_index))
             }
+            Query::ImportAudioSync(path) => {
+                QueryResponse::AudioImportedSync(self.do_import_audio(&path))
+            }
             Query::GetProject => {
                 // Clone the entire project for serialization
                 QueryResponse::ProjectRetrieved(Ok(Box::new(self.project.clone())))
@@ -2674,6 +2660,21 @@ impl EngineController {
         let _ = self.command_tx.push(Command::ImportAudio(path));
     }
 
+    /// Import an audio file synchronously and get the pool index.
+    /// Does the same work as `import_audio` (mmap for PCM, streaming for
+    /// compressed) but returns the real pool index directly.
+    /// NOTE: briefly blocks the UI thread during file setup (sub-ms for PCM
+    /// mmap; a few ms for compressed streaming init). If this becomes a
+    /// problem for very large files, switch to async import with event-based
+    /// pool index reconciliation.
+    pub fn import_audio_sync(&mut self, path: std::path::PathBuf) -> Result<usize, String> {
+        let query = Query::ImportAudioSync(path);
+        match self.send_query(query)? {
+            QueryResponse::AudioImportedSync(result) => result,
+            _ => Err("Unexpected query response".to_string()),
+        }
+    }
+
     /// Add a clip to an audio track
     pub fn add_audio_clip(&mut self, track_id: TrackId, pool_index: usize, start_time: f64, duration: f64, offset: f64) {
         let _ = self.command_tx.push(Command::AddAudioClip(track_id, pool_index, start_time, duration, offset));
diff --git a/daw-backend/src/audio/pool.rs b/daw-backend/src/audio/pool.rs
index 7374da8..67ce6e3 100644
--- a/daw-backend/src/audio/pool.rs
+++ b/daw-backend/src/audio/pool.rs
@@ -511,6 +511,11 @@ impl AudioClipPool {
 
         let src_start_position = start_time_seconds * audio_file.sample_rate as f64;
 
+        // Tell the disk reader where we're reading so it buffers the right region.
+        if use_read_ahead {
+            read_ahead.unwrap().set_target_frame(src_start_position as u64);
+        }
+
         let mut rendered_frames = 0;
 
         if audio_file.sample_rate == engine_sample_rate {
diff --git a/daw-backend/src/command/types.rs b/daw-backend/src/command/types.rs
index 67cee46..38e080e 100644
--- a/daw-backend/src/command/types.rs
+++ b/daw-backend/src/command/types.rs
@@ -333,6 +333,14 @@ pub enum Query {
     AddAudioClipSync(TrackId, usize, f64, f64, f64),
     /// Add an audio file to the pool synchronously (path, data, channels, sample_rate) - returns pool index
     AddAudioFileSync(String, Vec<f32>, u32, u32),
+    /// Import an audio file synchronously (path) - returns pool index.
+    /// Does the same work as Command::ImportAudio (mmap for PCM, streaming
+    /// setup for compressed) but returns the real pool index in the response.
+    /// NOTE: briefly blocks the UI thread during file setup (sub-ms for PCM
+    /// mmap; a few ms for compressed streaming init). If this becomes a
+    /// problem for very large files, switch to async import with event-based
+    /// pool index reconciliation.
+    ImportAudioSync(std::path::PathBuf),
     /// Get raw audio samples from pool (pool_index) - returns (samples, sample_rate, channels)
     GetPoolAudioSamples(usize),
     /// Get a clone of the current project for serialization
@@ -404,6 +412,8 @@ pub enum QueryResponse {
     AudioClipInstanceAdded(Result<AudioClipInstanceId, String>),
     /// Audio file added to pool (returns pool index)
     AudioFileAddedSync(Result<usize, String>),
+    /// Audio file imported to pool (returns pool index)
+    AudioImportedSync(Result<usize, String>),
     /// Raw audio samples from pool (samples, sample_rate, channels)
     PoolAudioSamples(Result<(Vec<f32>, u32, u32), String>),
     /// Project retrieved
diff --git a/lightningbeam-ui/lightningbeam-editor/src/cqt_gpu.rs b/lightningbeam-ui/lightningbeam-editor/src/cqt_gpu.rs
new file mode 100644
index 0000000..427558a
--- /dev/null
+++ b/lightningbeam-ui/lightningbeam-editor/src/cqt_gpu.rs
@@ -0,0 +1,683 @@
+/// GPU-based Constant-Q Transform (CQT) spectrogram with streaming ring-buffer cache.
+///
+/// Replaces the old FFT spectrogram with a CQT that has logarithmic frequency spacing
+/// (bins map directly to MIDI notes). Only the visible viewport is computed, with results
+/// cached in a ring-buffer texture so scrolling only computes new columns.
+///
+/// Architecture:
+/// - CqtGpuResources stored in CallbackResources (long-lived, holds pipelines)
+/// - CqtCacheEntry per pool_index (cache texture, bin params, ring buffer state)
+/// - CqtCallback implements CallbackTrait (per-frame compute + render)
+/// - Compute shader reads audio from waveform mip-0 textures (already on GPU)
+/// - Render shader reads from cache texture with colormap
+
+use std::collections::HashMap;
+use wgpu::util::DeviceExt;
+
+use crate::waveform_gpu::WaveformGpuResources;
+
+/// CQT parameters
+const BINS_PER_OCTAVE: u32 = 24;
+const FREQ_BINS: u32 = 174; // ceil(log2(4186.0 / 27.5) * 24) = ceil(173.95)
+const HOP_SIZE: u32 = 512;
+const CACHE_CAPACITY: u32 = 4096;
+const MAX_COLS_PER_FRAME: u32 = 256;
+const F_MIN: f64 = 27.5; // A0 = MIDI 21
+const WAVEFORM_TEX_WIDTH: u32 = 2048;
+
+/// Per-bin CQT kernel parameters, uploaded as a storage buffer.
+/// Must match BinInfo in cqt_compute.wgsl.
+#[repr(C)]
+#[derive(Debug, Copy, Clone, bytemuck::Pod, bytemuck::Zeroable)]
+struct CqtBinParams {
+    window_length: u32,
+    phase_step: f32, // 2*pi*Q / N_k
+    _pad0: u32,
+    _pad1: u32,
+}
+
+/// Compute shader uniform params. Must match CqtParams in cqt_compute.wgsl.
+#[repr(C)]
+#[derive(Debug, Copy, Clone, bytemuck::Pod, bytemuck::Zeroable)]
+struct CqtComputeParams {
+    hop_size: u32,
+    freq_bins: u32,
+    cache_capacity: u32,
+    cache_write_offset: u32,
+    num_columns: u32,
+    column_start: u32,
+    tex_width: u32,
+    total_frames: u32,
+    sample_rate: f32,
+    _pad0: u32,
+    _pad1: u32,
+    _pad2: u32,
+}
+
+/// Render shader uniform params. Must match Params in cqt_render.wgsl exactly.
+/// Layout: clip_rect(16) + 18 × f32(72) + pad vec2(8) = 96 bytes
+#[repr(C)]
+#[derive(Debug, Copy, Clone, bytemuck::Pod, bytemuck::Zeroable)]
+pub struct CqtRenderParams {
+    pub clip_rect: [f32; 4],          // 16 bytes @ offset 0
+    pub viewport_start_time: f32,     // 4 @ 16
+    pub pixels_per_second: f32,       // 4 @ 20
+    pub audio_duration: f32,          // 4 @ 24
+    pub sample_rate: f32,             // 4 @ 28
+    pub clip_start_time: f32,         // 4 @ 32
+    pub trim_start: f32,              // 4 @ 36
+    pub freq_bins: f32,               // 4 @ 40
+    pub bins_per_octave: f32,         // 4 @ 44
+    pub hop_size: f32,                // 4 @ 48
+    pub scroll_y: f32,                // 4 @ 52
+    pub note_height: f32,             // 4 @ 56
+    pub min_note: f32,                // 4 @ 60
+    pub max_note: f32,                // 4 @ 64
+    pub gamma: f32,                   // 4 @ 68
+    pub cache_capacity: f32,          // 4 @ 72
+    pub cache_start_column: f32,      // 4 @ 76
+    pub cache_valid_start: f32,       // 4 @ 80
+    pub cache_valid_end: f32,         // 4 @ 84
+    pub _pad: [f32; 2],              // 8 @ 88, total 96
+}
+
+/// Per-pool-index cache entry with ring buffer and GPU resources.
+#[allow(dead_code)]
+struct CqtCacheEntry {
+    // Cache texture (Rgba16Float for universal filterable + storage support)
+    cache_texture: wgpu::Texture,
+    cache_texture_view: wgpu::TextureView,
+    cache_storage_view: wgpu::TextureView,
+    cache_capacity: u32,
+    freq_bins: u32,
+
+    // Ring buffer state
+    cache_start_column: i64,
+    cache_valid_start: i64,
+    cache_valid_end: i64,
+
+    // CQT kernel data
+    bin_params_buffer: wgpu::Buffer,
+
+    // Waveform texture reference (cloned from WaveformGpuEntry)
+    waveform_texture_view: wgpu::TextureView,
+    waveform_total_frames: u64,
+
+    // Bind groups
+    compute_bind_group: wgpu::BindGroup,
+    compute_uniform_buffer: wgpu::Buffer,
+    render_bind_group: wgpu::BindGroup,
+    render_uniform_buffer: wgpu::Buffer,
+
+    // Metadata
+    sample_rate: u32,
+}
+
+/// Global GPU resources for CQT (stored in egui_wgpu::CallbackResources).
+pub struct CqtGpuResources {
+    entries: HashMap<usize, CqtCacheEntry>,
+    compute_pipeline: wgpu::ComputePipeline,
+    compute_bind_group_layout: wgpu::BindGroupLayout,
+    render_pipeline: wgpu::RenderPipeline,
+    render_bind_group_layout: wgpu::BindGroupLayout,
+    sampler: wgpu::Sampler,
+}
+
+/// Per-frame callback for computing and rendering a CQT spectrogram.
+pub struct CqtCallback {
+    pub pool_index: usize,
+    pub params: CqtRenderParams,
+    pub target_format: wgpu::TextureFormat,
+    pub sample_rate: u32,
+    /// Visible column range (global CQT column indices)
+    pub visible_col_start: i64,
+    pub visible_col_end: i64,
+}
+
+/// Precompute CQT bin parameters for a given sample rate.
+fn precompute_bin_params(sample_rate: u32) -> Vec<CqtBinParams> {
+    let b = BINS_PER_OCTAVE as f64;
+    let q = 1.0 / (2.0_f64.powf(1.0 / b) - 1.0);
+
+    (0..FREQ_BINS)
+        .map(|k| {
+            let f_k = F_MIN * 2.0_f64.powf(k as f64 / b);
+            let n_k = (q * sample_rate as f64 / f_k).ceil() as u32;
+            let phase_step = (2.0 * std::f64::consts::PI * q / n_k as f64) as f32;
+            CqtBinParams {
+                window_length: n_k,
+                phase_step,
+                _pad0: 0,
+                _pad1: 0,
+            }
+        })
+        .collect()
+}
+
+impl CqtGpuResources {
+    pub fn new(device: &wgpu::Device, target_format: wgpu::TextureFormat) -> Self {
+        // Compute shader
+        let compute_shader = device.create_shader_module(wgpu::ShaderModuleDescriptor {
+            label: Some("cqt_compute_shader"),
+            source: wgpu::ShaderSource::Wgsl(
+                include_str!("panes/shaders/cqt_compute.wgsl").into(),
+            ),
+        });
+
+        // Render shader
+        let render_shader = device.create_shader_module(wgpu::ShaderModuleDescriptor {
+            label: Some("cqt_render_shader"),
+            source: wgpu::ShaderSource::Wgsl(
+                include_str!("panes/shaders/cqt_render.wgsl").into(),
+            ),
+        });
+
+        // Compute bind group layout:
+        //   0: audio_tex (texture_2d<f32>, read)
+        //   1: cqt_out (texture_storage_2d<rgba16float, write>)
+        //   2: params (uniform)
+        //   3: bins (storage, read)
+        let compute_bind_group_layout =
+            device.create_bind_group_layout(&wgpu::BindGroupLayoutDescriptor {
+                label: Some("cqt_compute_bgl"),
+                entries: &[
+                    wgpu::BindGroupLayoutEntry {
+                        binding: 0,
+                        visibility: wgpu::ShaderStages::COMPUTE,
+                        ty: wgpu::BindingType::Texture {
+                            sample_type: wgpu::TextureSampleType::Float { filterable: false },
+                            view_dimension: wgpu::TextureViewDimension::D2,
+                            multisampled: false,
+                        },
+                        count: None,
+                    },
+                    wgpu::BindGroupLayoutEntry {
+                        binding: 1,
+                        visibility: wgpu::ShaderStages::COMPUTE,
+                        ty: wgpu::BindingType::StorageTexture {
+                            access: wgpu::StorageTextureAccess::WriteOnly,
+                            format: wgpu::TextureFormat::Rgba16Float,
+                            view_dimension: wgpu::TextureViewDimension::D2,
+                        },
+                        count: None,
+                    },
+                    wgpu::BindGroupLayoutEntry {
+                        binding: 2,
+                        visibility: wgpu::ShaderStages::COMPUTE,
+                        ty: wgpu::BindingType::Buffer {
+                            ty: wgpu::BufferBindingType::Uniform,
+                            has_dynamic_offset: false,
+                            min_binding_size: None,
+                        },
+                        count: None,
+                    },
+                    wgpu::BindGroupLayoutEntry {
+                        binding: 3,
+                        visibility: wgpu::ShaderStages::COMPUTE,
+                        ty: wgpu::BindingType::Buffer {
+                            ty: wgpu::BufferBindingType::Storage { read_only: true },
+                            has_dynamic_offset: false,
+                            min_binding_size: None,
+                        },
+                        count: None,
+                    },
+                ],
+            });
+
+        // Render bind group layout: cache_tex + sampler + uniforms
+        let render_bind_group_layout =
+            device.create_bind_group_layout(&wgpu::BindGroupLayoutDescriptor {
+                label: Some("cqt_render_bgl"),
+                entries: &[
+                    wgpu::BindGroupLayoutEntry {
+                        binding: 0,
+                        visibility: wgpu::ShaderStages::FRAGMENT,
+                        ty: wgpu::BindingType::Texture {
+                            sample_type: wgpu::TextureSampleType::Float { filterable: true },
+                            view_dimension: wgpu::TextureViewDimension::D2,
+                            multisampled: false,
+                        },
+                        count: None,
+                    },
+                    wgpu::BindGroupLayoutEntry {
+                        binding: 1,
+                        visibility: wgpu::ShaderStages::FRAGMENT,
+                        ty: wgpu::BindingType::Sampler(wgpu::SamplerBindingType::Filtering),
+                        count: None,
+                    },
+                    wgpu::BindGroupLayoutEntry {
+                        binding: 2,
+                        visibility: wgpu::ShaderStages::FRAGMENT,
+                        ty: wgpu::BindingType::Buffer {
+                            ty: wgpu::BufferBindingType::Uniform,
+                            has_dynamic_offset: false,
+                            min_binding_size: None,
+                        },
+                        count: None,
+                    },
+                ],
+            });
+
+        // Compute pipeline
+        let compute_pipeline_layout =
+            device.create_pipeline_layout(&wgpu::PipelineLayoutDescriptor {
+                label: Some("cqt_compute_pipeline_layout"),
+                bind_group_layouts: &[&compute_bind_group_layout],
+                push_constant_ranges: &[],
+            });
+
+        let compute_pipeline =
+            device.create_compute_pipeline(&wgpu::ComputePipelineDescriptor {
+                label: Some("cqt_compute_pipeline"),
+                layout: Some(&compute_pipeline_layout),
+                module: &compute_shader,
+                entry_point: Some("main"),
+                compilation_options: Default::default(),
+                cache: None,
+            });
+
+        // Render pipeline
+        let render_pipeline_layout =
+            device.create_pipeline_layout(&wgpu::PipelineLayoutDescriptor {
+                label: Some("cqt_render_pipeline_layout"),
+                bind_group_layouts: &[&render_bind_group_layout],
+                push_constant_ranges: &[],
+            });
+
+        let render_pipeline = device.create_render_pipeline(&wgpu::RenderPipelineDescriptor {
+            label: Some("cqt_render_pipeline"),
+            layout: Some(&render_pipeline_layout),
+            vertex: wgpu::VertexState {
+                module: &render_shader,
+                entry_point: Some("vs_main"),
+                buffers: &[],
+                compilation_options: Default::default(),
+            },
+            fragment: Some(wgpu::FragmentState {
+                module: &render_shader,
+                entry_point: Some("fs_main"),
+                targets: &[Some(wgpu::ColorTargetState {
+                    format: target_format,
+                    blend: Some(wgpu::BlendState::ALPHA_BLENDING),
+                    write_mask: wgpu::ColorWrites::ALL,
+                })],
+                compilation_options: Default::default(),
+            }),
+            primitive: wgpu::PrimitiveState {
+                topology: wgpu::PrimitiveTopology::TriangleList,
+                ..Default::default()
+            },
+            depth_stencil: None,
+            multisample: wgpu::MultisampleState::default(),
+            multiview: None,
+            cache: None,
+        });
+
+        // Bilinear sampler for smooth interpolation in render shader
+        let sampler = device.create_sampler(&wgpu::SamplerDescriptor {
+            label: Some("cqt_sampler"),
+            mag_filter: wgpu::FilterMode::Linear,
+            min_filter: wgpu::FilterMode::Linear,
+            mipmap_filter: wgpu::FilterMode::Nearest,
+            ..Default::default()
+        });
+
+        Self {
+            entries: HashMap::new(),
+            compute_pipeline,
+            compute_bind_group_layout,
+            render_pipeline,
+            render_bind_group_layout,
+            sampler,
+        }
+    }
+
+    /// Create a cache entry for a pool index, referencing the waveform texture.
+    fn ensure_cache_entry(
+        &mut self,
+        device: &wgpu::Device,
+        pool_index: usize,
+        waveform_texture_view: wgpu::TextureView,
+        total_frames: u64,
+        sample_rate: u32,
+    ) {
+        if self.entries.contains_key(&pool_index) {
+            return;
+        }
+
+        // Create cache texture (ring buffer)
+        let cache_texture = device.create_texture(&wgpu::TextureDescriptor {
+            label: Some(&format!("cqt_cache_{}", pool_index)),
+            size: wgpu::Extent3d {
+                width: CACHE_CAPACITY,
+                height: FREQ_BINS,
+                depth_or_array_layers: 1,
+            },
+            mip_level_count: 1,
+            sample_count: 1,
+            dimension: wgpu::TextureDimension::D2,
+            format: wgpu::TextureFormat::Rgba16Float,
+            usage: wgpu::TextureUsages::STORAGE_BINDING | wgpu::TextureUsages::TEXTURE_BINDING,
+            view_formats: &[],
+        });
+
+        let cache_texture_view = cache_texture.create_view(&wgpu::TextureViewDescriptor {
+            label: Some(&format!("cqt_cache_{}_view", pool_index)),
+            ..Default::default()
+        });
+
+        let cache_storage_view = cache_texture.create_view(&wgpu::TextureViewDescriptor {
+            label: Some(&format!("cqt_cache_{}_storage", pool_index)),
+            ..Default::default()
+        });
+
+        // Precompute bin params
+        let bin_params = precompute_bin_params(sample_rate);
+        let bin_params_buffer = device.create_buffer_init(&wgpu::util::BufferInitDescriptor {
+            label: Some(&format!("cqt_bins_{}", pool_index)),
+            contents: bytemuck::cast_slice(&bin_params),
+            usage: wgpu::BufferUsages::STORAGE,
+        });
+
+        // Compute uniform buffer
+        let compute_uniform_buffer = device.create_buffer(&wgpu::BufferDescriptor {
+            label: Some(&format!("cqt_compute_uniforms_{}", pool_index)),
+            size: std::mem::size_of::<CqtComputeParams>() as u64,
+            usage: wgpu::BufferUsages::UNIFORM | wgpu::BufferUsages::COPY_DST,
+            mapped_at_creation: false,
+        });
+
+        // Render uniform buffer
+        let render_uniform_buffer = device.create_buffer(&wgpu::BufferDescriptor {
+            label: Some(&format!("cqt_render_uniforms_{}", pool_index)),
+            size: std::mem::size_of::<CqtRenderParams>() as u64,
+            usage: wgpu::BufferUsages::UNIFORM | wgpu::BufferUsages::COPY_DST,
+            mapped_at_creation: false,
+        });
+
+        // Compute bind group
+        let compute_bind_group = device.create_bind_group(&wgpu::BindGroupDescriptor {
+            label: Some(&format!("cqt_compute_bg_{}", pool_index)),
+            layout: &self.compute_bind_group_layout,
+            entries: &[
+                wgpu::BindGroupEntry {
+                    binding: 0,
+                    resource: wgpu::BindingResource::TextureView(&waveform_texture_view),
+                },
+                wgpu::BindGroupEntry {
+                    binding: 1,
+                    resource: wgpu::BindingResource::TextureView(&cache_storage_view),
+                },
+                wgpu::BindGroupEntry {
+                    binding: 2,
+                    resource: compute_uniform_buffer.as_entire_binding(),
+                },
+                wgpu::BindGroupEntry {
+                    binding: 3,
+                    resource: bin_params_buffer.as_entire_binding(),
+                },
+            ],
+        });
+
+        // Render bind group
+        let render_bind_group = device.create_bind_group(&wgpu::BindGroupDescriptor {
+            label: Some(&format!("cqt_render_bg_{}", pool_index)),
+            layout: &self.render_bind_group_layout,
+            entries: &[
+                wgpu::BindGroupEntry {
+                    binding: 0,
+                    resource: wgpu::BindingResource::TextureView(&cache_texture_view),
+                },
+                wgpu::BindGroupEntry {
+                    binding: 1,
+                    resource: wgpu::BindingResource::Sampler(&self.sampler),
+                },
+                wgpu::BindGroupEntry {
+                    binding: 2,
+                    resource: render_uniform_buffer.as_entire_binding(),
+                },
+            ],
+        });
+
+        self.entries.insert(
+            pool_index,
+            CqtCacheEntry {
+                cache_texture,
+                cache_texture_view,
+                cache_storage_view,
+                cache_capacity: CACHE_CAPACITY,
+                freq_bins: FREQ_BINS,
+                cache_start_column: 0,
+                cache_valid_start: 0,
+                cache_valid_end: 0,
+                bin_params_buffer,
+                waveform_texture_view,
+                waveform_total_frames: total_frames,
+                compute_bind_group,
+                compute_uniform_buffer,
+                render_bind_group,
+                render_uniform_buffer,
+                sample_rate,
+            },
+        );
+    }
+
+}
+
+/// Dispatch compute shader to fill CQT columns in the cache.
+/// Free function to avoid borrow conflicts with CqtGpuResources.entries.
+fn dispatch_cqt_compute(
+    device: &wgpu::Device,
+    queue: &wgpu::Queue,
+    pipeline: &wgpu::ComputePipeline,
+    entry: &CqtCacheEntry,
+    start_col: i64,
+    end_col: i64,
+) -> Vec<wgpu::CommandBuffer> {
+    let num_cols = (end_col - start_col) as u32;
+    if num_cols == 0 {
+        return Vec::new();
+    }
+
+    // Clamp to max per frame
+    let num_cols = num_cols.min(MAX_COLS_PER_FRAME);
+
+    // Calculate ring buffer write offset
+    let cache_write_offset =
+        ((start_col - entry.cache_start_column) as u32) % entry.cache_capacity;
+
+    let params = CqtComputeParams {
+        hop_size: HOP_SIZE,
+        freq_bins: FREQ_BINS,
+        cache_capacity: entry.cache_capacity,
+        cache_write_offset,
+        num_columns: num_cols,
+        column_start: start_col.max(0) as u32,
+        tex_width: WAVEFORM_TEX_WIDTH,
+        total_frames: entry.waveform_total_frames as u32,
+        sample_rate: entry.sample_rate as f32,
+        _pad0: 0,
+        _pad1: 0,
+        _pad2: 0,
+    };
+
+    queue.write_buffer(
+        &entry.compute_uniform_buffer,
+        0,
+        bytemuck::cast_slice(&[params]),
+    );
+
+    let mut encoder = device.create_command_encoder(&wgpu::CommandEncoderDescriptor {
+        label: Some("cqt_compute_encoder"),
+    });
+
+    {
+        let mut pass = encoder.begin_compute_pass(&wgpu::ComputePassDescriptor {
+            label: Some("cqt_compute_pass"),
+            timestamp_writes: None,
+        });
+        pass.set_pipeline(pipeline);
+        pass.set_bind_group(0, &entry.compute_bind_group, &[]);
+
+        // Dispatch: X = ceil(freq_bins / 64), Y = num_columns
+        let workgroups_x = (FREQ_BINS + 63) / 64;
+        pass.dispatch_workgroups(workgroups_x, num_cols, 1);
+    }
+
+    vec![encoder.finish()]
+}
+
+impl egui_wgpu::CallbackTrait for CqtCallback {
+    fn prepare(
+        &self,
+        device: &wgpu::Device,
+        queue: &wgpu::Queue,
+        _screen_descriptor: &egui_wgpu::ScreenDescriptor,
+        _egui_encoder: &mut wgpu::CommandEncoder,
+        resources: &mut egui_wgpu::CallbackResources,
+    ) -> Vec<wgpu::CommandBuffer> {
+        // Initialize CQT resources if needed
+        if !resources.contains::<CqtGpuResources>() {
+            resources.insert(CqtGpuResources::new(device, self.target_format));
+        }
+
+        // First, check if waveform data is available and extract what we need
+        let waveform_info: Option<(wgpu::TextureView, u64)> = {
+            let waveform_gpu: Option<&WaveformGpuResources> = resources.get();
+            waveform_gpu.and_then(|wgpu_res| {
+                wgpu_res.entries.get(&self.pool_index).map(|entry| {
+                    // Clone the texture view (Arc internally, cheap)
+                    (entry.texture_views[0].clone(), entry.total_frames)
+                })
+            })
+        };
+
+        let (waveform_view, total_frames) = match waveform_info {
+            Some(info) => info,
+            None => return Vec::new(), // Waveform not uploaded yet
+        };
+
+        let cqt_gpu: &mut CqtGpuResources = resources.get_mut().unwrap();
+
+        // Ensure cache entry exists
+        cqt_gpu.ensure_cache_entry(
+            device,
+            self.pool_index,
+            waveform_view,
+            total_frames,
+            self.sample_rate,
+        );
+
+        // Determine which columns need computing
+        let vis_start = self.visible_col_start.max(0);
+        let max_col = (total_frames as i64) / HOP_SIZE as i64;
+        let vis_end = self.visible_col_end.min(max_col);
+
+        // Read current cache state, compute what's needed, then update state.
+        // We split borrows carefully: read entry state, compute, then write back.
+        let cmds;
+        {
+            let entry = cqt_gpu.entries.get(&self.pool_index).unwrap();
+            let cache_valid_start = entry.cache_valid_start;
+            let cache_valid_end = entry.cache_valid_end;
+
+            if vis_start >= vis_end {
+                cmds = Vec::new();
+            } else if vis_start >= cache_valid_start && vis_end <= cache_valid_end {
+                // Fully cached
+                cmds = Vec::new();
+            } else if vis_start >= cache_valid_start
+                && vis_start < cache_valid_end
+                && vis_end > cache_valid_end
+            {
+                // Scrolling right
+                let actual_end =
+                    cache_valid_end + (vis_end - cache_valid_end).min(MAX_COLS_PER_FRAME as i64);
+                cmds = dispatch_cqt_compute(
+                    device, queue, &cqt_gpu.compute_pipeline, entry,
+                    cache_valid_end, actual_end,
+                );
+                let entry = cqt_gpu.entries.get_mut(&self.pool_index).unwrap();
+                entry.cache_valid_end = actual_end;
+                if entry.cache_valid_end - entry.cache_valid_start > entry.cache_capacity as i64 {
+                    entry.cache_valid_start = entry.cache_valid_end - entry.cache_capacity as i64;
+                    entry.cache_start_column = entry.cache_valid_start;
+                }
+            } else if vis_end <= cache_valid_end
+                && vis_end > cache_valid_start
+                && vis_start < cache_valid_start
+            {
+                // Scrolling left
+                let actual_start =
+                    cache_valid_start - (cache_valid_start - vis_start).min(MAX_COLS_PER_FRAME as i64);
+                cmds = dispatch_cqt_compute(
+                    device, queue, &cqt_gpu.compute_pipeline, entry,
+                    actual_start, cache_valid_start,
+                );
+                let entry = cqt_gpu.entries.get_mut(&self.pool_index).unwrap();
+                entry.cache_valid_start = actual_start;
+                entry.cache_start_column = actual_start;
+                if entry.cache_valid_end - entry.cache_valid_start > entry.cache_capacity as i64 {
+                    entry.cache_valid_end = entry.cache_valid_start + entry.cache_capacity as i64;
+                }
+            } else {
+                // No overlap or first compute — reset cache
+                let entry = cqt_gpu.entries.get_mut(&self.pool_index).unwrap();
+                entry.cache_start_column = vis_start;
+                entry.cache_valid_start = vis_start;
+                entry.cache_valid_end = vis_start;
+
+                let compute_end = vis_start + (vis_end - vis_start).min(MAX_COLS_PER_FRAME as i64);
+                let entry = cqt_gpu.entries.get(&self.pool_index).unwrap();
+                cmds = dispatch_cqt_compute(
+                    device, queue, &cqt_gpu.compute_pipeline, entry,
+                    vis_start, compute_end,
+                );
+                let entry = cqt_gpu.entries.get_mut(&self.pool_index).unwrap();
+                entry.cache_valid_end = compute_end;
+            }
+        }
+
+        // Update render uniform buffer
+        let entry = cqt_gpu.entries.get(&self.pool_index).unwrap();
+        let mut params = self.params;
+        params.cache_start_column = entry.cache_start_column as f32;
+        params.cache_valid_start = entry.cache_valid_start as f32;
+        params.cache_valid_end = entry.cache_valid_end as f32;
+        params.cache_capacity = entry.cache_capacity as f32;
+
+        queue.write_buffer(
+            &entry.render_uniform_buffer,
+            0,
+            bytemuck::cast_slice(&[params]),
+        );
+
+        cmds
+    }
+
+    fn paint(
+        &self,
+        _info: eframe::egui::PaintCallbackInfo,
+        render_pass: &mut wgpu::RenderPass<'static>,
+        resources: &egui_wgpu::CallbackResources,
+    ) {
+        let cqt_gpu: &CqtGpuResources = match resources.get() {
+            Some(r) => r,
+            None => return,
+        };
+
+        let entry = match cqt_gpu.entries.get(&self.pool_index) {
+            Some(e) => e,
+            None => return,
+        };
+
+        // Don't render if nothing is cached yet
+        if entry.cache_valid_start >= entry.cache_valid_end {
+            return;
+        }
+
+        render_pass.set_pipeline(&cqt_gpu.render_pipeline);
+        render_pass.set_bind_group(0, &entry.render_bind_group, &[]);
+        render_pass.draw(0..3, 0..1);
+    }
+}
diff --git a/lightningbeam-ui/lightningbeam-editor/src/main.rs b/lightningbeam-ui/lightningbeam-editor/src/main.rs
index 8d34909..d82cfed 100644
--- a/lightningbeam-ui/lightningbeam-editor/src/main.rs
+++ b/lightningbeam-ui/lightningbeam-editor/src/main.rs
@@ -20,8 +20,7 @@ mod theme;
 use theme::{Theme, ThemeMode};
 
 mod waveform_gpu;
-mod spectrogram_gpu;
-mod spectrogram_compute;
+mod cqt_gpu;
 
 mod config;
 use config::AppConfig;
@@ -2382,16 +2381,20 @@ impl EditorApp {
         let sample_rate = metadata.sample_rate;
 
         if let Some(ref controller_arc) = self.audio_controller {
-            // Predict the pool index (engine assigns sequentially)
-            let pool_index = self.action_executor.document().audio_clips.len();
-
-            // Send async import command (non-blocking)
-            {
+            // Import synchronously to get the real pool index from the engine.
+            // NOTE: briefly blocks the UI thread (sub-ms for PCM mmap; a few ms
+            // for compressed streaming init).
+            let pool_index = {
                 let mut controller = controller_arc.lock().unwrap();
-                controller.import_audio(path.to_path_buf());
-            }
+                match controller.import_audio_sync(path.to_path_buf()) {
+                    Ok(idx) => idx,
+                    Err(e) => {
+                        eprintln!("Failed to import audio '{}': {}", path.display(), e);
+                        return None;
+                    }
+                }
+            };
 
-            // Create audio clip in document immediately (metadata is enough)
             let clip = AudioClip::new_sampled(&name, pool_index, duration);
             let clip_id = self.action_executor.document_mut().add_audio_clip(clip);
 
diff --git a/lightningbeam-ui/lightningbeam-editor/src/panes/piano_roll.rs b/lightningbeam-ui/lightningbeam-editor/src/panes/piano_roll.rs
index a9fa000..c96dd33 100644
--- a/lightningbeam-ui/lightningbeam-editor/src/panes/piano_roll.rs
+++ b/lightningbeam-ui/lightningbeam-editor/src/panes/piano_roll.rs
@@ -92,10 +92,6 @@ pub struct PianoRollPane {
     // Resolved note cache — tracks when to invalidate
     cached_clip_id: Option<u32>,
 
-    // Spectrogram cache — keyed by audio pool index
-    // Stores pre-computed SpectrogramUpload data ready for GPU
-    spectrogram_computed: HashMap<usize, crate::spectrogram_gpu::SpectrogramUpload>,
-
     // Spectrogram gamma (power curve for colormap)
     spectrogram_gamma: f32,
 }
@@ -126,8 +122,7 @@ impl PianoRollPane {
             auto_scroll_enabled: true,
             user_scrolled_since_play: false,
             cached_clip_id: None,
-            spectrogram_computed: HashMap::new(),
-            spectrogram_gamma: 5.0,
+            spectrogram_gamma: 0.8,
         }
     }
 
@@ -1256,80 +1251,51 @@ impl PianoRollPane {
             }
         }
 
-        let screen_size = ui.ctx().input(|i| i.content_rect().size());
-
-        // Render spectrogram for each sampled clip on this layer
+        // Render CQT spectrogram for each sampled clip on this layer
         for &(pool_index, timeline_start, trim_start, _duration, sample_rate) in &clip_infos {
-            // Compute spectrogram if not cached
-            let needs_compute = !self.spectrogram_computed.contains_key(&pool_index);
-            let pending_upload = if needs_compute {
-                if let Some((samples, sr, ch)) = shared.raw_audio_cache.get(&pool_index) {
-                    let spec_data = crate::spectrogram_compute::compute_spectrogram(
-                        samples, *sr, *ch, 2048, 512,
-                    );
-                    if spec_data.time_bins > 0 {
-                        let upload = crate::spectrogram_gpu::SpectrogramUpload {
-                            magnitudes: spec_data.magnitudes,
-                            time_bins: spec_data.time_bins as u32,
-                            freq_bins: spec_data.freq_bins as u32,
-                            sample_rate: spec_data.sample_rate,
-                            hop_size: spec_data.hop_size as u32,
-                            fft_size: spec_data.fft_size as u32,
-                            duration: spec_data.duration as f32,
-                        };
-                        // Store a marker so we don't recompute
-                        self.spectrogram_computed.insert(pool_index, crate::spectrogram_gpu::SpectrogramUpload {
-                            magnitudes: Vec::new(), // We don't need to keep the data around
-                            time_bins: upload.time_bins,
-                            freq_bins: upload.freq_bins,
-                            sample_rate: upload.sample_rate,
-                            hop_size: upload.hop_size,
-                            fft_size: upload.fft_size,
-                            duration: upload.duration,
-                        });
-                        Some(upload)
-                    } else {
-                        None
-                    }
-                } else {
-                    None
-                }
+            // Get audio duration from the raw audio cache
+            let audio_duration = if let Some((samples, sr, ch)) = shared.raw_audio_cache.get(&pool_index) {
+                samples.len() as f64 / (*sr as f64 * *ch as f64)
             } else {
-                None
-            };
-
-            // Get cached spectrogram metadata for params
-            let spec_meta = self.spectrogram_computed.get(&pool_index);
-            let (time_bins, freq_bins, hop_size, fft_size, audio_duration) = match spec_meta {
-                Some(m) => (m.time_bins as f32, m.freq_bins as f32, m.hop_size as f32, m.fft_size as f32, m.duration),
-                None => continue,
+                continue;
             };
 
             if view_rect.width() > 0.0 && view_rect.height() > 0.0 {
-                let callback = crate::spectrogram_gpu::SpectrogramCallback {
+                // Calculate visible CQT column range for streaming
+                let viewport_end_time = self.viewport_start_time + (view_rect.width() / self.pixels_per_second) as f64;
+                let vis_audio_start = (self.viewport_start_time - timeline_start + trim_start).max(0.0);
+                let vis_audio_end = (viewport_end_time - timeline_start + trim_start).min(audio_duration);
+                let vis_col_start = (vis_audio_start * sample_rate as f64 / 512.0).floor() as i64;
+                let vis_col_end = (vis_audio_end * sample_rate as f64 / 512.0).ceil() as i64 + 1;
+
+                let callback = crate::cqt_gpu::CqtCallback {
                     pool_index,
-                    params: crate::spectrogram_gpu::SpectrogramParams {
+                    params: crate::cqt_gpu::CqtRenderParams {
                         clip_rect: [view_rect.min.x, view_rect.min.y, view_rect.max.x, view_rect.max.y],
                         viewport_start_time: self.viewport_start_time as f32,
                         pixels_per_second: self.pixels_per_second,
-                        audio_duration,
+                        audio_duration: audio_duration as f32,
                         sample_rate: sample_rate as f32,
                         clip_start_time: timeline_start as f32,
                         trim_start: trim_start as f32,
-                        time_bins,
-                        freq_bins,
-                        hop_size,
-                        fft_size,
+                        freq_bins: 174.0,
+                        bins_per_octave: 24.0,
+                        hop_size: 512.0,
                         scroll_y: self.scroll_y,
                         note_height: self.note_height,
-                        screen_size: [screen_size.x, screen_size.y],
                         min_note: MIN_NOTE as f32,
                         max_note: MAX_NOTE as f32,
                         gamma: self.spectrogram_gamma,
-                        _pad: [0.0; 3],
+                        cache_capacity: 0.0, // filled by prepare()
+                        cache_start_column: 0.0,
+                        cache_valid_start: 0.0,
+                        cache_valid_end: 0.0,
+                        _pad: [0.0; 2],
                     },
                     target_format: shared.target_format,
-                    pending_upload,
+                    sample_rate,
+                    visible_col_start: vis_col_start,
+                    visible_col_end: vis_col_end,
                 };
 
                 ui.painter().add(egui_wgpu::Callback::new_paint_callback(
diff --git a/lightningbeam-ui/lightningbeam-editor/src/panes/shaders/cqt_compute.wgsl b/lightningbeam-ui/lightningbeam-editor/src/panes/shaders/cqt_compute.wgsl
new file mode 100644
index 0000000..fd80e4c
--- /dev/null
+++ b/lightningbeam-ui/lightningbeam-editor/src/panes/shaders/cqt_compute.wgsl
@@ -0,0 +1,101 @@
+// GPU Constant-Q Transform (CQT) compute shader.
+//
+// Reads raw audio samples from a waveform mip-0 texture (Rgba16Float, packed
+// row-major at TEX_WIDTH=2048) and computes CQT magnitude for each
+// (freq_bin, time_column) pair, writing normalized dB values into a ring-buffer
+// cache texture (R32Float, width=cache_capacity, height=freq_bins).
+//
+// Dispatch: (ceil(freq_bins / 64), num_columns, 1)
+// Each thread handles one frequency bin for one time column.
+
+struct CqtParams {
+    hop_size: u32,
+    freq_bins: u32,
+    cache_capacity: u32,
+    cache_write_offset: u32,  // ring buffer position to start writing
+    num_columns: u32,         // how many columns in this dispatch
+    column_start: u32,        // global CQT column index of first column
+    tex_width: u32,           // waveform texture width (2048)
+    total_frames: u32,        // total audio frames in waveform texture
+    sample_rate: f32,
+    _pad0: u32,
+    _pad1: u32,
+    _pad2: u32,
+}
+
+struct BinInfo {
+    window_length: u32,
+    phase_step: f32, // 2*pi*Q / N_k
+    _pad0: u32,
+    _pad1: u32,
+}
+
+@group(0) @binding(0) var audio_tex: texture_2d<f32>;
+@group(0) @binding(1) var cqt_out: texture_storage_2d<rgba16float, write>;
+@group(0) @binding(2) var<uniform> params: CqtParams;
+@group(0) @binding(3) var<storage, read> bins: array<BinInfo>;
+
+const PI2: f32 = 6.283185307;
+
+@compute @workgroup_size(64)
+fn main(@builtin(global_invocation_id) gid: vec3<u32>) {
+    let bin_k = gid.x;
+    let col_rel = gid.y; // relative to this dispatch batch
+
+    if bin_k >= params.freq_bins || col_rel >= params.num_columns {
+        return;
+    }
+
+    let global_col = params.column_start + col_rel;
+    let sample_start = global_col * params.hop_size;
+
+    let info = bins[bin_k];
+    let n_k = info.window_length;
+
+    // Center the analysis window: offset by half the window length so the
+    // column timestamp refers to the center of the window, not the start.
+    // This gives better time alignment, especially for low-frequency bins
+    // that have very long windows.
+    let half_win = n_k / 2u;
+
+    // Accumulate complex inner product: sum of x[n] * w[n] * exp(-i * phase_step * n)
+    var sum_re: f32 = 0.0;
+    var sum_im: f32 = 0.0;
+
+    for (var n = 0u; n < n_k; n++) {
+        // Center the window around the hop position
+        let raw_idx = i32(sample_start) + i32(n) - i32(half_win);
+        if raw_idx < 0 || u32(raw_idx) >= params.total_frames {
+            continue;
+        }
+        let sample_idx = u32(raw_idx);
+
+        // Read audio sample from 2D waveform texture (mip 0)
+        // At mip 0: R=G=left, B=A=right; average to mono
+        let tx = sample_idx % params.tex_width;
+        let ty = sample_idx / params.tex_width;
+        let texel = textureLoad(audio_tex, vec2<i32>(i32(tx), i32(ty)), 0);
+        let sample_val = (texel.r + texel.b) * 0.5;
+
+        // Hann window computed analytically
+        let window = 0.5 * (1.0 - cos(PI2 * f32(n) / f32(n_k)));
+
+        // Complex exponential: exp(-i * phase_step * n)
+        let angle = info.phase_step * f32(n);
+        let windowed = sample_val * window;
+        sum_re += windowed * cos(angle);
+        sum_im -= windowed * sin(angle);
+    }
+
+    // Magnitude, normalized by window length
+    let mag = sqrt(sum_re * sum_re + sum_im * sum_im) / f32(n_k);
+
+    // Convert to dB, map -80dB..0dB -> 0.0..1.0
+    // WGSL log() is natural log, so log10(x) = log(x) / log(10)
+    let db = 20.0 * log(mag + 1e-10) / 2.302585093;
+    let normalized = clamp((db + 80.0) / 80.0, 0.0, 1.0);
+
+    // Write to ring buffer cache texture
+    let cache_x = (params.cache_write_offset + col_rel) % params.cache_capacity;
+    textureStore(cqt_out, vec2<i32>(i32(cache_x), i32(bin_k)), vec4(normalized, 0.0, 0.0, 1.0));
+}
diff --git a/lightningbeam-ui/lightningbeam-editor/src/panes/shaders/spectrogram.wgsl b/lightningbeam-ui/lightningbeam-editor/src/panes/shaders/cqt_render.wgsl
similarity index 58%
rename from lightningbeam-ui/lightningbeam-editor/src/panes/shaders/spectrogram.wgsl
rename to lightningbeam-ui/lightningbeam-editor/src/panes/shaders/cqt_render.wgsl
index 62252c4..02266a4 100644
--- a/lightningbeam-ui/lightningbeam-editor/src/panes/shaders/spectrogram.wgsl
+++ b/lightningbeam-ui/lightningbeam-editor/src/panes/shaders/cqt_render.wgsl
@@ -1,30 +1,37 @@
-// Spectrogram rendering shader for FFT magnitude data.
-// Texture layout: X = frequency bin, Y = time bin
-// Values: normalized magnitude (0.0 = silence, 1.0 = peak)
-// Vertical axis maps MIDI notes to frequency bins (matching piano roll)
+// CQT spectrogram render shader.
+//
+// Reads from a ring-buffer cache texture (Rgba16Float) where:
+//   X = time column (ring buffer index), Y = CQT frequency bin
+// CQT bins map directly to MIDI notes via: bin = (note - min_note) * bins_per_octave / 12
+//
+// Applies the same colormap as the old FFT spectrogram.
 
+// Must match CqtRenderParams in cqt_gpu.rs exactly (96 bytes).
 struct Params {
-    clip_rect: vec4<f32>,
-    viewport_start_time: f32,
-    pixels_per_second: f32,
-    audio_duration: f32,
-    sample_rate: f32,
-    clip_start_time: f32,
-    trim_start: f32,
-    time_bins: f32,
-    freq_bins: f32,
-    hop_size: f32,
-    fft_size: f32,
-    scroll_y: f32,
-    note_height: f32,
-    screen_size: vec2<f32>,
-    min_note: f32,
-    max_note: f32,
-    gamma: f32,
+    clip_rect: vec4<f32>,         // 16 @ 0
+    viewport_start_time: f32,     // 4 @ 16
+    pixels_per_second: f32,       // 4 @ 20
+    audio_duration: f32,          // 4 @ 24
+    sample_rate: f32,             // 4 @ 28
+    clip_start_time: f32,         // 4 @ 32
+    trim_start: f32,              // 4 @ 36
+    freq_bins: f32,               // 4 @ 40
+    bins_per_octave: f32,         // 4 @ 44
+    hop_size: f32,                // 4 @ 48
+    scroll_y: f32,                // 4 @ 52
+    note_height: f32,             // 4 @ 56
+    min_note: f32,                // 4 @ 60
+    max_note: f32,                // 4 @ 64
+    gamma: f32,                   // 4 @ 68
+    cache_capacity: f32,          // 4 @ 72
+    cache_start_column: f32,      // 4 @ 76
+    cache_valid_start: f32,       // 4 @ 80
+    cache_valid_end: f32,         // 4 @ 84
+    _pad: vec2<f32>,              // 8 @ 88, total 96
 }
 
-@group(0) @binding(0) var spec_tex: texture_2d<f32>;
-@group(0) @binding(1) var spec_sampler: sampler;
+@group(0) @binding(0) var cache_tex: texture_2d<f32>;
+@group(0) @binding(1) var cache_sampler: sampler;
 @group(0) @binding(2) var<uniform> params: Params;
 
 struct VertexOutput {
@@ -42,7 +49,6 @@ fn vs_main(@builtin(vertex_index) vi: u32) -> VertexOutput {
     return out;
 }
 
-// Signed distance from point to rounded rectangle boundary
 fn rounded_rect_sdf(pos: vec2<f32>, rect_min: vec2<f32>, rect_max: vec2<f32>, r: f32) -> f32 {
     let center = (rect_min + rect_max) * 0.5;
     let half_size = (rect_max - rect_min) * 0.5;
@@ -55,27 +61,21 @@ fn colormap(v: f32, gamma: f32) -> vec4<f32> {
     let t = pow(clamp(v, 0.0, 1.0), gamma);
 
     if t < 1.0 / 6.0 {
-        // Black -> blue
         let s = t * 6.0;
         return vec4(0.0, 0.0, s, 1.0);
     } else if t < 2.0 / 6.0 {
-        // Blue -> purple
         let s = (t - 1.0 / 6.0) * 6.0;
         return vec4(s * 0.6, 0.0, 1.0 - s * 0.2, 1.0);
     } else if t < 3.0 / 6.0 {
-        // Purple -> red
         let s = (t - 2.0 / 6.0) * 6.0;
         return vec4(0.6 + s * 0.4, 0.0, 0.8 - s * 0.8, 1.0);
     } else if t < 4.0 / 6.0 {
-        // Red -> orange
         let s = (t - 3.0 / 6.0) * 6.0;
         return vec4(1.0, s * 0.5, 0.0, 1.0);
     } else if t < 5.0 / 6.0 {
-        // Orange -> yellow
         let s = (t - 4.0 / 6.0) * 6.0;
         return vec4(1.0, 0.5 + s * 0.5, 0.0, 1.0);
     } else {
-        // Yellow -> white
         let s = (t - 5.0 / 6.0) * 6.0;
         return vec4(1.0, 1.0, s, 1.0);
     }
@@ -98,11 +98,9 @@ fn fs_main(in: VertexOutput) -> @location(0) vec4<f32> {
     let content_top = params.clip_rect.y - params.scroll_y;
     let content_bottom = params.clip_rect.y + (params.max_note - params.min_note + 1.0) * params.note_height - params.scroll_y;
 
-    // Rounded corners: content edges on X, visible viewport edges on Y.
-    // This rounds left/right where the clip starts/ends, and top/bottom at the view boundary.
+    // Rounded corners
     let vis_top = max(content_top, params.clip_rect.y);
     let vis_bottom = min(content_bottom, params.clip_rect.w);
-
     let corner_radius = 6.0;
     let dist = rounded_rect_sdf(
         vec2(frag_x, frag_y),
@@ -114,7 +112,7 @@ fn fs_main(in: VertexOutput) -> @location(0) vec4<f32> {
         discard;
     }
 
-    // Fragment X -> audio time -> time bin
+    // Fragment X -> audio time -> global CQT column
     let timeline_time = params.viewport_start_time + (frag_x - params.clip_rect.x) / params.pixels_per_second;
     let audio_time = timeline_time - params.clip_start_time + params.trim_start;
 
@@ -122,32 +120,35 @@ fn fs_main(in: VertexOutput) -> @location(0) vec4<f32> {
         discard;
     }
 
-    let time_bin = audio_time * params.sample_rate / params.hop_size;
-    if time_bin < 0.0 || time_bin >= params.time_bins {
+    let global_col = audio_time * params.sample_rate / params.hop_size;
+
+    // Check if this column is in the cached range
+    if global_col < params.cache_valid_start || global_col >= params.cache_valid_end {
         discard;
     }
 
-    // Fragment Y -> MIDI note -> frequency -> frequency bin
+    // Fragment Y -> MIDI note -> CQT bin (direct mapping!)
     let note = params.max_note - ((frag_y - params.clip_rect.y + params.scroll_y) / params.note_height);
 
     if note < params.min_note || note > params.max_note {
         discard;
     }
 
-    // MIDI note -> frequency: freq = 440 * 2^((note - 69) / 12)
-    let freq = 440.0 * pow(2.0, (note - 69.0) / 12.0);
+    // CQT bin: each octave has bins_per_octave bins, starting from min_note
+    let bin = (note - params.min_note) * params.bins_per_octave / 12.0;
 
-    // Frequency -> FFT bin index
-    let freq_bin = freq * params.fft_size / params.sample_rate;
-
-    if freq_bin < 0.0 || freq_bin >= params.freq_bins {
+    if bin < 0.0 || bin >= params.freq_bins {
         discard;
     }
 
-    // Sample texture with bilinear filtering
-    let u = freq_bin / params.freq_bins;
-    let v = time_bin / params.time_bins;
-    let magnitude = textureSampleLevel(spec_tex, spec_sampler, vec2(u, v), 0.0).r;
+    // Map global column to ring buffer position
+    let ring_pos = global_col - params.cache_start_column;
+    let cache_x = ring_pos % params.cache_capacity;
+
+    // Sample cache texture with bilinear filtering
+    let u = (cache_x + 0.5) / params.cache_capacity;
+    let v = (bin + 0.5) / params.freq_bins;
+    let magnitude = textureSampleLevel(cache_tex, cache_sampler, vec2(u, v), 0.0).r;
 
     return colormap(magnitude, params.gamma);
 }
diff --git a/lightningbeam-ui/lightningbeam-editor/src/spectrogram_compute.rs b/lightningbeam-ui/lightningbeam-editor/src/spectrogram_compute.rs
deleted file mode 100644
index 28cb38d..0000000
--- a/lightningbeam-ui/lightningbeam-editor/src/spectrogram_compute.rs
+++ /dev/null
@@ -1,144 +0,0 @@
-/// CPU-side FFT computation for spectrogram visualization.
-///
-/// Uses rayon to parallelize FFT across time slices on all CPU cores.
-/// Produces a 2D magnitude grid (time bins x frequency bins) for GPU texture upload.
-
-use rayon::prelude::*;
-use std::f32::consts::PI;
-
-/// Pre-computed spectrogram data ready for GPU upload
-pub struct SpectrogramData {
-    /// Flattened 2D array of normalized magnitudes [time_bins * freq_bins], row-major
-    /// Each value is 0.0 (silence) to 1.0 (peak), log-scale normalized
-    pub magnitudes: Vec<f32>,
-    pub time_bins: usize,
-    pub freq_bins: usize,
-    pub sample_rate: u32,
-    pub hop_size: usize,
-    pub fft_size: usize,
-    pub duration: f64,
-}
-
-/// Compute a spectrogram from raw audio samples using parallel FFT.
-///
-/// Each time slice is processed independently via rayon, making this
-/// scale well across all CPU cores.
-pub fn compute_spectrogram(
-    samples: &[f32],
-    sample_rate: u32,
-    channels: u32,
-    fft_size: usize,
-    hop_size: usize,
-) -> SpectrogramData {
-    // Mix to mono
-    let mono: Vec<f32> = if channels >= 2 {
-        samples
-            .chunks(channels as usize)
-            .map(|frame| frame.iter().sum::<f32>() / channels as f32)
-            .collect()
-    } else {
-        samples.to_vec()
-    };
-
-    let freq_bins = fft_size / 2 + 1;
-    let duration = mono.len() as f64 / sample_rate as f64;
-
-    if mono.len() < fft_size {
-        return SpectrogramData {
-            magnitudes: Vec::new(),
-            time_bins: 0,
-            freq_bins,
-            sample_rate,
-            hop_size,
-            fft_size,
-            duration,
-        };
-    }
-
-    let time_bins = (mono.len().saturating_sub(fft_size)) / hop_size + 1;
-
-    // Precompute Hann window
-    let window: Vec<f32> = (0..fft_size)
-        .map(|i| 0.5 * (1.0 - (2.0 * PI * i as f32 / fft_size as f32).cos()))
-        .collect();
-
-    // Precompute twiddle factors for Cooley-Tukey radix-2 FFT
-    let twiddles: Vec<(f32, f32)> = (0..fft_size / 2)
-        .map(|k| {
-            let angle = -2.0 * PI * k as f32 / fft_size as f32;
-            (angle.cos(), angle.sin())
-        })
-        .collect();
-
-    // Bit-reversal permutation table
-    let bits = (fft_size as f32).log2() as u32;
-    let bit_rev: Vec<usize> = (0..fft_size)
-        .map(|i| (i as u32).reverse_bits().wrapping_shr(32 - bits) as usize)
-        .collect();
-
-    // Process all time slices in parallel
-    let magnitudes: Vec<f32> = (0..time_bins)
-        .into_par_iter()
-        .flat_map(|t| {
-            let offset = t * hop_size;
-            let mut re = vec![0.0f32; fft_size];
-            let mut im = vec![0.0f32; fft_size];
-
-            // Load windowed samples in bit-reversed order
-            for i in 0..fft_size {
-                let sample = if offset + i < mono.len() {
-                    mono[offset + i]
-                } else {
-                    0.0
-                };
-                re[bit_rev[i]] = sample * window[i];
-            }
-
-            // Cooley-Tukey radix-2 DIT FFT
-            let mut half_size = 1;
-            while half_size < fft_size {
-                let step = half_size * 2;
-                let twiddle_step = fft_size / step;
-
-                for k in (0..fft_size).step_by(step) {
-                    for j in 0..half_size {
-                        let tw_idx = j * twiddle_step;
-                        let (tw_re, tw_im) = twiddles[tw_idx];
-
-                        let a = k + j;
-                        let b = a + half_size;
-
-                        let t_re = tw_re * re[b] - tw_im * im[b];
-                        let t_im = tw_re * im[b] + tw_im * re[b];
-
-                        re[b] = re[a] - t_re;
-                        im[b] = im[a] - t_im;
-                        re[a] += t_re;
-                        im[a] += t_im;
-                    }
-                }
-                half_size = step;
-            }
-
-            // Extract magnitudes for positive frequencies
-            let mut mags = Vec::with_capacity(freq_bins);
-            for f in 0..freq_bins {
-                let mag = (re[f] * re[f] + im[f] * im[f]).sqrt();
-                // dB normalization: -80dB floor to 0dB ceiling → 0.0 to 1.0
-                let db = 20.0 * (mag + 1e-10).log10();
-                mags.push(((db + 80.0) / 80.0).clamp(0.0, 1.0));
-            }
-            mags
-        })
-        .collect();
-
-    SpectrogramData {
-        magnitudes,
-        time_bins,
-        freq_bins,
-        sample_rate,
-        hop_size,
-        fft_size,
-        duration,
-    }
-}
diff --git a/lightningbeam-ui/lightningbeam-editor/src/spectrogram_gpu.rs b/lightningbeam-ui/lightningbeam-editor/src/spectrogram_gpu.rs
deleted file mode 100644
index d82773c..0000000
--- a/lightningbeam-ui/lightningbeam-editor/src/spectrogram_gpu.rs
+++ /dev/null
@@ -1,350 +0,0 @@
-/// GPU resources for spectrogram rendering.
-///
-/// Follows the same pattern as waveform_gpu.rs:
-/// - SpectrogramGpuResources stored in CallbackResources (long-lived)
-/// - SpectrogramCallback implements egui_wgpu::CallbackTrait (per-frame)
-/// - R32Float texture holds magnitude data (time bins × freq bins)
-/// - Fragment shader applies colormap and frequency mapping
-
-use std::collections::HashMap;
-
-/// GPU resources for all spectrograms (stored in egui_wgpu::CallbackResources)
-pub struct SpectrogramGpuResources {
-    pub entries: HashMap<usize, SpectrogramGpuEntry>,
-    render_pipeline: wgpu::RenderPipeline,
-    render_bind_group_layout: wgpu::BindGroupLayout,
-    sampler: wgpu::Sampler,
-}
-
-/// Per-audio-pool GPU data for one spectrogram
-#[allow(dead_code)]
-pub struct SpectrogramGpuEntry {
-    pub texture: wgpu::Texture,
-    pub texture_view: wgpu::TextureView,
-    pub render_bind_group: wgpu::BindGroup,
-    pub uniform_buffer: wgpu::Buffer,
-    pub time_bins: u32,
-    pub freq_bins: u32,
-    pub sample_rate: u32,
-    pub hop_size: u32,
-    pub fft_size: u32,
-    pub duration: f32,
-}
-
-/// Uniform buffer struct — must match spectrogram.wgsl Params exactly
-#[repr(C)]
-#[derive(Debug, Copy, Clone, bytemuck::Pod, bytemuck::Zeroable)]
-pub struct SpectrogramParams {
-    pub clip_rect: [f32; 4],        // 16 bytes @ offset 0
-    pub viewport_start_time: f32,    // 4 bytes @ offset 16
-    pub pixels_per_second: f32,      // 4 bytes @ offset 20
-    pub audio_duration: f32,         // 4 bytes @ offset 24
-    pub sample_rate: f32,            // 4 bytes @ offset 28
-    pub clip_start_time: f32,        // 4 bytes @ offset 32
-    pub trim_start: f32,             // 4 bytes @ offset 36
-    pub time_bins: f32,              // 4 bytes @ offset 40
-    pub freq_bins: f32,              // 4 bytes @ offset 44
-    pub hop_size: f32,               // 4 bytes @ offset 48
-    pub fft_size: f32,               // 4 bytes @ offset 52
-    pub scroll_y: f32,               // 4 bytes @ offset 56
-    pub note_height: f32,            // 4 bytes @ offset 60
-    pub screen_size: [f32; 2],       // 8 bytes @ offset 64
-    pub min_note: f32,               // 4 bytes @ offset 72
-    pub max_note: f32,               // 4 bytes @ offset 76
-    pub gamma: f32,                  // 4 bytes @ offset 80
-    pub _pad: [f32; 3],              // 12 bytes @ offset 84 (pad to 96 for WGSL struct alignment)
-}
-// Total: 96 bytes (multiple of 16 for vec4 alignment)
-
-/// Data for a pending spectrogram texture upload
-pub struct SpectrogramUpload {
-    pub magnitudes: Vec<f32>,
-    pub time_bins: u32,
-    pub freq_bins: u32,
-    pub sample_rate: u32,
-    pub hop_size: u32,
-    pub fft_size: u32,
-    pub duration: f32,
-}
-
-/// Per-frame callback for rendering one spectrogram instance
-pub struct SpectrogramCallback {
-    pub pool_index: usize,
-    pub params: SpectrogramParams,
-    pub target_format: wgpu::TextureFormat,
-    pub pending_upload: Option<SpectrogramUpload>,
-}
-
-impl SpectrogramGpuResources {
-    pub fn new(device: &wgpu::Device, target_format: wgpu::TextureFormat) -> Self {
-        // Shader
-        let shader = device.create_shader_module(wgpu::ShaderModuleDescriptor {
-            label: Some("spectrogram_render_shader"),
-            source: wgpu::ShaderSource::Wgsl(
-                include_str!("panes/shaders/spectrogram.wgsl").into(),
-            ),
-        });
-
-        // Bind group layout: texture + sampler + uniforms
-        let render_bind_group_layout =
-            device.create_bind_group_layout(&wgpu::BindGroupLayoutDescriptor {
-                label: Some("spectrogram_render_bgl"),
-                entries: &[
-                    wgpu::BindGroupLayoutEntry {
-                        binding: 0,
-                        visibility: wgpu::ShaderStages::FRAGMENT,
-                        ty: wgpu::BindingType::Texture {
-                            sample_type: wgpu::TextureSampleType::Float { filterable: true },
-                            view_dimension: wgpu::TextureViewDimension::D2,
-                            multisampled: false,
-                        },
-                        count: None,
-                    },
-                    wgpu::BindGroupLayoutEntry {
-                        binding: 1,
-                        visibility: wgpu::ShaderStages::FRAGMENT,
-                        ty: wgpu::BindingType::Sampler(wgpu::SamplerBindingType::Filtering),
-                        count: None,
-                    },
-                    wgpu::BindGroupLayoutEntry {
-                        binding: 2,
-                        visibility: wgpu::ShaderStages::FRAGMENT,
-                        ty: wgpu::BindingType::Buffer {
-                            ty: wgpu::BufferBindingType::Uniform,
-                            has_dynamic_offset: false,
-                            min_binding_size: None,
-                        },
-                        count: None,
-                    },
-                ],
-            });
-
-        // Render pipeline
-        let pipeline_layout = device.create_pipeline_layout(&wgpu::PipelineLayoutDescriptor {
-            label: Some("spectrogram_pipeline_layout"),
-            bind_group_layouts: &[&render_bind_group_layout],
-            push_constant_ranges: &[],
-        });
-
-        let render_pipeline = device.create_render_pipeline(&wgpu::RenderPipelineDescriptor {
-            label: Some("spectrogram_render_pipeline"),
-            layout: Some(&pipeline_layout),
-            vertex: wgpu::VertexState {
-                module: &shader,
-                entry_point: Some("vs_main"),
-                buffers: &[],
-                compilation_options: Default::default(),
-            },
-            fragment: Some(wgpu::FragmentState {
-                module: &shader,
-                entry_point: Some("fs_main"),
-                targets: &[Some(wgpu::ColorTargetState {
-                    format: target_format,
-                    blend: Some(wgpu::BlendState::ALPHA_BLENDING),
-                    write_mask: wgpu::ColorWrites::ALL,
-                })],
-                compilation_options: Default::default(),
-            }),
-            primitive: wgpu::PrimitiveState {
-                topology: wgpu::PrimitiveTopology::TriangleList,
-                ..Default::default()
-            },
-            depth_stencil: None,
-            multisample: wgpu::MultisampleState::default(),
-            multiview: None,
-            cache: None,
-        });
-
-        // Bilinear sampler for smooth frequency interpolation
-        let sampler = device.create_sampler(&wgpu::SamplerDescriptor {
-            label: Some("spectrogram_sampler"),
-            mag_filter: wgpu::FilterMode::Linear,
-            min_filter: wgpu::FilterMode::Linear,
-            mipmap_filter: wgpu::FilterMode::Nearest,
-            ..Default::default()
-        });
-
-        Self {
-            entries: HashMap::new(),
-            render_pipeline,
-            render_bind_group_layout,
-            sampler,
-        }
-    }
-
-    /// Upload pre-computed spectrogram magnitude data as a GPU texture
-    pub fn upload_spectrogram(
-        &mut self,
-        device: &wgpu::Device,
-        queue: &wgpu::Queue,
-        pool_index: usize,
-        upload: &SpectrogramUpload,
-    ) {
-        // Remove old entry
-        self.entries.remove(&pool_index);
-
-        if upload.time_bins == 0 || upload.freq_bins == 0 {
-            return;
-        }
-
-        // Data layout: magnitudes[t * freq_bins + f] — each row is one time slice
-        // with freq_bins values. So texture width = freq_bins, height = time_bins.
-        // R8Unorm is filterable (unlike R32Float) for bilinear interpolation.
-        let tex_width = upload.freq_bins;
-        let tex_height = upload.time_bins;
-
-        let texture = device.create_texture(&wgpu::TextureDescriptor {
-            label: Some(&format!("spectrogram_{}", pool_index)),
-            size: wgpu::Extent3d {
-                width: tex_width,
-                height: tex_height,
-                depth_or_array_layers: 1,
-            },
-            mip_level_count: 1,
-            sample_count: 1,
-            dimension: wgpu::TextureDimension::D2,
-            format: wgpu::TextureFormat::R8Unorm,
-            usage: wgpu::TextureUsages::TEXTURE_BINDING | wgpu::TextureUsages::COPY_DST,
-            view_formats: &[],
-        });
-
-        // Convert f32 magnitudes to u8 for R8Unorm, with row padding for alignment.
-        // wgpu requires bytes_per_row to be a multiple of COPY_BYTES_PER_ROW_ALIGNMENT (256).
-        let align = wgpu::COPY_BYTES_PER_ROW_ALIGNMENT;
-        let unpadded_row = tex_width; // 1 byte per texel for R8Unorm
-        let padded_row = (unpadded_row + align - 1) / align * align;
-
-        let mut texel_data = vec![0u8; padded_row as usize * tex_height as usize];
-        for row in 0..tex_height as usize {
-            let src_offset = row * tex_width as usize;
-            let dst_offset = row * padded_row as usize;
-            for col in 0..tex_width as usize {
-                let m = upload.magnitudes[src_offset + col];
-                texel_data[dst_offset + col] = (m.clamp(0.0, 1.0) * 255.0) as u8;
-            }
-        }
-
-        // Upload magnitude data
-        queue.write_texture(
-            wgpu::TexelCopyTextureInfo {
-                texture: &texture,
-                mip_level: 0,
-                origin: wgpu::Origin3d::ZERO,
-                aspect: wgpu::TextureAspect::All,
-            },
-            &texel_data,
-            wgpu::TexelCopyBufferLayout {
-                offset: 0,
-                bytes_per_row: Some(padded_row),
-                rows_per_image: Some(tex_height),
-            },
-            wgpu::Extent3d {
-                width: tex_width,
-                height: tex_height,
-                depth_or_array_layers: 1,
-            },
-        );
-
-        let texture_view = texture.create_view(&wgpu::TextureViewDescriptor {
-            label: Some(&format!("spectrogram_{}_view", pool_index)),
-            ..Default::default()
-        });
-
-        let uniform_buffer = device.create_buffer(&wgpu::BufferDescriptor {
-            label: Some(&format!("spectrogram_{}_uniforms", pool_index)),
-            size: std::mem::size_of::<SpectrogramParams>() as u64,
-            usage: wgpu::BufferUsages::UNIFORM | wgpu::BufferUsages::COPY_DST,
-            mapped_at_creation: false,
-        });
-
-        let render_bind_group = device.create_bind_group(&wgpu::BindGroupDescriptor {
-            label: Some(&format!("spectrogram_{}_bg", pool_index)),
-            layout: &self.render_bind_group_layout,
-            entries: &[
-                wgpu::BindGroupEntry {
-                    binding: 0,
-                    resource: wgpu::BindingResource::TextureView(&texture_view),
-                },
-                wgpu::BindGroupEntry {
-                    binding: 1,
-                    resource: wgpu::BindingResource::Sampler(&self.sampler),
-                },
-                wgpu::BindGroupEntry {
-                    binding: 2,
-                    resource: uniform_buffer.as_entire_binding(),
-                },
-            ],
-        });
-
-        self.entries.insert(
-            pool_index,
-            SpectrogramGpuEntry {
-                texture,
-                texture_view,
-                render_bind_group,
-                uniform_buffer,
-                time_bins: upload.time_bins,
-                freq_bins: upload.freq_bins,
-                sample_rate: upload.sample_rate,
-                hop_size: upload.hop_size,
-                fft_size: upload.fft_size,
-                duration: upload.duration,
-            },
-        );
-    }
-}
-
-impl egui_wgpu::CallbackTrait for SpectrogramCallback {
-    fn prepare(
-        &self,
-        device: &wgpu::Device,
-        queue: &wgpu::Queue,
-        _screen_descriptor: &egui_wgpu::ScreenDescriptor,
-        _egui_encoder: &mut wgpu::CommandEncoder,
-        resources: &mut egui_wgpu::CallbackResources,
-    ) -> Vec<wgpu::CommandBuffer> {
-        // Initialize global resources on first use
-        if !resources.contains::<SpectrogramGpuResources>() {
-            resources.insert(SpectrogramGpuResources::new(device, self.target_format));
-        }
-
-        let gpu: &mut SpectrogramGpuResources = resources.get_mut().unwrap();
-
-        // Handle pending upload
-        if let Some(ref upload) = self.pending_upload {
-            gpu.upload_spectrogram(device, queue, self.pool_index, upload);
-        }
-
-        // Update uniform buffer
-        if let Some(entry) = gpu.entries.get(&self.pool_index) {
-            queue.write_buffer(
-                &entry.uniform_buffer,
-                0,
-                bytemuck::cast_slice(&[self.params]),
-            );
-        }
-
-        Vec::new()
-    }
-
-    fn paint(
-        &self,
-        _info: eframe::egui::PaintCallbackInfo,
-        render_pass: &mut wgpu::RenderPass<'static>,
-        resources: &egui_wgpu::CallbackResources,
-    ) {
-        let gpu: &SpectrogramGpuResources = match resources.get() {
-            Some(r) => r,
-            None => return,
-        };
-
-        let entry = match gpu.entries.get(&self.pool_index) {
-            Some(e) => e,
-            None => return,
-        };
-
-        render_pass.set_pipeline(&gpu.render_pipeline);
-        render_pass.set_bind_group(0, &entry.render_bind_group, &[]);
-        render_pass.draw(0..3, 0..1); // Fullscreen triangle
-    }
-}