-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmel_spectrogram.rs
More file actions
73 lines (62 loc) · 2.55 KB
/
mel_spectrogram.rs
File metadata and controls
73 lines (62 loc) · 2.55 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
use non_empty_slice::NonEmptyVec;
/// Mel-frequency spectrogram example
///
/// This example demonstrates:
/// - Computing mel-frequency spectrograms
/// - Using logarithmic (dB) amplitude scaling
/// - Accessing mel-frequency axes
use spectrograms::{
LogParams, MelDbSpectrogram, MelParams, SpectrogramParams, StftParams, WindowType, nzu,
};
use std::f64::consts::PI;
fn main() -> Result<(), Box<dyn std::error::Error>> {
// Generate a more complex signal: two sine waves
let sample_rate = 16000.0;
let duration = 1.0;
let samples: Vec<f64> = (0..(duration * sample_rate) as usize)
.map(|i| {
let t = i as f64 / sample_rate;
// 440 Hz (A4) + 880 Hz (A5)
(2.0 * PI * 440.0 * t).sin() + 0.5 * (2.0 * PI * 880.0 * t).sin()
})
.collect();
let samples = NonEmptyVec::new(samples).unwrap();
println!("Generated {} samples with two frequencies", samples.len());
// Set up STFT parameters
let stft = StftParams::new(nzu!(512), nzu!(256), WindowType::Hanning, true)?;
let params = SpectrogramParams::new(stft, sample_rate)?;
// Set up mel filterbank parameters
let mel = MelParams::new(
nzu!(80), // n_mels: number of mel bands
0.0, // f_min: minimum frequency (Hz)
8000.0, // f_max: maximum frequency (Hz)
)?;
// Set up logarithmic (dB) scaling
let db = LogParams::new(-80.0)?; // floor at -80 dB
// Compute mel spectrogram in dB scale
let spec = MelDbSpectrogram::compute(&samples, ¶ms, &mel, Some(&db))?;
println!("\nMel Spectrogram properties:");
println!(" Mel bands: {}", spec.n_bins());
println!(" Time frames: {}", spec.n_frames());
// Access mel-frequency axis
let mel_freqs = spec.axes().frequencies();
println!("\nMel frequency range:");
println!(" Lowest mel center: {:.1} Hz", mel_freqs[0]);
println!(
" Highest mel center: {:.1} Hz",
mel_freqs[mel_freqs.len().get() - 1]
);
// Print a few mel band center frequencies
println!("\nFirst 10 mel band centers (Hz):");
for (i, &freq) in mel_freqs.iter().take(10).enumerate() {
println!(" Mel band {}: {:.1} Hz", i, freq);
}
// Find average energy per mel band (across all frames)
println!("\nAverage energy per mel band (dB):");
for i in (0..spec.n_bins().get()).step_by(spec.n_bins().get() / 5) {
let row = spec.data().row(i);
let avg = row.iter().sum::<f64>() / row.len() as f64;
println!(" Mel band {} ({:.1} Hz): {:.2} dB", i, mel_freqs[i], avg);
}
Ok(())
}