diff --git a/src/FFT.hpp b/src/FFT.hpp index 51dba4a..750100f 100644 --- a/src/FFT.hpp +++ b/src/FFT.hpp @@ -53,7 +53,8 @@ std::vector> FFT(const std::vector::const_iterator& begin, const std::vector::const_iterator& end, size_t sampleRate, - double minFreq, double maxFreq) + double minFreq, double maxFreq, + unsigned int zeropadding) { std::vector signal(begin, end); size_t N = signal.size(); @@ -64,6 +65,11 @@ FFT(const std::vector::const_iterator& begin, N++; } + if (zeropadding > 1) { + N = (signal.size() << (zeropadding - 1)); + signal.insert(signal.end(), N - signal.size(), 0); + } + std::vector> spectrum = radix2dit(signal.cbegin(), N, 1); double freqRes = (double)sampleRate / (double)N; double nyquistLimit = (double)sampleRate / 2.0f; diff --git a/src/main.cpp b/src/main.cpp index 2a37684..392824f 100644 --- a/src/main.cpp +++ b/src/main.cpp @@ -16,6 +16,7 @@ struct Settings { float splitInterval; double minFreq, maxFreq; unsigned int analyzeChannel; + unsigned int zeropadding; }; Settings Parse(int argc, char** argv); @@ -59,7 +60,9 @@ int main(int argc, char** argv) audioFile.samples[c-1].cbegin(), audioFile.samples[c-1].cend(), sampleRate, - setts.minFreq, setts.maxFreq); + setts.minFreq, setts.maxFreq, + setts.zeropadding + ); output[chName] = nlohmann::json::array(); for (const std::pair& pair : spectrum) { @@ -80,7 +83,8 @@ int main(int argc, char** argv) audioFile.samples[c-1].cend() ), sampleRate, - setts.minFreq, setts.maxFreq + setts.minFreq, setts.maxFreq, + setts.zeropadding ); output[chName].push_back({ @@ -122,6 +126,7 @@ Settings Parse(int argc, char** argv) ("q,quiet", "Suppress text output", cxxopts::value()->default_value("false")) ("i,interval", "Splits audio file into intervals of length i milliseconds and transforms them individually (0 to not split file)", cxxopts::value()) ("f,frequency", "Defines the frequency range of the output spectrum (Default: all the frequencies)", cxxopts::value>()) + ("p,pad", "Add extra zero-padding. By default, the program will pad the signals with 0s until the number of samples is a power of 2 (this would be equivalent to -p 1). With this option you can tell the program to instead pad until the power of 2 after the next one (-p 2) etc. This increases frequency resolution", cxxopts::value()) ("m,mono", "Analyze only the given channel", cxxopts::value()->default_value("0")) ("files", "Files to fourier transform", cxxopts::value>()) ("h,help", "Print usage") @@ -157,6 +162,7 @@ Settings Parse(int argc, char** argv) setts.quiet = (result.count("quiet") ? result["quiet"].as() : false); setts.splitInterval = (result.count("interval") ? result["interval"].as() : 0.0f); setts.analyzeChannel = (result.count("mono") ? result["mono"].as() : 0); + setts.zeropadding = (result.count("pad") ? result["pad"].as() : 1); if (setts.maxFreq <= setts.minFreq && (setts.maxFreq != 0))