public class SignalProcUtils extends Object
Constructor and Description |
---|
SignalProcUtils() |
Modifier and Type | Method and Description |
---|---|
static double[] |
addSignals(double[] s1,
double[] s2) |
static double[] |
addSignals(double[] s1,
double gain1,
double[] s2,
double gain2) |
static void |
addWhiteNoise(double[] x,
double level) |
static double[] |
applyPreemphasis(double[] frm,
double preCoef) |
static double[] |
arFilter(double[] x,
double[] a,
double lpGain) |
static double[] |
arFilter(double[] x,
double[] a,
double lpGain,
double[] yInitial) |
static double[] |
arFilter(double[] x,
float[] a,
double lpGain) |
static double[] |
arFilter(double[] x,
float[] a,
double lpGain,
double[] yInitial) |
static double[] |
arFilterFreqDomain(double[] windowedFrame,
double[] a,
double lpGain,
double startFreqInHz,
double endFreqInHz,
int samplingRateInHz) |
static double[] |
autocorr(double[] x,
int LPOrder) |
static double[] |
bark2freq(double[] barks,
int samplingRateInHz) |
static double |
bark2freq(double bark,
int samplingRateInHz) |
static double |
barkNew2freq(double barkNew) |
static double |
barkNew2radian(double bark,
int samplingRateInHz) |
static void |
centerClip(double[] x,
double ratio) |
static double |
cepstrum2linearSpecAmp(float[] ceps,
float freqInRadians) |
static double |
cepstrum2minimumPhase(float[] ceps,
float freqInRadians) |
static double[] |
decimate(double[] x,
double D) |
static void |
displayDFTSpectrumInDB(double[] frame) |
static void |
displayDFTSpectrumInDB(double[] frame,
int fftSize) |
static void |
displayDFTSpectrumInDB(double[] frame,
int fftSize,
double[] wgt) |
static void |
displayDFTSpectrumInDB(double[] frame,
int fftSize,
int windowType) |
static void |
displayDFTSpectrumInDBNoWindowing(double[] frame) |
static void |
displayDFTSpectrumInDBNoWindowing(double[] frame,
int fftSize) |
static void |
displayDFTSpectrumLinear(double[] frame) |
static void |
displayDFTSpectrumLinear(double[] frame,
int fftSize) |
static void |
displayDFTSpectrumLinear(double[] frame,
int fftSize,
int windowType) |
static void |
displayDFTSpectrumLinearNoWindowing(double[] frame) |
static void |
displayDFTSpectrumLinearNoWindowing(double[] frame,
int fftSize) |
static void |
displayLPSpectrumInDB(double[] alpha,
double lpGain,
int fftSize) |
static void |
displayLPSpectrumLinear(double[] alpha,
double lpGain,
int fftSize) |
static double |
energy(double[] x) |
static double[] |
fdFilter(ComplexArray frameDft,
float startFreqInHz,
float endFreqInHz,
int samplingRateInHz,
int origLen) |
static double[] |
fdFilter(double[] x,
double[] filterFreqResponse) |
static double[] |
fdFilter(double[] x,
float startFreqInHz,
float endFreqInHz,
int samplingRateInHz,
int fftSize) |
static double[][] |
fft2barkmx(int nfft,
int sr,
int nfilts,
int width,
double minfreq,
double maxfreq)
Java port of: wts = fft2barkmx(nfft, sr, nfilts, width). Generates a matrix of weights to combine FFT bins into
Bark bins.
|
static double[] |
filter(double[] b,
double[] x) |
static double[] |
filter(double[] b,
double[] x,
boolean bNormalize) |
static double[] |
filter(double[] b,
double[] x,
boolean bNormalize,
double[] zi) |
static double[] |
filter(double[] b,
double[] a,
double[] x) |
static double[] |
filter(double[] b,
double[] a,
double[] x,
boolean bNormalize) |
static double[] |
filter(double[] b,
double[] a,
double[] x,
boolean bNormalize,
double[] zi) |
static double[] |
filterfd(double[] filterFFTAbsMag,
double[] x,
double samplingRate) |
static double[] |
filterfd(double[] filterFFTAbsMag,
double[] x,
double samplingRate,
double winsize) |
static double[] |
filterfd(double[] filterFFTAbsMag,
double[] x,
double samplingRate,
double winsize,
double skipsize) |
static double[] |
filtfilt(double[] b,
double[] x) |
static double[] |
filtfilt(double[] b,
double[] a,
double[] x) |
static double[] |
fitLeastSquaresLine(double[] x,
double[] y) |
static double[] |
fixedRateF0Values(PitchMarks pm,
double wsFixedInSeconds,
double ssFixedInSeconds,
int numfrm,
int samplingRate) |
static int |
frameIndex2LabelIndex(int zeroBasedFrameIndex,
Labels labels,
double windowSizeInSeconds,
double skipSizeInSeconds) |
static double |
frameIndex2Time(int zeroBasedFrameIndex,
double windowSizeInSeconds,
double skipSizeInSeconds) |
static float |
frameIndex2Time(int zeroBasedFrameIndex,
float windowSizeInSeconds,
float skipSizeInSeconds) |
static double |
freq2bark(double freqInHz) |
static double[] |
freq2bark(double[] freqsInHz) |
static double |
freq2barkNew(double freqInHz) |
static int[] |
freq2index(double[] freqsInHz,
int samplingRateInHz,
int maxFreq) |
static int |
freq2index(double freqInHz,
double samplingRateInHz,
int maxFreqIndex) |
static double[] |
freq2indexDouble(double[] freqsInHz,
double samplingRateInHz,
int maxFreq) |
static double |
freq2indexDouble(double freqInHz,
double samplingRateInHz,
int maxFreqIndex) |
static int |
fullSpectrumSize(int maxFreq) |
static float[] |
getAnalysisTimes(int numfrm,
double windowSizeInSeconds,
double frameShiftInSeconds) |
static double |
getAverageSampleEnergy(double[] x) |
static double |
getAverageSampleEnergy(double[] x,
int len) |
static double |
getAverageSampleEnergy(double[] x,
int len,
int start) |
static float[] |
getAverageSampleEnergyContour(double[] x,
double windowSizeInSeconds,
double skipSizeInSeconds,
int samplingRate) |
static float[] |
getAverageSampleEnergyContour(double[] x,
float[] times,
int samplingRateInHz,
float windowDurationInSeconds) |
static double[] |
getContourLSFit(double[] contour,
boolean isPitchUVInterpolation) |
static int |
getDFTSize(int fs) |
static double |
getEnergy(double[] x) |
static double |
getEnergy(double[] x,
int len) |
static double |
getEnergy(double[] x,
int len,
int start) |
static double[] |
getEnergyContourRms(double[] x,
double windowSizeInSeconds,
double skipSizeInSeconds,
int samplingRate) |
static double |
getEnergydB(double x) |
static double |
getEnergydB(double[] x) |
static double |
getEnergydB(double[] x,
int len) |
static double |
getEnergydB(double[] x,
int len,
int start) |
static double[] |
getExpF0s(double[] logF0s) |
static double |
getF0Range(double[] f0s) |
static double |
getF0Range(double[] f0s,
double percentileMin,
double percentileMax) |
static int |
getFIRFilterOrder(int fs) |
static ComplexArray |
getFrameDft(double[] frame,
int fftSize) |
static ComplexArray |
getFrameDft(double[] frame,
int fftSize,
double[] windowWgt) |
static ComplexArray |
getFrameDft(double[] frame,
int fftSize,
int windowType) |
static double[] |
getFrameHalfMagnitudeSpectrum(double[] frame,
int fftSize) |
static double[] |
getFrameHalfMagnitudeSpectrum(double[] frame,
int fftSize,
double[] wgt) |
static double[] |
getFrameHalfMagnitudeSpectrum(double[] frame,
int fftSize,
int windowType) |
static double[] |
getFrameMagnitudeSpectrum(double[] frame,
int fftSize) |
static double[] |
getFrameMagnitudeSpectrum(double[] frame,
int fftSize,
double[] wgt) |
static double[] |
getFrameMagnitudeSpectrum(double[] frame,
int fftSize,
int windowType) |
static int |
getLifterOrder(int fs) |
static double[] |
getLogF0s(double[] f0s) |
static int |
getLPOrder(int fs) |
static double[][] |
getMapped(double[][] x,
int[] mapInds) |
static float[][] |
getMapped(float[][] x,
int[] mapInds) |
static double |
getMaximumFreqOfVoicingInHz(double[] specAmpsLinear,
int[] peakInds,
int[][] freqBandInds,
int samplingRate) |
static double[] |
getNoise(double startFreqInHz,
double endFreqInHz,
double transitionBandwidthInHz,
int samplingRateInHz,
int len) |
static double[] |
getNoiseNormalizedFreqs(double normalizedStartFreq,
double normalizedEndFreq,
double normalizedTransitionBandwidth,
int len) |
static double[] |
getPeakAmplitudeFrequencies(double[] sDft,
double f0InHz,
int numHarmonics,
int fftSize,
double samplingRateInHz,
boolean bIncludeZerothHarmonic) |
static double[] |
getPeakAmplitudes(double[] sDft,
double f0InHz,
int numHarmonics,
int fftSize,
double samplingRateInHz,
boolean bIncludeZerothHarmonic) |
static double[] |
getPeakAmplitudes(double[] sDft,
double f0InHz,
int startHarmonicIndex,
int endHarmonicIndex,
int fftSize,
double samplingRateInHz,
boolean amplitudes) |
static double |
getRmsDistance(double[] x,
double[] y) |
static int |
getTotalFrames(double totalTimeInSeconds,
double windowSizeInSeconds,
double skipSizeInSeconds) |
static int |
getTotalFrames(int totalSamples,
double windowSizeInSeconds,
double skipSizeInSeconds) |
static int |
getTotalFrames(int totalSamples,
int windowLengthInSamples,
int skipSizeInSamples) |
static double[] |
getVoiceds(double[] f0s) |
static boolean |
getVoicing(double[] windowedSpeechFrame,
int samplingRateInHz) |
static boolean |
getVoicing(double[] windowedSpeechFrame,
int samplingRateInHz,
double voicingThreshold) |
static double |
getVoicingProbability(double[] windowedSpeechFrame,
int samplingRateInHz) |
static boolean[] |
getVuvs(double[] f0s) |
static double[] |
getWhiteNoise(int totalSamples,
double maxAbsGain) |
static double[] |
getWhiteNoiseOfMeanVariance(int totalSamples,
double mean,
double variance) |
static double[] |
getWhiteNoiseOfVariance(int totalSamples,
double variance) |
static Window |
getWindow(int windowType,
int windowSizeInSamples) |
static int |
halfSpectrumSize(int fftSize) |
static double |
hz2bark(double freqInHz)
Since there is no asinh in Math, its definition is used here: asinh(x) = ln(x + sqrt(x^2 + 1)). This function is used in
fft2barkmx().
|
static double |
hz2mel(double freqInHz,
int samplingRateInHz) |
static double |
hz2radian(double hz,
int samplingRate) |
static float |
hz2radian(float hz,
int samplingRate) |
static double |
index2freq(int zeroBasedFreqIndex,
int samplingRateInHz,
int zeroBasedMaxFreqIndex) |
static double |
indexDouble2freq(double zeroBasedFreqIndex,
int samplingRateInHz,
int zeroBasedMaxFreqIndex) |
static double[] |
interpolate_pitch_uv(double[] f0s) |
static double[] |
interpolate_pitch_uv(double[] f0s,
double minVoicedVal) |
static double[] |
interpolate(double[] x,
double D) |
static void |
main(String[] args) |
static int[] |
mapFrameIndices(int numfrmSource,
Labels srcLabs,
double srcWindowSizeInSeconds,
double srcSkipSizeInSeconds,
int numFrmTarget,
Labels tgtLabs,
double tgtWindowSizeInSeconds,
double tgtSkipSizeInSeconds) |
static double |
mean(Vector<Double> v) |
static double[] |
meanFilter(double[] x,
int N) |
static double[] |
meanFilter(double[] x,
int N,
double leftOutOfBound,
double rightOutOfBound) |
static float[] |
meanFilter(float[] x,
int N) |
static float[] |
meanFilter(float[] x,
int N,
float leftOutOfBound,
float rightOutOfBound) |
static double[] |
medianFilter(double[] x) |
static double[] |
medianFilter(double[] x,
int N) |
static float[] |
medianFilter(float[] x) |
static float[] |
medianFilter(float[] x,
int N) |
static double |
mel2hz(double mel,
int samplingRateInHz) |
static double |
mel2radian(double mel,
int samplingRateInHz) |
static double |
melNonMultiplied(double freqInRadian,
int samplingRateInHz) |
static double[] |
merge(double[] x1,
double[] x2) |
static int[] |
merge(int[] x1,
int[] x2) |
static double[] |
normalizeAverageSampleEnergy(double[] x,
double newAverageSampleEnergy) |
static double[] |
normalizeAverageSampleEnergyContour(double[] x,
float[] times,
float[] currentContour,
float[] targetContour,
int samplingRateInHz,
float windowDurationInSeconds) |
static double[] |
normalizeVocalTract(double[] srcSignal,
double[] tgtSignal,
int windowType,
double windowSizeInSeconds,
double frameShiftInSeconds,
int lpcOrder,
int samplingRateInHz,
float preCoef) |
static double[] |
normalizeVocalTract(double[] srcSignal,
double[] tgtSignal,
Labels sourceLabels,
Labels targetLabels,
int windowType,
double windowSizeInSeconds,
double frameShiftInSeconds,
int lpcOrder,
int samplingRateInHz,
float preCoef) |
static double[] |
normalizeVocalTract(double[] x,
float[] tAnalysisInSeconds,
float[][] srcLpcs,
float[][] mappedTgtLpcs,
double windowSizeInSeconds,
int samplingRateInHz,
float preCoef) |
static double[] |
normalizeVocalTract(double[] s,
float[] sAnalysisInSeconds,
float[][] mappedTgtLpcs,
int windowType,
double windowSizeInSeconds,
int lpcOrderSrc,
int samplingRateInHz,
float preCoef) |
static PitchMarks |
pitchContour2pitchMarks(double[] f0s,
int fs,
int len,
double ws,
double ss,
boolean bPaddZerosForFinalPitchMark,
int offset) |
static double[] |
pitchMarks2PitchContour(int[] pitchMarks,
float ws,
float ss,
int samplingRate) |
static double[] |
pitchScalePitchContour(double[] f0s,
float ws,
float ss,
float[] pScales,
float[] pScalesTimes) |
static double |
radian2hz(double rad,
int samplingRate) |
static float |
radian2hz(float rad,
int samplingRate) |
static double |
radian2mel(double freqInRadian,
int samplingRateInHz) |
static double[] |
removePreemphasis(double[] frm,
double preCoef) |
static double[] |
replaceNaNsWith(double[] x,
double val) |
static double[] |
reverse(double[] x) |
static float |
sample2time(float sample,
int samplingRate) |
static float |
sample2time(int sample,
int samplingRate) |
static float |
sample2time(long sample,
int samplingRate) |
static float |
sampleFloat2time(float sample,
int samplingRate) |
static float[] |
samples2times(int[] samples,
int samplingRate) |
static double[] |
shift(double[] x,
int N) |
static float[] |
shift(float[] x,
int N) |
static double |
sourceTime2targetTime(double sourceTime,
Labels sourceLabels,
Labels targetLabels) |
static double |
sourceTime2targetTime(double sourceTime,
Labels sourceLabels,
Labels targetLabels,
int[][] map) |
static float[] |
specLinear2cepstrum(double[] specLinear,
int cepsOrder) |
static double[] |
spectralMirror(double[] halfSpectrum) |
static double[] |
subtractSignals(double[] s1,
double[] s2) |
static void |
test_normalizeVocalTract() |
static int |
time2frameIndex(double time,
double windowSizeInSeconds,
double skipSizeInSeconds) |
static int |
time2frameIndex(float time,
float windowSizeInSeconds,
float skipSizeInSeconds) |
static int |
time2LabelIndex(double time,
Labels labels) |
static int[] |
time2sample(double[] times,
int samplingRate) |
static int |
time2sample(double time,
int samplingRate) |
static int[] |
time2sample(float[] times,
int samplingRate) |
static int |
time2sample(float time,
int samplingRate) |
static double |
time2sampleDouble(double time,
int samplingRate) |
static int[] |
times2samples(float[] times,
int samplingRate) |
static float |
timeScaledTime(float t,
float[] scales,
float[] times) |
static float[] |
timeScaledTimes(float[] times,
float[] tScales,
float[] tScalesTimes) |
static double[] |
timeScalePitchContour(double[] f0s,
float ws,
float ss,
float[] tScales,
float[] tScalesTimes) |
public static int getLPOrder(int fs)
public static int getDFTSize(int fs)
public static int getFIRFilterOrder(int fs)
public static int getLifterOrder(int fs)
public static int halfSpectrumSize(int fftSize)
public static int fullSpectrumSize(int maxFreq)
public static double getEnergydB(double x)
public static double getEnergydB(double[] x)
public static double getEnergydB(double[] x, int len)
public static double getEnergydB(double[] x, int len, int start)
public static double getEnergy(double[] x, int len, int start)
public static double getEnergy(double[] x, int len)
public static double getEnergy(double[] x)
public static double getAverageSampleEnergy(double[] x, int len, int start)
public static double getAverageSampleEnergy(double[] x, int len)
public static double getAverageSampleEnergy(double[] x)
public static double[] normalizeAverageSampleEnergy(double[] x, double newAverageSampleEnergy)
public static double[] getEnergyContourRms(double[] x, double windowSizeInSeconds, double skipSizeInSeconds, int samplingRate)
public static float[] getAverageSampleEnergyContour(double[] x, double windowSizeInSeconds, double skipSizeInSeconds, int samplingRate)
public static float[] getAverageSampleEnergyContour(double[] x, float[] times, int samplingRateInHz, float windowDurationInSeconds)
public static double[] normalizeAverageSampleEnergyContour(double[] x, float[] times, float[] currentContour, float[] targetContour, int samplingRateInHz, float windowDurationInSeconds)
public static double[] reverse(double[] x)
public static boolean[] getVuvs(double[] f0s)
public static PitchMarks pitchContour2pitchMarks(double[] f0s, int fs, int len, double ws, double ss, boolean bPaddZerosForFinalPitchMark, int offset)
public static double[] pitchMarks2PitchContour(int[] pitchMarks, float ws, float ss, int samplingRate)
public static double[] fixedRateF0Values(PitchMarks pm, double wsFixedInSeconds, double ssFixedInSeconds, int numfrm, int samplingRate)
public static double[] interpolate_pitch_uv(double[] f0s)
public static double[] interpolate_pitch_uv(double[] f0s, double minVoicedVal)
public static double[] getContourLSFit(double[] contour, boolean isPitchUVInterpolation)
public static double[] fitLeastSquaresLine(double[] x, double[] y)
public static boolean getVoicing(double[] windowedSpeechFrame, int samplingRateInHz)
public static boolean getVoicing(double[] windowedSpeechFrame, int samplingRateInHz, double voicingThreshold)
public static double getVoicingProbability(double[] windowedSpeechFrame, int samplingRateInHz)
public static double[] autocorr(double[] x, int LPOrder)
public static double[] applyPreemphasis(double[] frm, double preCoef)
public static double[] removePreemphasis(double[] frm, double preCoef)
public static double[] freq2bark(double[] freqsInHz)
public static double freq2bark(double freqInHz)
public static double hz2bark(double freqInHz)
freqInHz - frequency in Hz
public static double freq2barkNew(double freqInHz)
public static double barkNew2freq(double barkNew)
public static double[] bark2freq(double[] barks, int samplingRateInHz)
public static double bark2freq(double bark, int samplingRateInHz)
public static double barkNew2radian(double bark, int samplingRateInHz)
public static double[][] fft2barkmx(int nfft, int sr, int nfilts, int width, double minfreq, double maxfreq)
nfft - FFT size
sr - sampling rate
nfilts - number of output bark bands
width - width of each band in Bark (default 1)
minfreq - min frequency
maxfreq - max frequency
public static int[] freq2index(double[] freqsInHz, int samplingRateInHz, int maxFreq)
public static int freq2index(double freqInHz, double samplingRateInHz, int maxFreqIndex)
public static double[] freq2indexDouble(double[] freqsInHz, double samplingRateInHz, int maxFreq)
public static double freq2indexDouble(double freqInHz, double samplingRateInHz, int maxFreqIndex)
public static double index2freq(int zeroBasedFreqIndex, int samplingRateInHz, int zeroBasedMaxFreqIndex)
public static double indexDouble2freq(double zeroBasedFreqIndex, int samplingRateInHz, int zeroBasedMaxFreqIndex)
public static float sample2time(int sample, int samplingRate)
public static float sampleFloat2time(float sample, int samplingRate)
public static float sample2time(long sample, int samplingRate)
public static float sample2time(float sample, int samplingRate)
public static int time2sample(float time, int samplingRate)
public static int[] time2sample(float[] times, int samplingRate)
public static int time2sample(double time, int samplingRate)
public static int[] time2sample(double[] times, int samplingRate)
public static double time2sampleDouble(double time, int samplingRate)
public static float[] samples2times(int[] samples, int samplingRate)
public static int[] times2samples(float[] times, int samplingRate)
public static float timeScaledTime(float t, float[] scales, float[] times)
public static float[] timeScaledTimes(float[] times, float[] tScales, float[] tScalesTimes)
public static double[] timeScalePitchContour(double[] f0s, float ws, float ss, float[] tScales, float[] tScalesTimes)
public static double[] pitchScalePitchContour(double[] f0s, float ws, float ss, float[] pScales, float[] pScalesTimes)
public static double[] getNoise(double startFreqInHz, double endFreqInHz, double transitionBandwidthInHz, int samplingRateInHz, int len)
public static double[] getNoiseNormalizedFreqs(double normalizedStartFreq, double normalizedEndFreq, double normalizedTransitionBandwidth, int len)
public static float radian2hz(float rad, int samplingRate)
public static double radian2hz(double rad, int samplingRate)
public static float hz2radian(float hz, int samplingRate)
public static double hz2radian(double hz, int samplingRate)
public static double[] medianFilter(double[] x)
public static float[] medianFilter(float[] x)
public static float[] medianFilter(float[] x, int N)
public static double[] medianFilter(double[] x, int N)
public static double[] meanFilter(double[] x, int N)
public static float[] meanFilter(float[] x, int N)
public static float[] meanFilter(float[] x, int N, float leftOutOfBound, float rightOutOfBound)
public static double[] meanFilter(double[] x, int N, double leftOutOfBound, double rightOutOfBound)
public static float frameIndex2Time(int zeroBasedFrameIndex, float windowSizeInSeconds, float skipSizeInSeconds)
public static double frameIndex2Time(int zeroBasedFrameIndex, double windowSizeInSeconds, double skipSizeInSeconds)
public static int time2frameIndex(float time, float windowSizeInSeconds, float skipSizeInSeconds)
public static int time2frameIndex(double time, double windowSizeInSeconds, double skipSizeInSeconds)
public static void centerClip(double[] x, double ratio)
public static double[] getVoiceds(double[] f0s)
public static double[] getLogF0s(double[] f0s)
public static double[] getExpF0s(double[] logF0s)
public static double getF0Range(double[] f0s)
public static double getF0Range(double[] f0s, double percentileMin, double percentileMax)
public static int frameIndex2LabelIndex(int zeroBasedFrameIndex, Labels labels, double windowSizeInSeconds, double skipSizeInSeconds)
public static int time2LabelIndex(double time, Labels labels)
public static double getRmsDistance(double[] x, double[] y)
public static int[] merge(int[] x1, int[] x2)
public static double[] merge(double[] x1, double[] x2)
public static double[] decimate(double[] x, double D)
public static double[] interpolate(double[] x, double D)
public static double energy(double[] x)
public static double[] filter(double[] b, double[] x)
public static double[] filter(double[] b, double[] a, double[] x)
public static double[] filter(double[] b, double[] x, boolean bNormalize)
public static double[] filter(double[] b, double[] a, double[] x, boolean bNormalize)
public static double[] filter(double[] b, double[] x, boolean bNormalize, double[] zi)
public static double[] filter(double[] b, double[] a, double[] x, boolean bNormalize, double[] zi)
public static double[] filtfilt(double[] b, double[] x)
public static double[] filtfilt(double[] b, double[] a, double[] x)
public static double[] filterfd(double[] filterFFTAbsMag, double[] x, double samplingRate)
public static double[] filterfd(double[] filterFFTAbsMag, double[] x, double samplingRate, double winsize)
public static double[] filterfd(double[] filterFFTAbsMag, double[] x, double samplingRate, double winsize, double skipsize)
public static void addWhiteNoise(double[] x, double level)
public static double[] getWhiteNoise(int totalSamples, double maxAbsGain)
public static double[] getWhiteNoiseOfVariance(int totalSamples, double variance)
public static double[] getWhiteNoiseOfMeanVariance(int totalSamples, double mean, double variance)
public static float[] specLinear2cepstrum(double[] specLinear, int cepsOrder)
public static double cepstrum2linearSpecAmp(float[] ceps, float freqInRadians)
public static double cepstrum2minimumPhase(float[] ceps, float freqInRadians)
public static double getMaximumFreqOfVoicingInHz(double[] specAmpsLinear, int[] peakInds, int[][] freqBandInds, int samplingRate)
public static double[] spectralMirror(double[] halfSpectrum)
public static double[] addSignals(double[] s1, double[] s2)
public static double[] addSignals(double[] s1, double gain1, double[] s2, double gain2)
public static double[] subtractSignals(double[] s1, double[] s2)
public static double[] arFilter(double[] x, double[] a, double lpGain)
public static double[] arFilter(double[] x, float[] a, double lpGain)
public static double[] arFilter(double[] x, float[] a, double lpGain, double[] yInitial)
public static double[] arFilter(double[] x, double[] a, double lpGain, double[] yInitial)
public static double[] arFilterFreqDomain(double[] windowedFrame, double[] a, double lpGain, double startFreqInHz, double endFreqInHz, int samplingRateInHz)
public static double[] fdFilter(double[] x, double[] filterFreqResponse)
public static double[] fdFilter(double[] x, float startFreqInHz, float endFreqInHz, int samplingRateInHz, int fftSize)
public static double[] fdFilter(ComplexArray frameDft, float startFreqInHz, float endFreqInHz, int samplingRateInHz, int origLen)
public static void displayDFTSpectrumLinearNoWindowing(double[] frame)
public static void displayDFTSpectrumLinearNoWindowing(double[] frame, int fftSize)
public static void displayDFTSpectrumLinear(double[] frame)
public static void displayDFTSpectrumLinear(double[] frame, int fftSize)
public static void displayDFTSpectrumLinear(double[] frame, int fftSize, int windowType)
public static void displayDFTSpectrumInDBNoWindowing(double[] frame)
public static void displayDFTSpectrumInDBNoWindowing(double[] frame, int fftSize)
public static void displayDFTSpectrumInDB(double[] frame)
public static void displayDFTSpectrumInDB(double[] frame, int fftSize)
public static void displayDFTSpectrumInDB(double[] frame, int fftSize, int windowType)
public static void displayDFTSpectrumInDB(double[] frame, int fftSize, double[] wgt)
public static double[] getFrameHalfMagnitudeSpectrum(double[] frame, int fftSize)
public static double[] getFrameMagnitudeSpectrum(double[] frame, int fftSize)
public static double[] getFrameHalfMagnitudeSpectrum(double[] frame, int fftSize, int windowType)
public static double[] getFrameMagnitudeSpectrum(double[] frame, int fftSize, int windowType)
public static double[] getFrameHalfMagnitudeSpectrum(double[] frame, int fftSize, double[] wgt)
public static double[] getFrameMagnitudeSpectrum(double[] frame, int fftSize, double[] wgt)
public static ComplexArray getFrameDft(double[] frame, int fftSize)
public static ComplexArray getFrameDft(double[] frame, int fftSize, int windowType)
public static ComplexArray getFrameDft(double[] frame, int fftSize, double[] windowWgt)
public static void displayLPSpectrumLinear(double[] alpha, double lpGain, int fftSize)
public static void displayLPSpectrumInDB(double[] alpha, double lpGain, int fftSize)
public static double[] shift(double[] x, int N)
public static float[] shift(float[] x, int N)
public static double[] getPeakAmplitudes(double[] sDft, double f0InHz, int numHarmonics, int fftSize, double samplingRateInHz, boolean bIncludeZerothHarmonic)
public static double[] getPeakAmplitudeFrequencies(double[] sDft, double f0InHz, int numHarmonics, int fftSize, double samplingRateInHz, boolean bIncludeZerothHarmonic)
public static double[] getPeakAmplitudes(double[] sDft, double f0InHz, int startHarmonicIndex, int endHarmonicIndex, int fftSize, double samplingRateInHz, boolean amplitudes)
sDft - sDft
f0InHz - f0InHz
startHarmonicIndex - startHarmonicIndex
endHarmonicIndex - endHarmonicIndex
fftSize - fftSize
samplingRateInHz - samplingRateInHz
amplitudes - if amplitudes is true, it returns the amplitude values (original function); if amplitudes is false, it returns the
frequencies where the amplitude peaks were located
public static float[] getAnalysisTimes(int numfrm, double windowSizeInSeconds, double frameShiftInSeconds)
public static double[][] getMapped(double[][] x, int[] mapInds)
public static float[][] getMapped(float[][] x, int[] mapInds)
public static Window getWindow(int windowType, int windowSizeInSamples)
public static int getTotalFrames(int totalSamples, int windowLengthInSamples, int skipSizeInSamples)
public static int getTotalFrames(int totalSamples, double windowSizeInSeconds, double skipSizeInSeconds)
public static int getTotalFrames(double totalTimeInSeconds, double windowSizeInSeconds, double skipSizeInSeconds)
public static double melNonMultiplied(double freqInRadian, int samplingRateInHz)
public static double radian2mel(double freqInRadian, int samplingRateInHz)
public static double hz2mel(double freqInHz, int samplingRateInHz)
public static double mel2radian(double mel, int samplingRateInHz)
public static double mel2hz(double mel, int samplingRateInHz)
public static double[] replaceNaNsWith(double[] x, double val)
public static double sourceTime2targetTime(double sourceTime, Labels sourceLabels, Labels targetLabels)
public static double sourceTime2targetTime(double sourceTime, Labels sourceLabels, Labels targetLabels, int[][] map)
public static int[] mapFrameIndices(int numfrmSource, Labels srcLabs, double srcWindowSizeInSeconds, double srcSkipSizeInSeconds, int numFrmTarget, Labels tgtLabs, double tgtWindowSizeInSeconds, double tgtSkipSizeInSeconds)
public static double[] normalizeVocalTract(double[] srcSignal, double[] tgtSignal, Labels sourceLabels, Labels targetLabels, int windowType, double windowSizeInSeconds, double frameShiftInSeconds, int lpcOrder, int samplingRateInHz, float preCoef)
public static double[] normalizeVocalTract(double[] s, float[] sAnalysisInSeconds, float[][] mappedTgtLpcs, int windowType, double windowSizeInSeconds, int lpcOrderSrc, int samplingRateInHz, float preCoef)
public static double[] normalizeVocalTract(double[] x, float[] tAnalysisInSeconds, float[][] srcLpcs, float[][] mappedTgtLpcs, double windowSizeInSeconds, int samplingRateInHz, float preCoef)
public static void test_normalizeVocalTract() throws UnsupportedAudioFileException, IOException
public static double[] normalizeVocalTract(double[] srcSignal, double[] tgtSignal, int windowType, double windowSizeInSeconds, double frameShiftInSeconds, int lpcOrder, int samplingRateInHz, float preCoef)
public static void main(String[] args) throws UnsupportedAudioFileException, IOException
Copyright © 2000–2016 DFKI GmbH. All rights reserved.