forest-all-around/sampler/lib/Audio_SdFat/synth_wavetable.cpp
Dooho Yi 91f92c0e6c audio & sd lib upgrade (SdFatSdioEX)
migration from 'smp_v1p0' dev.
for 'sampler' -> skip irrelavant note msg. and keep playing
2019-12-11 23:37:44 +09:00

424 lines
18 KiB
C++

/* Audio Library for Teensy 3.X
* Copyright (c) 2017, TeensyAudio PSU Team
*
* Development of this audio library was sponsored by PJRC.COM, LLC.
* Please support PJRC's efforts to develop open source
* software by purchasing Teensy or other PJRC products.
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice, development funding notice, and this permission
* notice shall be included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
* THE SOFTWARE.
*/
#include <Arduino.h>
#include "synth_wavetable.h"
#include <dspinst.h>
#include <SerialFlash.h>
//#define TIME_TEST_ON
//#define ENVELOPE_DEBUG
// Performance testing macro generally unrelated to the wavetable object, but was used to
// fine tune the performance of specific blocks of code in update(); usage is to specify a
// display interval in ms, then place the code block to be tracked *IN* the macro parens as
// the second argument
#ifdef TIME_TEST_ON
#define TIME_TEST(INTERVAL, CODE_BLOCK_TO_TEST) \
static float MICROS_AVG = 0.0; \
static int TEST_CUR_CNT = 0; \
static int TEST_LST_CNT = 0; \
static int NEXT_DISPLAY = 0; \
static int TEST_TIME_ACC = 0; \
int micros_start = micros(); \
CODE_BLOCK_TO_TEST \
int micros_end = micros(); \
TEST_TIME_ACC += micros_end - micros_start; \
++TEST_CUR_CNT; \
if (NEXT_DISPLAY < micros_end) { \
MICROS_AVG += (TEST_TIME_ACC - TEST_CUR_CNT * MICROS_AVG) / (TEST_LST_CNT + TEST_CUR_CNT); \
NEXT_DISPLAY = micros_end + INTERVAL*1000; \
TEST_LST_CNT += TEST_CUR_CNT; \
TEST_TIME_ACC = TEST_CUR_CNT = 0; \
Serial.printf("avg: %f, n: %i\n", MICROS_AVG, TEST_LST_CNT); \
}
#else
#define TIME_TEST(INTERVAL, CODE_BLOCK_TO_TEST) do { } while(0); \
CODE_BLOCK_TO_TEST
#endif
// Debug code to track state variables for the volume envelope
#ifdef ENVELOPE_DEBUG
#define PRINT_ENV(NAME) Serial.printf("%14s-- env_mult:%06.4f%% of UNITY_GAIN env_incr:%06.4f%% of UNITY_GAIN env_count:%i\n", #NAME, float(env_mult)/float(UNITY_GAIN), float(env_incr)/float(UNITY_GAIN), env_count);
#else
#define PRINT_ENV(NAME) do { } while(0);
#endif
/**
* @brief Stop playing waveform.
*
* Waveform does not immediately stop,
* but fades out based on release time.
*
*/
void AudioSynthWavetable::stop(void) {
cli();
if (env_state != STATE_IDLE) {
env_state = STATE_RELEASE;
env_count = current_sample->RELEASE_COUNT;
if (env_count == 0) env_count = 1;
env_incr = -(env_mult) / (env_count * ENVELOPE_PERIOD);
}
PRINT_ENV(STATE_RELEASE);
sei();
}
/**
* @brief Play waveform at defined frequency, amplitude.
*
* @param freq Frequency of note to playback, value between 1.0 and half of AUDIO_SAMPLE_RATE_EXACT
* @param amp Amplitude scaling of note, value between 0-127, with 127 being base volume
*/
void AudioSynthWavetable::playFrequency(float freq, int amp) {
setState(freqToNote(freq), amp, freq);
}
/**
* @brief Play sample at specified note, amplitude.
*
* @param note Midi note number to playback, value between 0-127
* @param amp Amplitude scaling of playback, value between 0-127, with 127 being base volume
*/
void AudioSynthWavetable::playNote(int note, int amp) {
setState(note, amp, noteToFreq(note));
}
/**
* @brief Initializes object state variables, sets freq/amp, and chooses appropriate sample
*
* @param note Midi note number to play, value between 0-127
* @param amp the amplitude level at which playback should occur
* @param freq exact frequency of the note to be played played
*/
void AudioSynthWavetable::setState(int note, int amp, float freq) {
cli();
int i;
env_state = STATE_IDLE;
// note ranges calculated by sound font decoder
for (i = 0; note > instrument->sample_note_ranges[i]; i++);
current_sample = &instrument->samples[i];
if (current_sample == NULL) {
sei();
return;
}
setFrequency(freq);
vib_count = mod_count = tone_phase = env_incr = env_mult = 0;
vib_phase = mod_phase = TRIANGLE_INITIAL_PHASE;
env_count = current_sample->DELAY_COUNT;
// linear scalar for amp with UINT16_MAX being no attenuation
tone_amp = amp * (UINT16_MAX / 127);
// scale relative to initial attenuation defined by soundfont file
tone_amp = current_sample->INITIAL_ATTENUATION_SCALAR * tone_amp >> 16;
env_state = STATE_DELAY;
PRINT_ENV(STATE_DELAY);
state_change = true;
sei();
}
/**
* @brief Set various integer offsets to values that will produce intended frequencies
* @details the main integer offset, tone_incr, is used to step through the current sample's 16-bit PCM audio sample.
* Specifically, the tone_incr is the rate at which the interpolation code in update() steps through uint32_t space.
* The remaining offset variables represent a minimum and maximum offset allowed for tone_incr, which allows for low-frequency
* variation in playback frequency (aka vibrato). Further details on implementation in update() and in sample_data.h.
*
* @param freq frequency of the generated output (between 0 and the board-specific sample rate)
*/
void AudioSynthWavetable::setFrequency(float freq) {
float tone_incr_temp = freq * current_sample->PER_HERTZ_PHASE_INCREMENT;
tone_incr = tone_incr_temp;
vib_pitch_offset_init = tone_incr_temp * current_sample->VIBRATO_PITCH_COEFFICIENT_INITIAL;
vib_pitch_offset_scnd = tone_incr_temp * current_sample->VIBRATO_PITCH_COEFFICIENT_SECOND;
mod_pitch_offset_init = tone_incr_temp * current_sample->MODULATION_PITCH_COEFFICIENT_INITIAL;
mod_pitch_offset_scnd = tone_incr_temp * current_sample->MODULATION_PITCH_COEFFICIENT_SECOND;
}
/**
* @brief Called by the AudioStream library to fill the audio output buffer.
* The major parts are the interpoalation stage, and the volume envelope stage.
* Further details on implementation included inline.
*
*/
void AudioSynthWavetable::update(void) {
// exit if nothing to do
if (env_state == STATE_IDLE || (current_sample->LOOP == false && tone_phase >= current_sample->MAX_PHASE)) {
env_state = STATE_IDLE;
return;
}
// else locally copy object state and continue
this->state_change = false;
const sample_data* s = (const sample_data*)current_sample;
uint32_t tone_phase = this->tone_phase;
uint32_t tone_incr = this->tone_incr;
uint16_t tone_amp = this->tone_amp;
envelopeStateEnum env_state = this->env_state;
int32_t env_count = this->env_count;
int32_t env_mult = this->env_mult;
int32_t env_incr = this->env_incr;
uint32_t vib_count = this->vib_count;
uint32_t vib_phase = this->vib_phase;
int32_t vib_pitch_offset_init = this->vib_pitch_offset_init;
int32_t vib_pitch_offset_scnd = this->vib_pitch_offset_scnd;
uint32_t mod_count = this->mod_count;
int32_t mod_phase = this->mod_phase;
int32_t mod_pitch_offset_init = this->mod_pitch_offset_init;
int32_t mod_pitch_offset_scnd = this->mod_pitch_offset_scnd;
audio_block_t* block;
block = allocate();
if (block == NULL) return;
uint32_t* p, *end;
uint32_t index, phase_scale;
int32_t s1, s2;
uint32_t tmp1, tmp2;
// filling audio_block two samples at a time
p = (uint32_t*)block->data;
end = p + AUDIO_BLOCK_SAMPLES / 2;
// Main loop to handle interpolation, vibrato (vibrato LFO and modulation LFO), and tremolo (modulation LFO only)
// Virbrato and modulation offsets/multipliers are updated depending on the LFO_SMOOTHNESS, with max smoothness (7) being one
// update per loop interation, and minimum smoothness (1) being once per loop. Hence there is a configurable trade-off
// between performance and the smoothness of LFO changes to pitch/amplitude as well as the vibrato/modulation delay granularity
// also note that the vibrato/tremolo for the two LFO are defined in the SoundFont spec to be a cents (vibrato) or centibel (tremolo)
// diviation oscillating with a triangle wave at a given frequency; the following implementation gets the critical points of those
// oscillations correct, but linearly interpolates the *frequency* and *amplitude* range between those points, which technically results
// in a "bowing" of the triangle wave curve relative to what it should be (although this typically isn't audible)
while (p < end) {
// TODO: more elegant support of non-looping samples
if (s->LOOP == false && tone_phase >= s->MAX_PHASE) break;
// variable to accumulate LFO pitch offsets; stays 0 if still in vibrato/modulation delay
int32_t tone_incr_offset = 0;
if (vib_count++ > s->VIBRATO_DELAY) {
vib_phase += s->VIBRATO_INCREMENT;
// convert uint32_t phase value to int32_t triangle wave value
// TRIANGLE_INITIAL_PHASE (0xC0000000) and 0x40000000 -> 0, 0 -> INT32_MAX/2, 0x80000000 -> INT32_MIN/2
int32_t vib_scale = vib_phase & 0x80000000 ? 0x40000000 + vib_phase : 0x3FFFFFFF - vib_phase;
// select a vibrato pitch offset based on sign of scale; note that the values "init" and "scnd" values
// produced by the decoder script will either both be negative, or both be positive; this allows the
// scalar to either start with either a downward (negative offset) or upward (positive) pitch oscillation
int32_t vib_pitch_offset = vib_scale >= 0 ? vib_pitch_offset_init : vib_pitch_offset_scnd;
// scale the offset and accumulate into offset
// note the offset value is already preshifted by << 2 to account for this func shifting >> 32
tone_incr_offset = multiply_accumulate_32x32_rshift32_rounded(tone_incr_offset, vib_scale, vib_pitch_offset);
}
// variable to hold an adjusted amplitude attenuation value; stays at tone_amp if modulation in delay
int32_t mod_amp = tone_amp;
if (mod_count++ > s->MODULATION_DELAY) {
// pitch LFO component is same as above, but we'll also use the scale value for tremolo below
mod_phase += s->MODULATION_INCREMENT;
int32_t mod_scale = mod_phase & 0x80000000 ? 0x40000000 + mod_phase : 0x3FFFFFFF - mod_phase;
int32_t mod_pitch_offset = mod_scale >= 0 ? mod_pitch_offset_init : mod_pitch_offset_scnd;
tone_incr_offset = multiply_accumulate_32x32_rshift32_rounded(tone_incr_offset, mod_scale, mod_pitch_offset);
// similar to pitch, sign of init and scnd are either both + or - to allow correct triangle direction
int32_t mod_amp_offset = (mod_scale >= 0 ? s->MODULATION_AMPLITUDE_INITIAL_GAIN : s->MODULATION_AMPLITUDE_SECOND_GAIN);
// here we scale the amp offset which, similar to the pitch offset, is already pre-shifted by << 2
mod_scale = multiply_32x32_rshift32(mod_scale, mod_amp_offset);
// the resulting scalar is then used to scale mod_map (possibly resulting in a negative) and add that back into mod_amp
mod_amp = signed_multiply_accumulate_32x16b(mod_amp, mod_scale, mod_amp);
}
// producing 2 output values per iteration; repeat more depending on the LFO_SMOOTHNESS
// this segment linearly interpolates, calculates how far we step through the sample data, and scales amplitude
for (int i = LFO_PERIOD / 2; i; --i, ++p) {
// INDEX_BITS representing the higher order bits we use to index into the sample data
index = tone_phase >> (32 - s->INDEX_BITS);
// recast as uint32_t to load in packed variable; initially int16_t* since we may need to read accross a word boundry
// note we are assuming a little-endian cpu (i.e. the first sample is loaded into the lower half-word)
tmp1 = *((uint32_t*)(s->sample + index));
// phase_scale here being the next 16-bits after the first INDEX_BITS, representing the distince between the samples to interpolate at
// 0x0000 gives us all of the first sample point, 0xFFFF all of the second, anything inbetween a sliding mix
phase_scale = (tone_phase << s->INDEX_BITS) >> 16;
// scaling of second sample point
s1 = signed_multiply_32x16t(phase_scale, tmp1);
// then add in scaling of first point
s1 = signed_multiply_accumulate_32x16b(s1, 0xFFFF - phase_scale, tmp1);
// apply amplitude scaling
s1 = signed_multiply_32x16b(mod_amp, s1);
// iterate tone_phase, giving us our desired frequency playback, and apply the offset, giving us our pitch LFOs
tone_phase += tone_incr + tone_incr_offset;
// break if no loop and we've gone past the end of the sample
if (s->LOOP == false && tone_phase >= s->MAX_PHASE) break;
// move phase back if a looped sample has overstepped its loop
tone_phase = s->LOOP && tone_phase >= s->LOOP_PHASE_END ? tone_phase - s->LOOP_PHASE_LENGTH : tone_phase;
//repeat as above
index = tone_phase >> (32 - s->INDEX_BITS);
tmp1 = *((uint32_t*)(s->sample + index));
phase_scale = (tone_phase << s->INDEX_BITS) >> 16;
s2 = signed_multiply_32x16t(phase_scale, tmp1);
s2 = signed_multiply_accumulate_32x16b(s2, 0xFFFF - phase_scale, tmp1);
s2 = signed_multiply_32x16b(mod_amp, s2);
tone_phase += tone_incr + tone_incr_offset;
if (s->LOOP == false && tone_phase >= s->MAX_PHASE) break;
tone_phase = s->LOOP && tone_phase >= s->LOOP_PHASE_END ? tone_phase - s->LOOP_PHASE_LENGTH : tone_phase;
// pack the two output samples into the audio_block
*p = pack_16b_16b(s2, s1);
}
}
// fill with 0s if non-looping sample that ended prematurely
if (p < end) {
env_state = STATE_IDLE;
env_count = 0;
while (p < end) *p++ = 0;
}
// filling audio_block two samples at a time
p = (uint32_t *)block->data;
end = p + AUDIO_BLOCK_SAMPLES / 2;
// the following code handles the volume envelope with the following state transitions controlled here:
// STATE_DELAY -> STATE_ATTACK -> STATE_HOLD -> STATE_DECAY -> STATE_SUSTAIN or STATE_IDLE
// STATE_RELEASE -> STATE_IDLE
// When STATE_SUSTAIN is reached, it is held indefinitely.
// Outside of this code, playNote() and playFrequency() will initially set STATE_DELAY, and stop()
// is responsible for setting STATE_RELEASE which can occur during any state, except STATE_IDLE
// State defintions:
// idle - not playing (generally should never arrive here)
// delay - full attenuation
// attack - linear ramp from full attenuation to no attenuation
// hold - no attenuation
// decay - linear ramp down to a given level of attenuation (SUSTAIN_MULT)
// sustain - constant attenuation at a given level (SUSTAIN_MULT)
// release - linear ramp down from current attenuation level to full attenuation
// Definitions of the states generally follow the SoundFont spec, with a major exception being that all
// volume scaling is linear realtive to amplitude; this is correct with respect to the attack, but not
// the correct implementation relative to the decay and release which should be scaling linearly relative
// to centibels. Practically this means the decay and release happen too slowing intially, and too quick
// near the end
// other points of note are that one env_count corresponds to 1 second * ENVELOPE_PERIOD / AUDIO_SAMPLE_RATE_EXACT;
// the ENVELOPE_PERIOD is the number of samples processed per iteration of the following loop
while (p < end) {
// note env_count == 0 is used as a trigger for state transition
if (env_count <= 0) switch (env_state) {
case STATE_DELAY:
env_state = STATE_ATTACK;
env_count = s->ATTACK_COUNT;
env_incr = UNITY_GAIN / (env_count * ENVELOPE_PERIOD);
PRINT_ENV(STATE_ATTACK);
continue;
case STATE_ATTACK:
env_mult = UNITY_GAIN;
env_state = STATE_HOLD;
env_count = s->HOLD_COUNT;
env_incr = 0;
PRINT_ENV(STATE_HOLD);
continue;
case STATE_HOLD:
env_state = STATE_DECAY;
env_count = s->DECAY_COUNT;
env_incr = (-s->SUSTAIN_MULT) / (env_count * ENVELOPE_PERIOD);
PRINT_ENV(STATE_DECAY);
continue;
case STATE_DECAY:
env_mult = UNITY_GAIN - s->SUSTAIN_MULT;
// UINT16_MAX is a value approximately corresponding to the -100 dBFS defined in the SoundFont spec as full attenuation
// hence this comparison either sends the state to indefinite STATE_SUSTAIN, or immediately into STATE_RELEASE -> STATE_IDLE
env_state = env_mult < UNITY_GAIN / UINT16_MAX ? STATE_RELEASE : STATE_SUSTAIN;
env_incr = 0;
continue;
case STATE_SUSTAIN:
env_count = INT32_MAX;
PRINT_ENV(STATE_SUSTAIN);
continue;
case STATE_RELEASE:
env_state = STATE_IDLE;
for (; p < end; ++p) *p = 0;
PRINT_ENV(STATE_IDLE);
continue;
default:
p = end;
PRINT_ENV(DEFAULT);
continue;
}
env_mult += env_incr;
// env_mult is INT32_MAX at max (i.e. 31-bits), so shift << 1 so result is aligned with high halfword of tmp1/tmp2
tmp1 = signed_multiply_32x16b(env_mult, p[0]) << 1;
env_mult += env_incr;
tmp2 = signed_multiply_32x16t(env_mult, p[0]) << 1;
// pack from high halfword of tmp1, tmp2
p[0] = pack_16t_16t(tmp2, tmp1);
env_mult += env_incr;
tmp1 = signed_multiply_32x16b(env_mult, p[1]) << 1;
env_mult += env_incr;
tmp2 = signed_multiply_32x16t(env_mult, p[1]) << 1;
p[1] = pack_16t_16t(tmp2, tmp1);
env_mult += env_incr;
tmp1 = signed_multiply_32x16b(env_mult, p[2]) << 1;
env_mult += env_incr;
tmp2 = signed_multiply_32x16t(env_mult, p[2]) << 1;
p[2] = pack_16t_16t(tmp2, tmp1);
env_mult += env_incr;
tmp1 = signed_multiply_32x16b(env_mult, p[3]) << 1;
env_mult += env_incr;
tmp2 = signed_multiply_32x16t(env_mult, p[3]) << 1;
p[3] = pack_16t_16t(tmp2, tmp1);
p += ENVELOPE_PERIOD / 2;
env_count--;
}
// copy state back, unless there was a state change
if (this->state_change == false) {
this->tone_phase = tone_phase;
this->env_state = env_state;
this->env_count = env_count;
this->env_mult = env_mult;
this->env_incr = env_incr;
if (this->env_state != STATE_IDLE) {
this->vib_count = vib_count;
this->vib_phase = vib_phase;
this->mod_count = mod_count;
this->mod_phase = mod_phase;
}
else {
this->vib_count = this->mod_count = 0;
this->vib_phase = this->mod_phase = TRIANGLE_INITIAL_PHASE;
}
}
transmit(block);
release(block);
}