diff options
author | Bent Bisballe Nyeng <deva@aasimon.org> | 2015-07-19 14:06:04 +0200 |
---|---|---|
committer | Bent Bisballe Nyeng <deva@aasimon.org> | 2016-01-20 13:31:09 +0100 |
commit | 2534e4f930f821acc0fc4d5cbfce74325b9b5137 (patch) | |
tree | d405b29951ae18b197b25e61dae7f9b8e90f181c | |
parent | f7c57640ecaf20148361db0bad321b60009061f7 (diff) |
The SIMD implementation is broken with the current cachemanager version and does not add much to the performance anyway; so now it is disabled.
-rw-r--r-- | src/drumgizmo.cc | 37 |
1 files changed, 22 insertions, 15 deletions
diff --git a/src/drumgizmo.cc b/src/drumgizmo.cc index e7843d4..528b542 100644 --- a/src/drumgizmo.cc +++ b/src/drumgizmo.cc @@ -380,9 +380,10 @@ bool DrumGizmo::run(size_t pos, sample_t *samples, size_t nsamples) return true; } +#undef SSE // SSE broken for now ... so disable it. #ifdef SSE #define N 8 -typedef float vNsf __attribute__ ((vector_size(sizeof(float)*N))); +typedef float vNsf __attribute__ ((vector_size(sizeof(sample_t)*N))); #endif/*SSE*/ void DrumGizmo::getSamples(int ch, int pos, sample_t *s, size_t sz) @@ -423,39 +424,45 @@ void DrumGizmo::getSamples(int ch, int pos, sample_t *s, size_t sz) size_t n = 0; // default start point is 0. // If we are not at offset 0 in current buffer: - if(evt->offset > (size_t)pos) n = evt->offset - pos; + if(evt->offset > (size_t)pos) { + n = evt->offset - pos; + } size_t end = sz; // default end point is the end of the buffer. // Find the end point intra-buffer - if((evt->t + end - n) > af->size) end = af->size - evt->t + n; + if((evt->t + end - n) > af->size) { + end = af->size - evt->t + n; + } // This should not be necessary but make absolutely sure that we do // not write over the end of the buffer. - if(end > sz) end = sz; + if(end > sz) { + end = sz; + } size_t t = 0; // Internal buffer counter if(evt->rampdown == NO_RAMPDOWN) { - if(n > 0) { - // We cannot use SIMD on this buffer. - for(; n < end; n++) { - s[n] += evt->buffer[t]; - t++; - } - } + #ifdef SSE size_t optend = ((end - n) / N) * N + n; + + // Force source addr to be 16 byte aligned... (might skip 1 or 2 samples) + while((size_t)&evt->buffer[t] % 16) { + ++t; + } + for(; (n < optend) && (t < evt->buffer_size); n += N) { *(vNsf*)&(s[n]) += *(vNsf*)&(evt->buffer[t]); t += N; - } + } #endif - for(; n < end; n++) { + for(; (n < end) && (t < evt->buffer_size); n++) { s[n] += evt->buffer[t]; t++; } } else { // Ramp down in progress. - for(; n < end && evt->rampdown; n++) { + for(; (n < end) && (t < evt->buffer_size) && evt->rampdown; n++) { float scale = (float)evt->rampdown/(float)evt->ramp_start; s[n] += evt->buffer[t] * scale; t++; @@ -463,7 +470,7 @@ void DrumGizmo::getSamples(int ch, int pos, sample_t *s, size_t sz) } } - evt->t += t; // Add internal buffer counter to "global" event counter. + evt->t += evt->buffer_size; // Add internal buffer counter to "global" event counter. if((evt->t < af->size) && (evt->rampdown != 0)) { evt->buffer = cacheManager.next(evt->cache_id, evt->buffer_size); |