mirror of
https://gitea.osmocom.org/cellular-infrastructure/osmo-trx.git
synced 2025-10-23 08:22:00 +00:00
SigProcLib: Improve Vector buffer allocation mess
Original issue: In order to use SSE instructions, 16-byte aligned memory chunks are needed, and C++ version < C++11 doesn't provide for a native new/delete store. For that reason, memalign() must be used in the implementation of convolve_h_alloc() for some buffers. On the other side, The C++ code relies on C++ "new T[]" operator to allocate a chunk of memory containing an array of class instances. As classes are complex types, they cannot be allocated through C structures (calling malloc). Experimentally can be seen too that it's unreliable and the process will crash during startup if malloc() is used and then a Complex<> deferred from it. Previous implementation allowed for use of convolve_h_alloc or new[] based on how the (signal)Vector is called, because then the buffer is not going to be managed internally. But that's unreliable since resize() calling resize() on it could use "delete" operator on a malloc'ed buffer, and end up having a new new[] allocated buffer. It was also found that some of the callers were actually leaking memory through ASan (because the buffer is not managed by the Vector instance). IMHO best option would be to rewrite all this code using C structures and malloc/free exclusively, since it would make all this cod eeasier to maintain. But for now, let's extend the Vector class to allow specifying an external alloc/free function and let the Vector instance take care of the ownership of the buffer in all scenarios. Change-Id: Ie484a4762a7f77fe1b105188ea03a6f025730b82
This commit is contained in:
committed by
Harald Welte
parent
800c029c70
commit
f7331764ac
@@ -32,11 +32,14 @@
|
|||||||
#include <string.h>
|
#include <string.h>
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
#include <assert.h>
|
#include <assert.h>
|
||||||
|
#include <stdlib.h>
|
||||||
|
|
||||||
// We cant use Logger.h in this file...
|
// We cant use Logger.h in this file...
|
||||||
extern int gVectorDebug;
|
extern int gVectorDebug;
|
||||||
#define BVDEBUG(msg) if (gVectorDebug) {std::cout << msg;}
|
#define BVDEBUG(msg) if (gVectorDebug) {std::cout << msg;}
|
||||||
|
|
||||||
|
typedef void (*vector_free_func)(void* wData);
|
||||||
|
typedef void *(*vector_alloc_func)(size_t newSize);
|
||||||
|
|
||||||
/**
|
/**
|
||||||
A simplified Vector template with aliases.
|
A simplified Vector template with aliases.
|
||||||
@@ -60,6 +63,8 @@ template <class T> class Vector {
|
|||||||
T* mData; ///< allocated data block, if any
|
T* mData; ///< allocated data block, if any
|
||||||
T* mStart; ///< start of useful data
|
T* mStart; ///< start of useful data
|
||||||
T* mEnd; ///< end of useful data + 1
|
T* mEnd; ///< end of useful data + 1
|
||||||
|
vector_alloc_func mAllocFunc; ///< function used to alloc new mData during resize.
|
||||||
|
vector_free_func mFreeFunc; ///< function used to free mData.
|
||||||
|
|
||||||
public:
|
public:
|
||||||
|
|
||||||
@@ -85,9 +90,19 @@ template <class T> class Vector {
|
|||||||
/** Change the size of the Vector, discarding content. */
|
/** Change the size of the Vector, discarding content. */
|
||||||
void resize(size_t newSize)
|
void resize(size_t newSize)
|
||||||
{
|
{
|
||||||
if (mData!=NULL) delete[] mData;
|
if (mData!=NULL) {
|
||||||
|
if (mFreeFunc)
|
||||||
|
mFreeFunc(mData);
|
||||||
|
else
|
||||||
|
delete[] mData;
|
||||||
|
}
|
||||||
if (newSize==0) mData=NULL;
|
if (newSize==0) mData=NULL;
|
||||||
else mData = new T[newSize];
|
else {
|
||||||
|
if (mAllocFunc)
|
||||||
|
mData = (T*) mAllocFunc(newSize);
|
||||||
|
else
|
||||||
|
mData = new T[newSize];
|
||||||
|
}
|
||||||
mStart = mData;
|
mStart = mData;
|
||||||
mEnd = mStart + newSize;
|
mEnd = mStart + newSize;
|
||||||
}
|
}
|
||||||
@@ -116,29 +131,31 @@ template <class T> class Vector {
|
|||||||
//@{
|
//@{
|
||||||
|
|
||||||
/** Build an empty Vector of a given size. */
|
/** Build an empty Vector of a given size. */
|
||||||
Vector(size_t wSize=0):mData(NULL) { resize(wSize); }
|
Vector(size_t wSize=0, vector_alloc_func wAllocFunc=NULL, vector_free_func wFreeFunc=NULL)
|
||||||
|
:mData(NULL), mAllocFunc(wAllocFunc), mFreeFunc(wFreeFunc)
|
||||||
|
{ resize(wSize); }
|
||||||
|
|
||||||
/** Build a Vector by moving another. */
|
/** Build a Vector by moving another. */
|
||||||
Vector(Vector<T>&& other)
|
Vector(Vector<T>&& other)
|
||||||
:mData(other.mData),mStart(other.mStart),mEnd(other.mEnd)
|
:mData(other.mData),mStart(other.mStart),mEnd(other.mEnd), mAllocFunc(other.mAllocFunc), mFreeFunc(other.mFreeFunc)
|
||||||
{ other.mData=NULL; }
|
{ other.mData=NULL; }
|
||||||
|
|
||||||
/** Build a Vector by copying another. */
|
/** Build a Vector by copying another. */
|
||||||
Vector(const Vector<T>& other):mData(NULL) { clone(other); }
|
Vector(const Vector<T>& other):mData(NULL), mAllocFunc(other.mAllocFunc), mFreeFunc(other.mFreeFunc) { clone(other); }
|
||||||
|
|
||||||
/** Build a Vector with explicit values. */
|
/** Build a Vector with explicit values. */
|
||||||
Vector(T* wData, T* wStart, T* wEnd)
|
Vector(T* wData, T* wStart, T* wEnd, vector_alloc_func wAllocFunc=NULL, vector_free_func wFreeFunc=NULL)
|
||||||
:mData(wData),mStart(wStart),mEnd(wEnd)
|
:mData(wData),mStart(wStart),mEnd(wEnd), mAllocFunc(wAllocFunc), mFreeFunc(wFreeFunc)
|
||||||
{ }
|
{ }
|
||||||
|
|
||||||
/** Build a vector from an existing block, NOT to be deleted upon destruction. */
|
/** Build a vector from an existing block, NOT to be deleted upon destruction. */
|
||||||
Vector(T* wStart, size_t span)
|
Vector(T* wStart, size_t span, vector_alloc_func wAllocFunc=NULL, vector_free_func wFreeFunc=NULL)
|
||||||
:mData(NULL),mStart(wStart),mEnd(wStart+span)
|
:mData(NULL),mStart(wStart),mEnd(wStart+span),mAllocFunc(wAllocFunc), mFreeFunc(wFreeFunc)
|
||||||
{ }
|
{ }
|
||||||
|
|
||||||
/** Build a Vector by concatenation. */
|
/** Build a Vector by concatenation. */
|
||||||
Vector(const Vector<T>& other1, const Vector<T>& other2)
|
Vector(const Vector<T>& other1, const Vector<T>& other2, vector_alloc_func wAllocFunc=NULL, vector_free_func wFreeFunc=NULL)
|
||||||
:mData(NULL)
|
:mData(NULL), mAllocFunc(wAllocFunc), mFreeFunc(wFreeFunc)
|
||||||
{
|
{
|
||||||
resize(other1.size()+other2.size());
|
resize(other1.size()+other2.size());
|
||||||
memcpy(mStart, other1.mStart, other1.bytes());
|
memcpy(mStart, other1.mStart, other1.bytes());
|
||||||
@@ -162,6 +179,8 @@ template <class T> class Vector {
|
|||||||
mData=other.mData;
|
mData=other.mData;
|
||||||
mStart=other.mStart;
|
mStart=other.mStart;
|
||||||
mEnd=other.mEnd;
|
mEnd=other.mEnd;
|
||||||
|
mAllocFunc=other.mAllocFunc;
|
||||||
|
mFreeFunc=other.mFreeFunc;
|
||||||
other.mData=NULL;
|
other.mData=NULL;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@@ -1,7 +1,7 @@
|
|||||||
#ifndef _CONVOLVE_H_
|
#ifndef _CONVOLVE_H_
|
||||||
#define _CONVOLVE_H_
|
#define _CONVOLVE_H_
|
||||||
|
|
||||||
void *convolve_h_alloc(int num);
|
void *convolve_h_alloc(size_t num);
|
||||||
|
|
||||||
int convolve_real(const float *x, int x_len,
|
int convolve_real(const float *x, int x_len,
|
||||||
const float *h, int h_len,
|
const float *h, int h_len,
|
||||||
|
@@ -146,7 +146,7 @@ int base_convolve_complex(const float *x, int x_len,
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* Aligned filter tap allocation */
|
/* Aligned filter tap allocation */
|
||||||
void *convolve_h_alloc(int len)
|
void *convolve_h_alloc(size_t len)
|
||||||
{
|
{
|
||||||
#ifdef HAVE_SSE3
|
#ifdef HAVE_SSE3
|
||||||
return memalign(16, len * 2 * sizeof(float));
|
return memalign(16, len * 2 * sizeof(float));
|
||||||
|
@@ -84,14 +84,13 @@ static Resampler *dnsampler = NULL;
|
|||||||
* perform 16-byte memory alignment required by many SSE instructions.
|
* perform 16-byte memory alignment required by many SSE instructions.
|
||||||
*/
|
*/
|
||||||
struct CorrelationSequence {
|
struct CorrelationSequence {
|
||||||
CorrelationSequence() : sequence(NULL), buffer(NULL)
|
CorrelationSequence() : sequence(NULL)
|
||||||
{
|
{
|
||||||
}
|
}
|
||||||
|
|
||||||
~CorrelationSequence()
|
~CorrelationSequence()
|
||||||
{
|
{
|
||||||
delete sequence;
|
delete sequence;
|
||||||
free(buffer);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
signalVector *sequence;
|
signalVector *sequence;
|
||||||
@@ -106,8 +105,7 @@ struct CorrelationSequence {
|
|||||||
* for SSE instructions.
|
* for SSE instructions.
|
||||||
*/
|
*/
|
||||||
struct PulseSequence {
|
struct PulseSequence {
|
||||||
PulseSequence() : c0(NULL), c1(NULL), c0_inv(NULL), empty(NULL),
|
PulseSequence() : c0(NULL), c1(NULL), c0_inv(NULL), empty(NULL)
|
||||||
c0_buffer(NULL), c1_buffer(NULL), c0_inv_buffer(NULL)
|
|
||||||
{
|
{
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -117,17 +115,12 @@ struct PulseSequence {
|
|||||||
delete c1;
|
delete c1;
|
||||||
delete c0_inv;
|
delete c0_inv;
|
||||||
delete empty;
|
delete empty;
|
||||||
free(c0_buffer);
|
|
||||||
free(c1_buffer);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
signalVector *c0;
|
signalVector *c0;
|
||||||
signalVector *c1;
|
signalVector *c1;
|
||||||
signalVector *c0_inv;
|
signalVector *c0_inv;
|
||||||
signalVector *empty;
|
signalVector *empty;
|
||||||
void *c0_buffer;
|
|
||||||
void *c1_buffer;
|
|
||||||
void *c0_inv_buffer;
|
|
||||||
};
|
};
|
||||||
|
|
||||||
static CorrelationSequence *gMidambles[] = {NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL};
|
static CorrelationSequence *gMidambles[] = {NULL,NULL,NULL,NULL,NULL,NULL,NULL,NULL};
|
||||||
@@ -340,7 +333,7 @@ static signalVector *convolve(const signalVector *x, const signalVector *h,
|
|||||||
if (y && (len > y->size()))
|
if (y && (len > y->size()))
|
||||||
return NULL;
|
return NULL;
|
||||||
if (!y) {
|
if (!y) {
|
||||||
y = new signalVector(len);
|
y = new signalVector(len, convolve_h_alloc, free);
|
||||||
alloc = true;
|
alloc = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -403,8 +396,7 @@ static bool generateInvertC0Pulse(PulseSequence *pulse)
|
|||||||
if (!pulse)
|
if (!pulse)
|
||||||
return false;
|
return false;
|
||||||
|
|
||||||
pulse->c0_inv_buffer = convolve_h_alloc(5);
|
pulse->c0_inv = new signalVector((complex *) convolve_h_alloc(5), 0, 5, convolve_h_alloc, free);
|
||||||
pulse->c0_inv = new signalVector((complex *) pulse->c0_inv_buffer, 0, 5);
|
|
||||||
pulse->c0_inv->isReal(true);
|
pulse->c0_inv->isReal(true);
|
||||||
pulse->c0_inv->setAligned(false);
|
pulse->c0_inv->setAligned(false);
|
||||||
|
|
||||||
@@ -433,9 +425,7 @@ static bool generateC1Pulse(int sps, PulseSequence *pulse)
|
|||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
pulse->c1_buffer = convolve_h_alloc(len);
|
pulse->c1 = new signalVector((complex *) convolve_h_alloc(len), 0, len, convolve_h_alloc, free);
|
||||||
pulse->c1 = new signalVector((complex *)
|
|
||||||
pulse->c1_buffer, 0, len);
|
|
||||||
pulse->c1->isReal(true);
|
pulse->c1->isReal(true);
|
||||||
|
|
||||||
/* Enable alignment for SSE usage */
|
/* Enable alignment for SSE usage */
|
||||||
@@ -489,8 +479,7 @@ static PulseSequence *generateGSMPulse(int sps)
|
|||||||
len = 4;
|
len = 4;
|
||||||
}
|
}
|
||||||
|
|
||||||
pulse->c0_buffer = convolve_h_alloc(len);
|
pulse->c0 = new signalVector((complex *) convolve_h_alloc(len), 0, len, convolve_h_alloc, free);
|
||||||
pulse->c0 = new signalVector((complex *) pulse->c0_buffer, 0, len);
|
|
||||||
pulse->c0->isReal(true);
|
pulse->c0->isReal(true);
|
||||||
|
|
||||||
/* Enable alingnment for SSE usage */
|
/* Enable alingnment for SSE usage */
|
||||||
@@ -1019,7 +1008,7 @@ static void generateDelayFilters()
|
|||||||
|
|
||||||
for (int i = 0; i < DELAYFILTS; i++) {
|
for (int i = 0; i < DELAYFILTS; i++) {
|
||||||
data = (complex *) convolve_h_alloc(h_len);
|
data = (complex *) convolve_h_alloc(h_len);
|
||||||
h = new signalVector(data, 0, h_len);
|
h = new signalVector(data, 0, h_len, convolve_h_alloc, free);
|
||||||
h->setAligned(true);
|
h->setAligned(true);
|
||||||
h->isReal(true);
|
h->isReal(true);
|
||||||
|
|
||||||
@@ -1263,7 +1252,7 @@ static bool generateMidamble(int sps, int tsc)
|
|||||||
|
|
||||||
/* For SSE alignment, reallocate the midamble sequence on 16-byte boundary */
|
/* For SSE alignment, reallocate the midamble sequence on 16-byte boundary */
|
||||||
data = (complex *) convolve_h_alloc(midMidamble->size());
|
data = (complex *) convolve_h_alloc(midMidamble->size());
|
||||||
_midMidamble = new signalVector(data, 0, midMidamble->size());
|
_midMidamble = new signalVector(data, 0, midMidamble->size(), convolve_h_alloc, free);
|
||||||
_midMidamble->setAligned(true);
|
_midMidamble->setAligned(true);
|
||||||
midMidamble->copyTo(*_midMidamble);
|
midMidamble->copyTo(*_midMidamble);
|
||||||
|
|
||||||
@@ -1274,7 +1263,6 @@ static bool generateMidamble(int sps, int tsc)
|
|||||||
}
|
}
|
||||||
|
|
||||||
gMidambles[tsc] = new CorrelationSequence;
|
gMidambles[tsc] = new CorrelationSequence;
|
||||||
gMidambles[tsc]->buffer = data;
|
|
||||||
gMidambles[tsc]->sequence = _midMidamble;
|
gMidambles[tsc]->sequence = _midMidamble;
|
||||||
gMidambles[tsc]->gain = peakDetect(*autocorr, &toa, NULL);
|
gMidambles[tsc]->gain = peakDetect(*autocorr, &toa, NULL);
|
||||||
|
|
||||||
@@ -1319,13 +1307,12 @@ static CorrelationSequence *generateEdgeMidamble(int tsc)
|
|||||||
conjugateVector(*midamble);
|
conjugateVector(*midamble);
|
||||||
|
|
||||||
data = (complex *) convolve_h_alloc(midamble->size());
|
data = (complex *) convolve_h_alloc(midamble->size());
|
||||||
_midamble = new signalVector(data, 0, midamble->size());
|
_midamble = new signalVector(data, 0, midamble->size(), convolve_h_alloc, free);
|
||||||
_midamble->setAligned(true);
|
_midamble->setAligned(true);
|
||||||
midamble->copyTo(*_midamble);
|
midamble->copyTo(*_midamble);
|
||||||
|
|
||||||
/* Channel gain is an empirically measured value */
|
/* Channel gain is an empirically measured value */
|
||||||
seq = new CorrelationSequence;
|
seq = new CorrelationSequence;
|
||||||
seq->buffer = data;
|
|
||||||
seq->sequence = _midamble;
|
seq->sequence = _midamble;
|
||||||
seq->gain = Complex<float>(-19.6432, 19.5006) / 1.18;
|
seq->gain = Complex<float>(-19.6432, 19.5006) / 1.18;
|
||||||
seq->toa = 0;
|
seq->toa = 0;
|
||||||
@@ -1360,7 +1347,7 @@ static bool generateRACHSequence(CorrelationSequence **seq, const BitVector &bv,
|
|||||||
|
|
||||||
/* For SSE alignment, reallocate the midamble sequence on 16-byte boundary */
|
/* For SSE alignment, reallocate the midamble sequence on 16-byte boundary */
|
||||||
data = (complex *) convolve_h_alloc(seq1->size());
|
data = (complex *) convolve_h_alloc(seq1->size());
|
||||||
_seq1 = new signalVector(data, 0, seq1->size());
|
_seq1 = new signalVector(data, 0, seq1->size(), convolve_h_alloc, free);
|
||||||
_seq1->setAligned(true);
|
_seq1->setAligned(true);
|
||||||
seq1->copyTo(*_seq1);
|
seq1->copyTo(*_seq1);
|
||||||
|
|
||||||
@@ -1372,7 +1359,6 @@ static bool generateRACHSequence(CorrelationSequence **seq, const BitVector &bv,
|
|||||||
|
|
||||||
*seq = new CorrelationSequence;
|
*seq = new CorrelationSequence;
|
||||||
(*seq)->sequence = _seq1;
|
(*seq)->sequence = _seq1;
|
||||||
(*seq)->buffer = data;
|
|
||||||
(*seq)->gain = peakDetect(*autocorr, &toa, NULL);
|
(*seq)->gain = peakDetect(*autocorr, &toa, NULL);
|
||||||
|
|
||||||
/* For 1 sps only
|
/* For 1 sps only
|
||||||
|
@@ -1,20 +1,20 @@
|
|||||||
#include "signalVector.h"
|
#include "signalVector.h"
|
||||||
|
|
||||||
signalVector::signalVector(size_t size)
|
signalVector::signalVector(size_t size, vector_alloc_func wAllocFunc, vector_free_func wFreeFunc)
|
||||||
: Vector<complex>(size),
|
: Vector<complex>(size, wAllocFunc, wFreeFunc),
|
||||||
real(false), aligned(false), symmetry(NONE)
|
real(false), aligned(false), symmetry(NONE)
|
||||||
{
|
{
|
||||||
}
|
}
|
||||||
|
|
||||||
signalVector::signalVector(size_t size, size_t start)
|
signalVector::signalVector(size_t size, size_t start, vector_alloc_func wAllocFunc, vector_free_func wFreeFunc)
|
||||||
: Vector<complex>(size + start),
|
: Vector<complex>(size + start, wAllocFunc, wFreeFunc),
|
||||||
real(false), aligned(false), symmetry(NONE)
|
real(false), aligned(false), symmetry(NONE)
|
||||||
{
|
{
|
||||||
mStart = mData + start;
|
mStart = mData + start;
|
||||||
}
|
}
|
||||||
|
|
||||||
signalVector::signalVector(complex *data, size_t start, size_t span)
|
signalVector::signalVector(complex *data, size_t start, size_t span, vector_alloc_func wAllocFunc, vector_free_func wFreeFunc)
|
||||||
: Vector<complex>(NULL, data + start, data + start + span),
|
: Vector<complex>(data, data + start, data + start + span, wAllocFunc, wFreeFunc),
|
||||||
real(false), aligned(false), symmetry(NONE)
|
real(false), aligned(false), symmetry(NONE)
|
||||||
{
|
{
|
||||||
}
|
}
|
||||||
|
@@ -13,13 +13,13 @@ enum Symmetry {
|
|||||||
class signalVector: public Vector<complex> {
|
class signalVector: public Vector<complex> {
|
||||||
public:
|
public:
|
||||||
/** Default constructor */
|
/** Default constructor */
|
||||||
signalVector(size_t size = 0);
|
signalVector(size_t size = 0, vector_alloc_func wAllocFunc = NULL, vector_free_func wFreeFunc = NULL);
|
||||||
|
|
||||||
/** Construct with head room */
|
/** Construct with head room */
|
||||||
signalVector(size_t size, size_t start);
|
signalVector(size_t size, size_t start, vector_alloc_func wAllocFunc = NULL, vector_free_func wFreeFunc = NULL);
|
||||||
|
|
||||||
/** Construct from existing buffer data (buffer not managed) */
|
/** Construct from existing buffer data (buffer not managed) */
|
||||||
signalVector(complex *data, size_t start, size_t span);
|
signalVector(complex *data, size_t start, size_t span, vector_alloc_func wAllocFunc = NULL, vector_free_func wFreeFunc = NULL);
|
||||||
|
|
||||||
/** Construct by from existing vector */
|
/** Construct by from existing vector */
|
||||||
signalVector(const signalVector &vector);
|
signalVector(const signalVector &vector);
|
||||||
|
Reference in New Issue
Block a user