mirror of
https://git.postgresql.org/git/postgresql.git
synced 2025-01-12 18:34:36 +08:00
Improve memory space management in tuplesort and tuplestore.
The code originally just doubled the size of the tuple-pointer array so long as that would fit in allowedMem. This could result in failing to use as much as half of allowedMem, if (as is typical) the last doubling attempt didn't quite fit. Worse, we might double the array size but be unable to use most of the added slots, because there was no room left within the allowedMem limit for tuples the slots should point to. To fix, double only so long as we've used less than half of allowedMem in total. Then do one more array enlargement, but scale it based on total memory consumption so far. This will work nicely as long as the average tuple size is reasonably stable, and in any case should be better than the old method. This change will result in large sort operations consuming a larger fraction of work_mem than they typically did in the past. The release notes should mention that users may want to revisit their work_mem settings, if they'd tuned those settings based on the old behavior of sorting. Jeff Janes, reviewed by Peter Geoghegan and Robert Haas
This commit is contained in:
parent
1296d5c53c
commit
8ae35e9180
@ -276,6 +276,7 @@ struct Tuplesortstate
|
||||
SortTuple *memtuples; /* array of SortTuple structs */
|
||||
int memtupcount; /* number of tuples currently present */
|
||||
int memtupsize; /* allocated length of memtuples array */
|
||||
bool growmemtuples; /* memtuples' growth still underway? */
|
||||
|
||||
/*
|
||||
* While building initial runs, this is the current output run number
|
||||
@ -570,6 +571,7 @@ tuplesort_begin_common(int workMem, bool randomAccess)
|
||||
|
||||
state->memtupcount = 0;
|
||||
state->memtupsize = 1024; /* initial guess */
|
||||
state->growmemtuples = true;
|
||||
state->memtuples = (SortTuple *) palloc(state->memtupsize * sizeof(SortTuple));
|
||||
|
||||
USEMEM(state, GetMemoryChunkSpace(state->memtuples));
|
||||
@ -955,37 +957,110 @@ tuplesort_end(Tuplesortstate *state)
|
||||
|
||||
/*
|
||||
* Grow the memtuples[] array, if possible within our memory constraint.
|
||||
* Return TRUE if able to enlarge the array, FALSE if not.
|
||||
* Return TRUE if we were able to enlarge the array, FALSE if not.
|
||||
*
|
||||
* At each increment we double the size of the array. When we are short
|
||||
* on memory we could consider smaller increases, but because availMem
|
||||
* moves around with tuple addition/removal, this might result in thrashing.
|
||||
* Small increases in the array size are likely to be pretty inefficient.
|
||||
* Normally, at each increment we double the size of the array. When we no
|
||||
* longer have enough memory to do that, we attempt one last, smaller increase
|
||||
* (and then clear the growmemtuples flag so we don't try any more). That
|
||||
* allows us to use allowedMem as fully as possible; sticking to the pure
|
||||
* doubling rule could result in almost half of allowedMem going unused.
|
||||
* Because availMem moves around with tuple addition/removal, we need some
|
||||
* rule to prevent making repeated small increases in memtupsize, which would
|
||||
* just be useless thrashing. The growmemtuples flag accomplishes that and
|
||||
* also prevents useless recalculations in this function.
|
||||
*/
|
||||
static bool
|
||||
grow_memtuples(Tuplesortstate *state)
|
||||
{
|
||||
int newmemtupsize;
|
||||
int memtupsize = state->memtupsize;
|
||||
long memNowUsed = state->allowedMem - state->availMem;
|
||||
|
||||
/* Forget it if we've already maxed out memtuples, per comment above */
|
||||
if (!state->growmemtuples)
|
||||
return false;
|
||||
|
||||
/* Select new value of memtupsize */
|
||||
if (memNowUsed <= state->availMem)
|
||||
{
|
||||
/*
|
||||
* It is surely safe to double memtupsize if we've used no more than
|
||||
* half of allowedMem.
|
||||
*
|
||||
* Note: it might seem that we need to worry about memtupsize * 2
|
||||
* overflowing an int, but the MaxAllocSize clamp applied below
|
||||
* ensures the existing memtupsize can't be large enough for that.
|
||||
*/
|
||||
newmemtupsize = memtupsize * 2;
|
||||
}
|
||||
else
|
||||
{
|
||||
/*
|
||||
* This will be the last increment of memtupsize. Abandon doubling
|
||||
* strategy and instead increase as much as we safely can.
|
||||
*
|
||||
* To stay within allowedMem, we can't increase memtupsize by more
|
||||
* than availMem / sizeof(SortTuple) elements. In practice, we want
|
||||
* to increase it by considerably less, because we need to leave some
|
||||
* space for the tuples to which the new array slots will refer. We
|
||||
* assume the new tuples will be about the same size as the tuples
|
||||
* we've already seen, and thus we can extrapolate from the space
|
||||
* consumption so far to estimate an appropriate new size for the
|
||||
* memtuples array. The optimal value might be higher or lower than
|
||||
* this estimate, but it's hard to know that in advance.
|
||||
*
|
||||
* This calculation is safe against enlarging the array so much that
|
||||
* LACKMEM becomes true, because the memory currently used includes
|
||||
* the present array; thus, there would be enough allowedMem for the
|
||||
* new array elements even if no other memory were currently used.
|
||||
*
|
||||
* We do the arithmetic in float8, because otherwise the product of
|
||||
* memtupsize and allowedMem could overflow. (A little algebra shows
|
||||
* that grow_ratio must be less than 2 here, so we are not risking
|
||||
* integer overflow this way.) Any inaccuracy in the result should be
|
||||
* insignificant; but even if we computed a completely insane result,
|
||||
* the checks below will prevent anything really bad from happening.
|
||||
*/
|
||||
double grow_ratio;
|
||||
|
||||
grow_ratio = (double) state->allowedMem / (double) memNowUsed;
|
||||
newmemtupsize = (int) (memtupsize * grow_ratio);
|
||||
|
||||
/* We won't make any further enlargement attempts */
|
||||
state->growmemtuples = false;
|
||||
}
|
||||
|
||||
/* Must enlarge array by at least one element, else report failure */
|
||||
if (newmemtupsize <= memtupsize)
|
||||
goto noalloc;
|
||||
|
||||
/*
|
||||
* On a 64-bit machine, allowedMem could be more than MaxAllocSize. Clamp
|
||||
* to ensure our request won't be rejected by palloc.
|
||||
*/
|
||||
if ((Size) newmemtupsize >= MaxAllocSize / sizeof(SortTuple))
|
||||
{
|
||||
newmemtupsize = (int) (MaxAllocSize / sizeof(SortTuple));
|
||||
state->growmemtuples = false; /* can't grow any more */
|
||||
}
|
||||
|
||||
/*
|
||||
* We need to be sure that we do not cause LACKMEM to become true, else
|
||||
* the space management algorithm will go nuts. We assume here that the
|
||||
* memory chunk overhead associated with the memtuples array is constant
|
||||
* and so there will be no unexpected addition to what we ask for. (The
|
||||
* minimum array size established in tuplesort_begin_common is large
|
||||
* enough to force palloc to treat it as a separate chunk, so this
|
||||
* assumption should be good. But let's check it.)
|
||||
* the space management algorithm will go nuts. The code above should
|
||||
* never generate a dangerous request, but to be safe, check explicitly
|
||||
* that the array growth fits within availMem. (We could still cause
|
||||
* LACKMEM if the memory chunk overhead associated with the memtuples
|
||||
* array were to increase. That shouldn't happen with any sane value of
|
||||
* allowedMem, because at any array size large enough to risk LACKMEM,
|
||||
* palloc would be treating both old and new arrays as separate chunks.
|
||||
* But we'll check LACKMEM explicitly below just in case.)
|
||||
*/
|
||||
if (state->availMem <= (long) (state->memtupsize * sizeof(SortTuple)))
|
||||
return false;
|
||||
|
||||
/*
|
||||
* On a 64-bit machine, allowedMem could be high enough to get us into
|
||||
* trouble with MaxAllocSize, too.
|
||||
*/
|
||||
if ((Size) (state->memtupsize * 2) >= MaxAllocSize / sizeof(SortTuple))
|
||||
return false;
|
||||
if (state->availMem < (long) ((newmemtupsize - memtupsize) * sizeof(SortTuple)))
|
||||
goto noalloc;
|
||||
|
||||
/* OK, do it */
|
||||
FREEMEM(state, GetMemoryChunkSpace(state->memtuples));
|
||||
state->memtupsize *= 2;
|
||||
state->memtupsize = newmemtupsize;
|
||||
state->memtuples = (SortTuple *)
|
||||
repalloc(state->memtuples,
|
||||
state->memtupsize * sizeof(SortTuple));
|
||||
@ -993,6 +1068,11 @@ grow_memtuples(Tuplesortstate *state)
|
||||
if (LACKMEM(state))
|
||||
elog(ERROR, "unexpected out-of-memory situation during sort");
|
||||
return true;
|
||||
|
||||
noalloc:
|
||||
/* If for any reason we didn't realloc, shut off future attempts */
|
||||
state->growmemtuples = false;
|
||||
return false;
|
||||
}
|
||||
|
||||
/*
|
||||
|
@ -105,6 +105,7 @@ struct Tuplestorestate
|
||||
bool interXact; /* keep open through transactions? */
|
||||
bool truncated; /* tuplestore_trim has removed tuples? */
|
||||
long availMem; /* remaining memory available, in bytes */
|
||||
long allowedMem; /* total memory allowed, in bytes */
|
||||
BufFile *myfile; /* underlying file, or NULL if none */
|
||||
MemoryContext context; /* memory context for holding tuples */
|
||||
ResourceOwner resowner; /* resowner for holding temp files */
|
||||
@ -156,6 +157,7 @@ struct Tuplestorestate
|
||||
int memtupdeleted; /* the first N slots are currently unused */
|
||||
int memtupcount; /* number of tuples currently present */
|
||||
int memtupsize; /* allocated length of memtuples array */
|
||||
bool growmemtuples; /* memtuples' growth still underway? */
|
||||
|
||||
/*
|
||||
* These variables are used to keep track of the current positions.
|
||||
@ -254,7 +256,8 @@ tuplestore_begin_common(int eflags, bool interXact, int maxKBytes)
|
||||
state->eflags = eflags;
|
||||
state->interXact = interXact;
|
||||
state->truncated = false;
|
||||
state->availMem = maxKBytes * 1024L;
|
||||
state->allowedMem = maxKBytes * 1024L;
|
||||
state->availMem = state->allowedMem;
|
||||
state->myfile = NULL;
|
||||
state->context = CurrentMemoryContext;
|
||||
state->resowner = CurrentResourceOwner;
|
||||
@ -262,6 +265,7 @@ tuplestore_begin_common(int eflags, bool interXact, int maxKBytes)
|
||||
state->memtupdeleted = 0;
|
||||
state->memtupcount = 0;
|
||||
state->memtupsize = 1024; /* initial guess */
|
||||
state->growmemtuples = true;
|
||||
state->memtuples = (void **) palloc(state->memtupsize * sizeof(void *));
|
||||
|
||||
USEMEM(state, GetMemoryChunkSpace(state->memtuples));
|
||||
@ -526,6 +530,126 @@ tuplestore_ateof(Tuplestorestate *state)
|
||||
return state->readptrs[state->activeptr].eof_reached;
|
||||
}
|
||||
|
||||
/*
|
||||
* Grow the memtuples[] array, if possible within our memory constraint.
|
||||
* Return TRUE if we were able to enlarge the array, FALSE if not.
|
||||
*
|
||||
* Normally, at each increment we double the size of the array. When we no
|
||||
* longer have enough memory to do that, we attempt one last, smaller increase
|
||||
* (and then clear the growmemtuples flag so we don't try any more). That
|
||||
* allows us to use allowedMem as fully as possible; sticking to the pure
|
||||
* doubling rule could result in almost half of allowedMem going unused.
|
||||
* Because availMem moves around with tuple addition/removal, we need some
|
||||
* rule to prevent making repeated small increases in memtupsize, which would
|
||||
* just be useless thrashing. The growmemtuples flag accomplishes that and
|
||||
* also prevents useless recalculations in this function.
|
||||
*/
|
||||
static bool
|
||||
grow_memtuples(Tuplestorestate *state)
|
||||
{
|
||||
int newmemtupsize;
|
||||
int memtupsize = state->memtupsize;
|
||||
long memNowUsed = state->allowedMem - state->availMem;
|
||||
|
||||
/* Forget it if we've already maxed out memtuples, per comment above */
|
||||
if (!state->growmemtuples)
|
||||
return false;
|
||||
|
||||
/* Select new value of memtupsize */
|
||||
if (memNowUsed <= state->availMem)
|
||||
{
|
||||
/*
|
||||
* It is surely safe to double memtupsize if we've used no more than
|
||||
* half of allowedMem.
|
||||
*
|
||||
* Note: it might seem that we need to worry about memtupsize * 2
|
||||
* overflowing an int, but the MaxAllocSize clamp applied below
|
||||
* ensures the existing memtupsize can't be large enough for that.
|
||||
*/
|
||||
newmemtupsize = memtupsize * 2;
|
||||
}
|
||||
else
|
||||
{
|
||||
/*
|
||||
* This will be the last increment of memtupsize. Abandon doubling
|
||||
* strategy and instead increase as much as we safely can.
|
||||
*
|
||||
* To stay within allowedMem, we can't increase memtupsize by more
|
||||
* than availMem / sizeof(void *) elements. In practice, we want
|
||||
* to increase it by considerably less, because we need to leave some
|
||||
* space for the tuples to which the new array slots will refer. We
|
||||
* assume the new tuples will be about the same size as the tuples
|
||||
* we've already seen, and thus we can extrapolate from the space
|
||||
* consumption so far to estimate an appropriate new size for the
|
||||
* memtuples array. The optimal value might be higher or lower than
|
||||
* this estimate, but it's hard to know that in advance.
|
||||
*
|
||||
* This calculation is safe against enlarging the array so much that
|
||||
* LACKMEM becomes true, because the memory currently used includes
|
||||
* the present array; thus, there would be enough allowedMem for the
|
||||
* new array elements even if no other memory were currently used.
|
||||
*
|
||||
* We do the arithmetic in float8, because otherwise the product of
|
||||
* memtupsize and allowedMem could overflow. (A little algebra shows
|
||||
* that grow_ratio must be less than 2 here, so we are not risking
|
||||
* integer overflow this way.) Any inaccuracy in the result should be
|
||||
* insignificant; but even if we computed a completely insane result,
|
||||
* the checks below will prevent anything really bad from happening.
|
||||
*/
|
||||
double grow_ratio;
|
||||
|
||||
grow_ratio = (double) state->allowedMem / (double) memNowUsed;
|
||||
newmemtupsize = (int) (memtupsize * grow_ratio);
|
||||
|
||||
/* We won't make any further enlargement attempts */
|
||||
state->growmemtuples = false;
|
||||
}
|
||||
|
||||
/* Must enlarge array by at least one element, else report failure */
|
||||
if (newmemtupsize <= memtupsize)
|
||||
goto noalloc;
|
||||
|
||||
/*
|
||||
* On a 64-bit machine, allowedMem could be more than MaxAllocSize. Clamp
|
||||
* to ensure our request won't be rejected by palloc.
|
||||
*/
|
||||
if ((Size) newmemtupsize >= MaxAllocSize / sizeof(void *))
|
||||
{
|
||||
newmemtupsize = (int) (MaxAllocSize / sizeof(void *));
|
||||
state->growmemtuples = false; /* can't grow any more */
|
||||
}
|
||||
|
||||
/*
|
||||
* We need to be sure that we do not cause LACKMEM to become true, else
|
||||
* the space management algorithm will go nuts. The code above should
|
||||
* never generate a dangerous request, but to be safe, check explicitly
|
||||
* that the array growth fits within availMem. (We could still cause
|
||||
* LACKMEM if the memory chunk overhead associated with the memtuples
|
||||
* array were to increase. That shouldn't happen with any sane value of
|
||||
* allowedMem, because at any array size large enough to risk LACKMEM,
|
||||
* palloc would be treating both old and new arrays as separate chunks.
|
||||
* But we'll check LACKMEM explicitly below just in case.)
|
||||
*/
|
||||
if (state->availMem < (long) ((newmemtupsize - memtupsize) * sizeof(void *)))
|
||||
goto noalloc;
|
||||
|
||||
/* OK, do it */
|
||||
FREEMEM(state, GetMemoryChunkSpace(state->memtuples));
|
||||
state->memtupsize = newmemtupsize;
|
||||
state->memtuples = (void **)
|
||||
repalloc(state->memtuples,
|
||||
state->memtupsize * sizeof(void *));
|
||||
USEMEM(state, GetMemoryChunkSpace(state->memtuples));
|
||||
if (LACKMEM(state))
|
||||
elog(ERROR, "unexpected out-of-memory situation during sort");
|
||||
return true;
|
||||
|
||||
noalloc:
|
||||
/* If for any reason we didn't realloc, shut off future attempts */
|
||||
state->growmemtuples = false;
|
||||
return false;
|
||||
}
|
||||
|
||||
/*
|
||||
* Accept one tuple and append it to the tuplestore.
|
||||
*
|
||||
@ -631,20 +755,8 @@ tuplestore_puttuple_common(Tuplestorestate *state, void *tuple)
|
||||
*/
|
||||
if (state->memtupcount >= state->memtupsize - 1)
|
||||
{
|
||||
/*
|
||||
* See grow_memtuples() in tuplesort.c for the rationale
|
||||
* behind these two tests.
|
||||
*/
|
||||
if (state->availMem > (long) (state->memtupsize * sizeof(void *)) &&
|
||||
(Size) (state->memtupsize * 2) < MaxAllocSize / sizeof(void *))
|
||||
{
|
||||
FREEMEM(state, GetMemoryChunkSpace(state->memtuples));
|
||||
state->memtupsize *= 2;
|
||||
state->memtuples = (void **)
|
||||
repalloc(state->memtuples,
|
||||
state->memtupsize * sizeof(void *));
|
||||
USEMEM(state, GetMemoryChunkSpace(state->memtuples));
|
||||
}
|
||||
(void) grow_memtuples(state);
|
||||
Assert(state->memtupcount < state->memtupsize);
|
||||
}
|
||||
|
||||
/* Stash the tuple in the in-memory array */
|
||||
|
Loading…
Reference in New Issue
Block a user