From cab5ee1ba616020312107cad192f131ffed7e541 Mon Sep 17 00:00:00 2001 From: Rika Ichinose Date: Sun, 9 Jun 2024 21:47:03 +0300 Subject: [PATCH] heap.inc with incremental formatting and instant recycling of fixed chunks. --- rtl/inc/heap.inc | 2929 +++++++++++++++++++++++---------------------- rtl/inc/heaph.inc | 6 +- 2 files changed, 1491 insertions(+), 1444 deletions(-) diff --git a/rtl/inc/heap.inc b/rtl/inc/heap.inc index 0d98c577ea..e9c5c832ea 100644 --- a/rtl/inc/heap.inc +++ b/rtl/inc/heap.inc @@ -18,7 +18,7 @@ { $define HAS_MEMORYMANAGER} { Memory manager } -{$ifndef FPC_NO_DEFAULT_MEMORYMANAGER} +{$if not defined(FPC_NO_DEFAULT_MEMORYMANAGER)} const MemoryManager: TMemoryManager = ( NeedLock: false; // Obsolete @@ -34,8 +34,7 @@ const GetHeapStatus: {$ifndef FPC_NO_DEFAULT_HEAP}@SysGetHeapStatus{$else}nil{$endif}; GetFPCHeapStatus: {$ifndef FPC_NO_DEFAULT_HEAP}@SysGetFPCHeapStatus{$else}nil{$endif}; ); -{$else not FPC_NO_DEFAULT_MEMORYMANAGER} -{$ifndef FPC_IN_HEAPMGR} +{$elseif not defined(FPC_IN_HEAPMGR)} const MemoryManager: TMemoryManager = ( NeedLock: false; // Obsolete @@ -52,201 +51,12 @@ const GetFPCHeapStatus: nil; );public name 'FPC_SYSTEM_MEMORYMANAGER'; {$endif FPC_IN_HEAPMGR} -{$endif not FPC_NO_DEFAULT_MEMORYMANAGER} { Try to find the best matching block in general freelist } { define BESTMATCH} -{ DEBUG: Dump info when the heap needs to grow } -{ define DUMPGROW} - -{ define DEBUG_SYSOSREALLOC} - -{ Memory profiling: at moment in time of max heap size usage, - keep statistics of number of each size allocated - (with 16 byte granularity) } -{ define DUMP_MEM_USAGE} - -{$ifdef DUMP_MEM_USAGE} - {$define SHOW_MEM_USAGE} -{$endif} - {$ifndef FPC_NO_DEFAULT_MEMORYMANAGER} -const -{$ifdef CPU64} - blocksize = 32; { at least size of freerecord } - blockshift = 5; { shr value for blocksize=2^blockshift} - maxblocksize = 512+blocksize; { 1024+8 needed for heaprecord } -{$else} - blocksize = 16; { at least size of freerecord } - blockshift = 4; { shr value for blocksize=2^blockshift} - maxblocksize = 512+blocksize; { 1024+8 needed for heaprecord } -{$endif} - maxblockindex = maxblocksize div blocksize; { highest index in array of lists of memchunks } - - { common flags } - fixedsizeflag = 1; { flag if the block is of fixed size } - { memchunk var flags } - usedflag = 2; { flag if the block is used or not } - lastblockflag = 4; { flag if the block is the last in os chunk } - firstblockflag = 8; { flag if the block is the first in os chunk } - { os chunk flags } - ocrecycleflag = 1; - { above flags stored in size field } - sizemask = not(blocksize-1); - fixedoffsetshift = 12; - fixedsizemask = sizemask and ((1 shl fixedoffsetshift) - 1); - { After how many successive allocations of oschunks for fixed freelist - purposes should we double the size of locgrowheapsizesmall for the - current thread. Since the allocations of oschunks are added together for - all blocksizes, this is only a fuzzy indication of when the size will be - doubled rather than a hard and fast boundary. } - fixedallocthreshold = (maxblocksize shr blockshift) * 8; - { maximum size to which locgrowheapsizesmall can grow } - maxgrowheapsizesmall = 256*1024; - -{****************************************************************************} - -{$ifdef DUMPGROW} - {$define DUMPBLOCKS} -{$endif} - -{ - We use 'fixed' size chunks for small allocations, - and os chunks with variable sized blocks for big - allocations. - - * a block is an area allocated by user - * a chunk is a block plus our bookkeeping - * an os chunk is a collection of chunks - - Memory layout: - fixed: < chunk size > [ ... user data ... ] - variable: < prev chunk size > < chunk size > [ ... user data ... ] - - When all chunks in an os chunk are free, we keep a few around - but otherwise it will be freed to the OS. - - Fixed os chunks can be converted to variable os chunks and back - (if not too big). To prevent repeated conversion overhead in case - of user freeing/allocing same or a small set of sizes, we only do - the conversion to the new fixed os chunk size format after we - reuse the os chunk for another fixed size, or variable. Note that - while the fixed size os chunk is on the freelists.oslist, it is also - still present in a freelists.fixedlists, therefore we can easily remove - the os chunk from the freelists.oslist if this size is needed again; we - don't need to search freelists.oslist in alloc_oschunk, since it won't - be present anymore if alloc_oschunk is reached. Note that removing - from the freelists.oslist is not really done, only the recycleflag is - set, allowing to reset the flag easily. alloc_oschunk will clean up - the list while passing over it, that was a slow function anyway. -} - -type - pfreelists = ^tfreelists; - - poschunk = ^toschunk; - toschunk = record - size : 0..high(ptrint); {Cannot be ptruint because used field is signed.} - next_free : poschunk; - prev_any : poschunk; - next_any : poschunk; - used : ptrint; { 0: free, >0: fixed, -1: var } - freelists : pfreelists; - { padding inserted automatically by alloc_oschunk } - end; - - ppmemchunk_fixed = ^pmemchunk_fixed; - pmemchunk_fixed = ^tmemchunk_fixed; - tmemchunk_fixed = record - { aligning is done automatically in alloc_oschunk } - size : ptruint; - next_fixed, - prev_fixed : pmemchunk_fixed; - end; - - ppmemchunk_var = ^pmemchunk_var; - pmemchunk_var = ^tmemchunk_var; - tmemchunk_var = record - prevsize : ptruint; - freelists : pfreelists; - size : ptruint; - next_var, - prev_var : pmemchunk_var; - end; - - { ``header'', ie. size of structure valid when chunk is in use } - { should correspond to tmemchunk_var_hdr structure starting with the - last field. Reason is that the overlap is starting from the end of the - record. } - tmemchunk_fixed_hdr = record - { aligning is done automatically in alloc_oschunk } - size : ptruint; - end; - tmemchunk_var_hdr = record - prevsize : ptruint; - freelists : pfreelists; - size : ptruint; - end; - - pfpcheapstatus = ^tfpcheapstatus; - - tfixedfreelists = array[1..maxblockindex] of pmemchunk_fixed; - - tfreelists = record - oslist : poschunk; { os chunks free, available for use } - fixedlists : tfixedfreelists; - oscount : dword; { number of os chunks on oslist } - { how many oschunks have been allocated in this thread since - the last time we doubled the locgrowheapsizesmall size } - fixedallocated: dword; - { the size of oschunks allocated for fixed allocations in this thread; - initialised on thread creation with the global growheapsizesmall setting } - locgrowheapsizesmall: ptruint; - oslist_all : poschunk; { all os chunks allocated } - varlist : pmemchunk_var; - { chunks waiting to be freed from other thread } - waitfixed : pmemchunk_fixed; - waitvar : pmemchunk_var; - { heap statistics } - internal_status : TFPCHeapStatus; - end; - -const - fixedfirstoffset = ((sizeof(toschunk) + sizeof(tmemchunk_fixed_hdr) + $f) - and not $f) - sizeof(tmemchunk_fixed_hdr); - varfirstoffset = ((sizeof(toschunk) + sizeof(tmemchunk_var_hdr) + $f) - and not $f) - sizeof(tmemchunk_var_hdr); -{$ifdef BESTMATCH} - matcheffort = high(longint); -{$else} - matcheffort = 10; -{$endif} - -var - orphaned_freelists : tfreelists; -{$ifdef FPC_HAS_FEATURE_THREADING} - heap_lock : trtlcriticalsection; - heap_lock_use : integer; -threadvar -{$endif} - freelists : tfreelists; - -{$ifdef DUMP_MEM_USAGE} -const - sizeusageshift = 4; - sizeusageindex = 2049; - sizeusagesize = sizeusageindex shl sizeusageshift; -type - tsizeusagelist = array[0..sizeusageindex] of longint; -{$ifdef FPC_HAS_FEATURE_THREADING} -threadvar -{$else} -var -{$endif} - sizeusage, maxsizeusage: tsizeusagelist; -{$endif} {$endif HAS_MEMORYMANAGER} @@ -268,16 +78,12 @@ end; function IsMemoryManagerSet:Boolean; begin -{$ifdef HAS_MEMORYMANAGER} - Result:=false; -{$else HAS_MEMORYMANAGER} -{$ifdef FPC_NO_DEFAULT_MEMORYMANAGER} +{$if defined(HAS_MEMORYMANAGER) or defined(FPC_NO_DEFAULT_MEMORYMANAGER)} Result:=false; {$else not FPC_NO_DEFAULT_MEMORYMANAGER} IsMemoryManagerSet := (MemoryManager.GetMem<>@SysGetMem) or (MemoryManager.FreeMem<>@SysFreeMem); -{$endif notFPC_NO_DEFAULT_MEMORYMANAGER} -{$endif HAS_MEMORYMANAGER} +{$endif HAS_MEMORYMANAGER or FPC_NO_DEFAULT_MEMORYMANAGER} end; {$ifdef FPC_HAS_FEATURE_HEAP} @@ -374,1192 +180,1510 @@ end; {$if defined(FPC_HAS_FEATURE_HEAP) or defined(FPC_IN_HEAPMGR)} {$ifndef HAS_MEMORYMANAGER} +{ + We use 'fixed' size chunks for small allocations, + and os chunks with variable sized blocks for big + allocations. -{***************************************************************************** - GetHeapStatus -*****************************************************************************} + * a block is an area allocated by user + * a chunk is a block plus our bookkeeping + * an os chunk is a collection of chunks + + Memory layout: + fixed: < CommonHeader > [ ... user data ... ] + variable: [ VarHeader < CommonHeader > ] [ ... user data ... ] + + When all chunks in an os chunk are free, we keep a few around + but otherwise it will be freed to the OS. +} + +type + HeapInc = object + const + { Alignment requirement for blocks. All fixed sizes (among other things) are assumed to be divisible. } + Alignment = 2 * sizeof(pointer); + + { Fixed chunk sizes are: + ┌──── step = 16 ────┐┌─── step = 32 ────┐┌──── step = 48 ───┐┌ step 64 ┐ + 16, 32, 48, 64, 80, 96, 128, 160, 192, 224, 272, 320, 368, 416, 480, 544 + #0 #1 #2 #3 #4 #5 #6 #7 #8 #9 #10 #11 #12 #13 #14 #15 } + MinFixedHeaderAndPayload = 16; + MaxFixedHeaderAndPayload = 544; + FixedSizesCount = 16; + FixedSizes: array[0 .. FixedSizesCount - 1] of uint16 = (16, 32, 48, 64, 80, 96, 128, 160, 192, 224, 272, 320, 368, 416, 480, 544); + SizeMinus1Div16ToIndex: array[0 .. (MaxFixedHeaderAndPayload - 1) div 16] of uint8 = + { 16, 32, 48, 64, 80, 96, 112, 128, 144, 160, 176, 192, 208, 224, 240, 256, 272, 288, 304, 320, 336, 352, 368, 384, 400, 416, 432, 448, 464, 480, 496, 512, 528, 544 } + ( 0, 1, 2, 3, 4, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10, 10, 11, 11, 11, 12, 12, 12, 13, 13, 13, 14, 14, 14, 14, 15, 15, 15, 15); + + class function SizeMinus1ToIndex(sizeMinus1: SizeUint): SizeUint; static; inline; { sizeMinus1 + 1 ≤ MaxFixedHeaderAndPayload } + class function IndexToSize(sizeIndex: SizeUint): SizeUint; static; inline; + + const + OSChunkFixedSizeQuant = 32 * 1024; + OSChunkVarSizeQuant = 64 * 1024; + MaxFixedChunkSize = 256 * 1024; + + { Variable freelist search strategy: -1 = exhaustive search for the best (smallest fitting) match, ≥0 = search this many after the first match. } + MatchEffort = {$ifdef BESTMATCH} -1 {$else} 10 {$endif}; + + { Limit on shrinking variable chunks and keeping the tail when splitting the chunk in AllocVar / TryResizeVar. } + MinVarHeaderAndPayload = MaxFixedHeaderAndPayload * 3 div 4; + + { Adjustable part ends here~ } + + const + SizeIndexBits = 1 + trunc(ln(FixedSizesCount - 1) / ln(2)); + SizeIndexMask = 1 shl SizeIndexBits - 1; + FixedBitPos = {$if SizeIndexBits >= 3} SizeIndexBits {$else} 3 {$endif}; { Variable chunks use 3 low bits for used / first / last. } + FixedFlag = 1 shl FixedBitPos; + ChunkOffsetShift = FixedBitPos + 1; + + { Not really used; MaxFixedChunkSize limit on fixed OS chunks assumed to be strictly enforced and (much!) more restricting than MaxChunkOffset. + MaxFixedChunkSize = 256 Kb. + MaxChunkOffset ~ 2^(32 - 6) ~ 67 Mb. + Indices could be stored instead, but offsets avoid multiplications. } + MaxChunkOffset = High(uint32) shr ChunkOffsetShift; + + UsedFlag = 1 shl 0; + FirstFlag = 1 shl 1; + LastFlag = 1 shl 2; + VarSizeQuant = 1 shl ChunkOffsetShift; {$if VarSizeQuant < Alignment} {$error Assumed to be >= Alignment.} {$endif} + VarSizeMask = SizeUint(-VarSizeQuant); + + type + { Common header of any memory chunk, residing immediately to the left of the ~payload~ (block). + + Fixed chunk header, assuming SizeIndexBits = 4: + h[0:3] = size index (= h and SizeIndexMask) + h[4] = 1 (h and FixedFlag <> 0) + h[5:31] — offset in the OS chunk (= h shr ChunkOffsetShift) + + Variable chunk header, assuming SizeIndexBits = 4: + h[0] = used flag (h and UsedFlag <> 0) + h[1] = first flag (h and FirstFlag <> 0) + h[2] = last flag (h and LastFlag <> 0) + h[3] = unused + h[4] = 0 (h and FixedFlag = 0) + h[5:31] = size, rounded up to 32 (VarSizeQuant), shr 5; in other words, size = h and VarSizeMask. + + If sizeof(SizeUint) > 4: “h and VarSizeMask” is low part of size, high part is stored in VarChunk.sizeHi. } + + pCommonHeader = ^CommonHeader; + CommonHeader = record + h: uint32; + end; + + pThreadState = ^ThreadState; + + { Chunk that has been freed. Reuses the now-uninteresting payload, so payload must always fit its size. + Used for fixed freelists and cross-thread to-free queue. } + pFreeChunk = ^FreeChunk; + FreeChunk = record + next: pFreeChunk; + end; + + pOSChunk = ^OSChunk; + OSChunk = object { Common header for all OS chunks. } + size: SizeUint; { Full size asked from SysOSAlloc. } + {$ifdef FPC_HAS_FEATURE_THREADING} + threadState: pThreadState; { Protected with gs.lock. Nil if orphaned. } + {$endif} + prev, next: pointer; { pOSChunk, but used for different subtypes. } + + { For what purpose this chunk was used the last time. -1 — var, N ≥ 0 — fixed size N. Allows for a small optimization when reusing fixed chunks. } + sizeIndex: SizeInt; + + { Remove from list src and push to list dest. } + procedure MoveTo(var src, dest: pOSChunk); + end; + + pFreeOSChunk = ^FreeOSChunk; + FreeOSChunk = object(OSChunk) + end; + + FreeOSChunkList = object + first, last: pFreeOSChunk; + {$ifdef HAS_SYSOSFREE} + n: SizeUint; + {$endif} + + function Get(minSize, maxSize: SizeUint): pOSChunk; + {$ifdef HAS_SYSOSFREE} + function FreeOne: SizeUint; + procedure FreeAll; + {$endif} + end; + + pFixedOSChunk = ^FixedOSChunk; + FixedOSChunk = object(OSChunk) + { Data starts at FixedOSChunkDataOffset and spans for “maxSize” (virtual value, does not exist directly) bytes, of which: + — first formattedSize are either allocated (“used”; counted in usedSize) or in the freelist (firstFreeChunk; size = formattedSize - usedSize), + — the rest “maxSize” - formattedSize are yet unallocated space. + + This design, together with tracking free chunks per FixedOSChunk rather than per fixed size, trivializes reusing the chunk. + Chopping all available space at once would get rid of the “unallocated space” entity, but is a lot of potentially wasted work: + https://gitlab.com/freepascal.org/fpc/source/-/issues/40447. + + Values are multiples of the chunk size instead of counts (could be chunksUsed, chunksFormatted, chunksMax) to save on multiplications. + Moreover, instead of “maxSize” from the explanation above, fullThreshold is used, which is such a value that the chunk is full if usedSize >= fullThreshold. + maxSize = RoundUp(fullThreshold, chunk size). + Reason is, calculating fullThreshold does not require division. } + + firstFreeChunk: pFreeChunk; + usedSize, formattedSize, fullThreshold: uint32; + end; + + pVarOSChunk = ^VarOSChunk; + VarOSChunk = object(OSChunk) + end; + + pVarHeader = ^VarHeader; + VarHeader = record + prevSize: SizeUint; { Always 0 for the first chunk. } + {$ifdef FPC_HAS_FEATURE_THREADING} + threadState: pThreadState; + {$endif} + {$if sizeof(SizeUint) > 4} + sizeHi: uint32; + {$endif} + { Assumed to indeed match chunk’s CommonHeader, i.e. that there is no padding after this field. + Otherwise must be accessed as pCommonHeader(pointer(varHdr) + (VarHeaderSize - CommonHeaderSize))^ :D. } + ch: CommonHeader; + end; + + { Reuses the payload of variable chunks whose ch.h and UsedFlag = 0, so variable chunk payload must always fit its size. } + pFreeVarChunk = ^FreeVarChunk; + FreeVarChunk = record + prev, next: pFreeVarChunk; + size: SizeUint; { Cached size for easier access when working with free chunks, always equals to header.sizeHi shl 32 or header.ch.h and VarSizeMask. } + end; + + ThreadState = object + fullOS: pFixedOSChunk; { Completely filled fixed OS chunks. } + freeOS: FreeOSChunkList; { Completely empty OS chunks. } + {$ifdef FPC_HAS_FEATURE_THREADING} + toFree: pFreeChunk; { Free requests from other threads, atomic. } + {$endif} + + used, maxUsed, allocated, maxAllocated: SizeUint; { Statistics. } + + varOS: pVarOSChunk; + varFree: pFreeVarChunk; + + { OS chunks with at least 1 free chunk (including unformatted space), but not completely empty. + OS chunks that become completely empty are moved to freeOS, completely full are moved to fullOS. } + fixedPartialOS: array[0 .. FixedSizesCount - 1] of pFixedOSChunk; + + { Only to calculate preferable new fixed OS chunk sizes... + (Updated infrequently, as opposed to possible “fixedUsed”. When a new fixed OS chunk is required, all existing chunks of its size are full.) } + allocatedByFullFixed: array[0 .. FixedSizesCount - 1] of SizeUint; + + {$ifdef DEBUG_HEAP_INC} + procedure Dump(var f: text); + {$endif} + + function AllocFixed(size: SizeUint): pointer; + function FreeFixed(p: pointer): SizeUint; + + function GetOSChunk(minSize, maxSize: SizeUint; sizeIndex: SizeInt): pOSChunk; + function AllocateOSChunk(minSize: SizeUint; sizeIndex: SizeInt): pOSChunk; + + function AllocVar(size: SizeUint): pointer; + function FreeVar(p: pointer): SizeUint; + function TryResizeVar(p: pointer; size: SizeUint): pointer; + {$ifdef HAS_SYSOSREALLOC} + function TrySysOSRealloc(p: pointer; oldSize, newSize: SizeUint): pointer; + {$endif} + + {$ifdef FPC_HAS_FEATURE_THREADING} + procedure PushToFree(p: pFreeChunk); + procedure FlushToFree; + + procedure Orphan; { Must be performed under gs.lock. } + class procedure Orphan(list: pFixedOSChunk); static; + procedure Adopt(osChunk: pFixedOSChunk); { Must be performed under gs.lock. } + procedure AdoptVarOwner(p: pointer); { Adopts the OS chunk that contains p. Must be performed under gs.lock. } + + class function ChangeThreadStates(list: pOSChunk; ts: pThreadState): pOSChunk; static; { Returns the last item of the list. } + class procedure ChangeThreadState(vOs: pVarOSChunk; ts: pThreadState); static; + + {$ifndef FPC_SECTION_THREADVARS} + procedure FixupSelfPtr; + {$endif ndef FPC_SECTION_THREADVARS} + {$endif FPC_HAS_FEATURE_THREADING} + end; + + {$ifdef FPC_HAS_FEATURE_THREADING} + GlobalState = record + lock: TRTLCriticalSection; + lockUse: int32; + + { Data from dead threads (“orphaned”), protected by gs.lock. } + fixedOS: pFixedOSChunk; + freeOS: FreeOSChunkList; + varOS: pVarOSChunk; + end; + {$endif FPC_HAS_FEATURE_THREADING} + +{$ifdef FPC_HAS_FEATURE_THREADING} + class var + gs: GlobalState; + class threadvar + thisTs: ThreadState; +{$else FPC_HAS_FEATURE_THREADING} + class var + thisTs: ThreadState; +{$endif FPC_HAS_FEATURE_THREADING} + + const + CommonHeaderSize = sizeof(CommonHeader); + {$if MinFixedHeaderAndPayload < CommonHeaderSize + sizeof(FreeChunk)} {$error MinFixedHeaderAndPayload does not fit CommonHeader + FreeChunk.} {$endif} + FixedOSChunkDataOffset = (sizeof(FixedOSChunk) + CommonHeaderSize + Alignment - 1) and -Alignment - CommonHeaderSize; + VarHeaderSize = sizeof(VarHeader); + VarOSChunkDataOffset = (sizeof(VarOSChunk) + VarHeaderSize + Alignment - 1) and -Alignment - VarHeaderSize; + MaxVarPayload = High(SizeUint) - (VarOSChunkDataOffset + VarHeaderSize + OSChunkVarSizeQuant); { Absolute limit on chunk sizes. } + end; + + class function HeapInc.SizeMinus1ToIndex(sizeMinus1: SizeUint): SizeUint; + begin + result := SizeMinus1Div16ToIndex[sizeMinus1 div 16]; + end; + + class function HeapInc.IndexToSize(sizeIndex: SizeUint): SizeUint; + begin + result := FixedSizes[sizeIndex]; + end; + + procedure HeapInc.OSChunk.MoveTo(var src, dest: pOSChunk); + var + osNext, osPrev: pOSChunk; + begin + osPrev := prev; + osNext := next; + if Assigned(osPrev) then + osPrev^.next := osNext + else + src := osNext; + if Assigned(osNext) then + osNext^.prev := osPrev; + prev := nil; + osNext := dest; + next := osNext; + if Assigned(osNext) then + osNext^.prev := @self; + dest := @self; + end; + + function HeapInc.FreeOSChunkList.Get(minSize, maxSize: SizeUint): pOSChunk; + var + prev, next: pFreeOSChunk; + begin + result := first; + while Assigned(result) and not ((result^.size >= minSize) and (result^.size <= maxSize)) do + result := result^.next; + if not Assigned(result) then + exit; + + prev := result^.prev; + next := result^.next; + if Assigned(prev) then + prev^.next := next + else + first := next; + if Assigned(next) then + next^.prev := prev + else + last := prev; + {$ifdef HAS_SYSOSFREE} dec(n); {$endif} + end; + +{$ifdef HAS_SYSOSFREE} + function HeapInc.FreeOSChunkList.FreeOne: SizeUint; + var + best, prev: pFreeOSChunk; + begin + { Presently: the last one (which means LRU, as they are pushed to the beginning). } + best := last; + prev := best^.prev; + if Assigned(prev) then + prev^.next := nil + else + first := nil; + last := prev; + dec(n); + result := best^.size; + SysOSFree(best, best^.size); + end; + + procedure HeapInc.FreeOSChunkList.FreeAll; + var + cur, next: pFreeOSChunk; + begin + cur := first; + first := nil; + last := nil; + n := 0; + while Assigned(cur) do + begin + next := cur^.next; + SysOSFree(cur, cur^.size); + cur := next; + end; + end; +{$endif HAS_SYSOSFREE} + +{$ifdef DEBUG_HEAP_INC} + procedure HeapInc.ThreadState.Dump(var f: text); + var + i: SizeInt; + fix: pFixedOSChunk; + fr: pFreeOSChunk; + {$ifdef FPC_HAS_FEATURE_THREADING} + tf: pFreeChunk; + {$endif} + vf: pFreeVarChunk; + vOs: pVarOSChunk; + p: pointer; + begin + writeln(f, 'used = ', used, ', allocated = ', allocated, ', maxUsed = ', maxUsed, ', maxAllocated = ', maxAllocated); + fix := fullOS; + if Assigned(fix) then + begin + writeln(f); + repeat + writeln(f, 'Full fixed: size = ', fix^.size, ', usedSize = ', fix^.usedSize, ', formattedSize = ', fix^.formattedSize, ', fullThreshold = ', fix^.fullThreshold); + fix := fix^.next; + until not Assigned(fix); + end; + for i := 0 to FixedSizesCount - 1 do + if Assigned(fixedPartialOS[i]) then + begin + write(f, 'Size #', i, ' (', IndexToSize(i), ')'); + if allocatedByFullFixed[i] <> 0 then + write(f, ': allocatedByFullFixed = ', allocatedByFullFixed[i]); + writeln(f); + fix := fixedPartialOS[i]; + while Assigned(fix) do + begin + writeln(f, 'size = ', fix^.size, ', usedSize = ', fix^.usedSize, ', formattedSize = ', fix^.formattedSize, ', fullThreshold = ', fix^.fullThreshold); + fix := fix^.next; + end; + end; + vOs := varOS; + while Assigned(vOs) do + begin + writeln(f, LineEnding, 'Var OS chunk, size ', vOs^.size); + p := pointer(vOs) + (VarOSChunkDataOffset + VarHeaderSize); + repeat + write(f, HexStr(p), ': ', + 'prevSize = ', pVarHeader(p - VarHeaderSize)^.prevSize, ', size = ', + {$if sizeof(SizeUint) > 4} SizeUint(pVarHeader(p - VarHeaderSize)^.sizeHi) shl 32 or {$endif} pVarHeader(p - VarHeaderSize)^.ch.h and VarSizeMask); + if pVarHeader(p - VarHeaderSize)^.ch.h and UsedFlag <> 0 then + write(f, ', used') + else + write(f, ', f r e e'); + if pVarHeader(p - VarHeaderSize)^.ch.h and FirstFlag <> 0 then + write(f, ', first'); + if pVarHeader(p - VarHeaderSize)^.ch.h and LastFlag <> 0 then + write(f, ', last'); + writeln(f); + if pVarHeader(p - VarHeaderSize)^.ch.h and LastFlag <> 0 then + break; + p := p + ({$if sizeof(SizeUint) > 4} SizeUint(pVarHeader(p - VarHeaderSize)^.sizeHi) shl 32 or {$endif} pVarHeader(p - VarHeaderSize)^.ch.h and uint32(VarSizeMask)); + until false; + vOs := vOs^.next; + end; + fr := freeOS.first; + if Assigned(fr) then + begin + writeln(f); + repeat + writeln(f, 'Free OS: ', HexStr(fr), ', size = ', fr^.size); + fr := fr^.next; + until not Assigned(fr); + end; + vf := varFree; + if Assigned(vf) then + begin + write(f, LineEnding, 'Var free:'); + repeat + write(f, ' ', vf^.size); + vf := vf^.next; + until not Assigned(vf); + writeln(f); + end; + {$ifdef FPC_HAS_FEATURE_THREADING} + tf := toFree; + if Assigned(tf) then + begin + write(f, LineEnding, 'To-free:'); + repeat + if pCommonHeader(pointer(tf) - CommonHeaderSize)^.h and FixedFlag <> 0 then + write(f, ' f ', CommonHeaderSize + SysMemSize(tf)) + else + write(f, ' v ', VarHeaderSize + SysMemSize(tf)); + tf := tf^.next; + until not Assigned(tf); + writeln(f); + end; + {$endif FPC_HAS_FEATURE_THREADING} + end; +{$endif DEBUG_HEAP_INC} + + function HeapInc.ThreadState.AllocFixed(size: SizeUint): pointer; + var + sizeIndex: SizeUint; + osChunk, osNext: pFixedOSChunk; + begin + sizeIndex := SizeMinus1ToIndex(size + (CommonHeaderSize - 1)); + + osChunk := fixedPartialOS[sizeIndex]; + if not Assigned(osChunk) then + begin + {$ifdef FPC_HAS_FEATURE_THREADING} + if Assigned(toFree) then + begin + FlushToFree; + osChunk := fixedPartialOS[sizeIndex]; + end; + if not Assigned(osChunk) then + {$endif FPC_HAS_FEATURE_THREADING} + begin + osChunk := pFixedOSChunk(GetOSChunk(FixedOSChunkDataOffset + MaxFixedHeaderAndPayload, MaxFixedChunkSize, sizeIndex)); + if not Assigned(osChunk) then + exit(nil); + if SizeUint(osChunk^.sizeIndex) = sizeIndex then + { Lucky! Just don’t reset the chunk and use its old freelist. } + else + begin + osChunk^.sizeIndex := sizeIndex; + osChunk^.firstFreeChunk := nil; + osChunk^.usedSize := 0; + osChunk^.formattedSize := 0; + osChunk^.fullThreshold := osChunk^.size - IndexToSize(sizeIndex) - (FixedOSChunkDataOffset - 1); { available OS chunk space - chunk size + 1. } + end; + + { Add osChunk to fixedPartialOS[sizeIndex]. } + osNext := fixedPartialOS[sizeIndex]; + osChunk^.prev := nil; + osChunk^.next := osNext; + if Assigned(osNext) then + osNext^.prev := osChunk; + fixedPartialOS[sizeIndex] := osChunk; + end; + end; + + size := IndexToSize(sizeIndex); + inc(used, size); + if used > maxUsed then + maxUsed := used; + + { osChunk from the fixedPartialOS list has either free chunk or free unformatted space for a new chunk. } + result := osChunk^.firstFreeChunk; + if Assigned(result) then + osChunk^.firstFreeChunk := pFreeChunk(result)^.next + else + begin + result := pointer(osChunk) + (FixedOSChunkDataOffset + CommonHeaderSize) + osChunk^.formattedSize; + pCommonHeader(result - CommonHeadersize)^.h := sizeIndex + osChunk^.formattedSize shl ChunkOffsetShift + + (FixedFlag + (FixedOSChunkDataOffset + CommonHeaderSize) shl ChunkOffsetShift); { ← const } + inc(osChunk^.formattedSize, size); + end; + inc(osChunk^.usedSize, size); + if osChunk^.usedSize >= osChunk^.fullThreshold then + begin + inc(allocatedByFullFixed[sizeIndex], osChunk^.size); + { Remove osChunk from fixedPartialOS[sizeIndex], add to fullOS. } + osNext := osChunk^.next; + fixedPartialOS[sizeIndex] := osNext; + if Assigned(osNext) then + osNext^.prev := nil; + osNext := fullOS; + osChunk^.next := osNext; { osChunk^.prev is already nil because osChunk was the first item of fixedPartialOS[sizeIndex]. } + if Assigned(osNext) then + osNext^.prev := osChunk; + fullOS := osChunk; + end; + end; + + function HeapInc.ThreadState.FreeFixed(p: pointer): SizeUint; + var + sizeIndex, usedSize: SizeUint; + osChunk, osPrev, osNext: pFixedOSChunk; + freeOsNext: pFreeOSChunk; + {$ifdef FPC_HAS_FEATURE_THREADING} + chunkTs: pThreadState; + {$endif} + begin + osChunk := p - pCommonHeader(p - CommonHeaderSize)^.h shr ChunkOffsetShift; + + {$ifdef FPC_HAS_FEATURE_THREADING} + { This can be checked without blocking; osChunk^.threadState can only change from one value not equal to @self to another value not equal to @self. } + if osChunk^.threadState <> @self then + begin + EnterCriticalSection(gs.lock); + chunkTs := osChunk^.threadState; + if Assigned(chunkTs) then + begin + { Despite atomic Push lock must be held as otherwise target thread might end and destroy chunkTs. + However, target thread won’t block to free p, so PushToFree instantly invalidates p. } + result := IndexToSize(pCommonHeader(p - CommonHeaderSize)^.h and SizeIndexMask) - CommonHeaderSize; + chunkTs^.PushToFree(p); + LeaveCriticalSection(gs.lock); + exit; + end; + Adopt(osChunk); { ...And continue! } + LeaveCriticalSection(gs.lock); + end; + {$endif FPC_HAS_FEATURE_THREADING} + + pFreeChunk(p)^.next := osChunk^.firstFreeChunk; + osChunk^.firstFreeChunk := p; + sizeIndex := pCommonHeader(p - CommonHeaderSize)^.h and SizeIndexMask; + result := IndexToSize(sizeIndex); + dec(used, result); + usedSize := osChunk^.usedSize; + if usedSize >= osChunk^.fullThreshold then + begin + dec(allocatedByFullFixed[sizeIndex], osChunk^.size); + + { Remove osChunk from fullOS, add to fixedPartialOS[sizeIndex]. } + osPrev := osChunk^.prev; + osNext := osChunk^.next; + if Assigned(osPrev) then + osPrev^.next := osNext + else + fullOS := osNext; + if Assigned(osNext) then + osNext^.prev := osPrev; + osChunk^.prev := nil; + osNext := fixedPartialOS[sizeIndex]; + osChunk^.next := osNext; + if Assigned(osNext) then + osNext^.prev := osChunk; + fixedPartialOS[sizeIndex] := osChunk; + end; + dec(usedSize, result); + osChunk^.usedSize := usedSize; + if usedSize = 0 then + begin + { Remove osChunk from fixedPartialOS[sizeIndex], add to freeOS. } + osPrev := osChunk^.prev; + osNext := osChunk^.next; + if Assigned(osPrev) then + osPrev^.next := osNext + else + fixedPartialOS[sizeIndex] := osNext; + if Assigned(osNext) then + osNext^.prev := osPrev; + + freeOsNext := freeOS.first; + pFreeOSChunk(osChunk)^.prev := nil; + pFreeOSChunk(osChunk)^.next := freeOsNext; + if Assigned(freeOsNext) then + freeOsNext^.prev := osChunk + else + freeOS.last := pFreeOSChunk(osChunk); + freeOS.first := pFreeOSChunk(osChunk); + {$ifdef HAS_SYSOSFREE} + inc(freeOS.n); + if freeOS.n > MaxKeptOSChunks then + dec(allocated, freeOS.FreeOne); + {$endif} + end; + dec(result, CommonHeaderSize); + end; + + function HeapInc.ThreadState.GetOSChunk(minSize, maxSize: SizeUint; sizeIndex: SizeInt): pOSChunk; + begin + result := freeOS.Get(minSize, maxSize); + if Assigned(result) then + exit; + {$ifdef FPC_HAS_FEATURE_THREADING} + if Assigned(gs.freeOS.first) then { Racing precheck. } + begin + EnterCriticalSection(gs.lock); + result := gs.freeOS.Get(minSize, maxSize); + LeaveCriticalSection(gs.lock); + if Assigned(result) then + begin + result^.threadState := @self; + inc(allocated, result^.size); + if allocated > maxAllocated then + maxAllocated := allocated; + exit; + end; + end; + {$endif FPC_HAS_FEATURE_THREADING} + result := AllocateOSChunk(minSize, sizeIndex); + end; + + function HeapInc.ThreadState.AllocateOSChunk(minSize: SizeUint; sizeIndex: SizeInt): pOSChunk; + var + preferredSize: SizeUint; + begin + if sizeIndex < 0 then + begin + if minSize <= GrowHeapSize1 then { 256K by default. } + preferredSize := GrowHeapSize1 + else if minSize <= GrowHeapSize2 then { 1M by default. } + preferredSize := GrowHeapSize2 + else + preferredSize := (minSize + (OSChunkVarSizeQuant - 1)) and SizeUint(-OSChunkVarSizeQuant); + end else + begin + preferredSize := (allocatedByFullFixed[sizeIndex] div 8 + (OSChunkFixedSizeQuant - 1)) and SizeUint(-OSChunkFixedSizeQuant); { 12.5% of memory allocated by the size. } + if preferredSize < growheapsizesmall then + preferredSize := growheapsizesmall; + if preferredSize > MaxFixedChunkSize then + preferredSize := MaxFixedChunkSize; + end; + result := SysOSAlloc(preferredSize); + if not Assigned(result) and (preferredSize > minSize) then + begin + preferredSize := minSize; + result := SysOSAlloc(preferredSize); + end; + if not Assigned(result) then + if ReturnNilIfGrowHeapFails then + exit + else + HandleError(204); + inc(allocated, preferredSize); + if allocated > maxAllocated then + maxAllocated := allocated; + result^.size := preferredSize; + {$ifdef FPC_HAS_FEATURE_THREADING} + result^.threadState := @self; + {$endif} + result^.sizeIndex := -2; { Neither −1 nor ≥0. } + end; + + function HeapInc.ThreadState.AllocVar(size: SizeUint): pointer; + var + fv, fv2: pFreeVarChunk; + osChunk, osNext: pVarOSChunk; + varPrev, varNext: pFreeVarChunk; + vSize, minSize, maxSize: SizeUint; + {$if MatchEffort >= 0} fv2Size: SizeUint; {$endif} + {$if MatchEffort > 1} triesLeft: uint32; {$endif} + begin + if size > MaxVarPayload then + if ReturnNilIfGrowHeapFails then + exit(nil) + else + HandleError(204); + size := (size + (VarHeaderSize + VarSizeQuant - 1)) and SizeUint(-VarSizeQuant); + + {$ifdef FPC_HAS_FEATURE_THREADING} + if Assigned(toFree) then + FlushToFree; + {$endif} + + { Seach varFree for a chunk that fits size, heuristically strive for smallest. } + fv := varFree; + while Assigned(fv) and (fv^.size < size) do + fv := fv^.next; + {$if MatchEffort <> 0} + if Assigned(fv) and (fv^.size > size) then { Don’t search further if the size is already exact. } + begin + {$if MatchEffort > 1} triesLeft := MatchEffort + 1; {$endif} + fv2 := fv; + repeat + {$if MatchEffort > 1} + dec(triesLeft); + if triesLeft = 0 then + break; + {$endif} + fv2 := fv2^.next; + if not Assigned(fv2) then + break; + fv2Size := fv2^.size; + if (fv2Size < size) or (fv2Size >= fv^.size) then + continue; + fv := fv2; + {$if MatchEffort > 1} + if fv2Size = size then { Check here instead of the loop condition to prevent ‘continue’ from jumping to the check. } + break; + {$endif} + until {$if MatchEffort = 1} true {$else} false {$endif}; + end; + {$endif MatchEffort <> 0} + + if Assigned(fv) then + begin + { Remove fv from varFree. } + varPrev := fv^.prev; + varNext := fv^.next; + if Assigned(varPrev) then + varPrev^.next := varNext + else + varFree := varNext; + if Assigned(varNext) then + varNext^.prev := varPrev; + end else + begin + minSize := VarOSChunkDataOffset + size; + if minSize <= GrowHeapSize1 then + maxSize := GrowHeapSize1 + else if minSize <= GrowHeapSize2 then + maxSize := GrowHeapSize2 + else + maxSize := High(SizeUint); + osChunk := pVarOSChunk(GetOSChunk(minSize, maxSize, -1)); + if not Assigned(osChunk) then + exit(nil); + osChunk^.sizeIndex := -1; + + { Add osChunk to varOS. } + osNext := varOS; + osChunk^.prev := nil; + osChunk^.next := osNext; + if Assigned(osNext) then + osNext^.prev := osChunk; + varOS := osChunk; + + { Format new free var chunk spanning the entire osChunk (but don’t add to varFree, it is expected to be removed). } + fv := pointer(osChunk) + (VarOSChunkDataOffset + VarHeaderSize); + pVarHeader(pointer(fv) - VarHeaderSize)^.prevSize := 0; + {$ifdef FPC_HAS_FEATURE_THREADING} + pVarHeader(pointer(fv) - VarHeaderSize)^.threadState := @self; + {$endif} + vSize := SizeUint(osChunk^.size - VarOSChunkDataOffset) and SizeUint(-VarSizeQuant); + {$if sizeof(SizeUint) > 4} + pVarHeader(pointer(fv) - VarHeaderSize)^.sizeHi := vSize shr 32; + {$endif} + pVarHeader(pointer(fv) - VarHeaderSize)^.ch.h := uint32(vSize) or (FirstFlag or LastFlag); + fv^.size := vSize; + end; + + { Result will be allocated at the beginning of fv; maybe format the remainder and push it back to varFree. } + result := fv; + vSize := fv^.size - size; + if (vSize > MaxFixedHeaderAndPayload) or + { If fv is last in the OS chunk, remainder ≤ MaxFixedHeaderAndPayload is guaranteedly wasted. + If fv is not last, there is a hope that occupied chunk to the right might get freed one day and merge with the remainder. } + (vSize >= MinVarHeaderAndPayload) and (pVarHeader(result - VarHeaderSize)^.ch.h and LastFlag = 0) then + begin + inc(pointer(fv), size); { result = allocated block, fv = remainder. } + pVarHeader(pointer(fv) - VarHeaderSize)^.prevSize := size; + {$ifdef FPC_HAS_FEATURE_THREADING} + pVarHeader(pointer(fv) - VarHeaderSize)^.threadState := @self; + {$endif} + {$if sizeof(SizeUint) > 4} + pVarHeader(pointer(fv) - VarHeaderSize)^.sizeHi := vSize shr 32; + {$endif} + { Remainder is still last in the OS chunk if the original chunk was last. } + pVarHeader(pointer(fv) - VarHeaderSize)^.ch.h := pVarHeader(result - VarHeaderSize)^.ch.h and LastFlag or uint32(vSize); + fv^.size := vSize; + if pVarHeader(result - VarHeaderSize)^.ch.h and LastFlag = 0 then + pVarHeader(pointer(fv) + vSize - VarHeaderSize)^.prevSize := vSize; + + { Add fv to varFree. } + varNext := varFree; + fv^.prev := nil; + fv^.next := varNext; + if Assigned(varNext) then + varNext^.prev := fv; + varFree := fv; + + { Allocated chunk is still first in the OS chunk if the original chunk was first. } + pVarHeader(result - VarHeaderSize)^.ch.h := pVarHeader(result - VarHeaderSize)^.ch.h and FirstFlag or UsedFlag or uint32(size); + end else + begin + { Use the entire chunk. } + size := fv^.size; + pVarHeader(result - VarHeaderSize)^.ch.h := pVarHeader(result - VarHeaderSize)^.ch.h and (FirstFlag or LastFlag) or UsedFlag or uint32(size); + end; + {$if sizeof(SizeUint) > 4} + pVarHeader(result - VarHeaderSize)^.sizeHi := size shr 32; + {$endif} + inc(used, size); + if used > maxUsed then + maxUsed := used; + end; + + function HeapInc.ThreadState.FreeVar(p: pointer): SizeUint; + var + {$ifdef FPC_HAS_FEATURE_THREADING} + chunkTs: pThreadState; + {$endif} + varPrev, varNext: pFreeVarChunk; + p2: pointer; + fSizeFlags: SizeUint; + osChunk, osPrev, osNext: pVarOSChunk; + freeOsNext: pFreeOSChunk; + begin + {$ifdef FPC_HAS_FEATURE_THREADING} + chunkTs := pVarHeader(p - VarHeaderSize)^.threadState; + if chunkTs <> @self then + begin + EnterCriticalSection(gs.lock); + chunkTs := pVarHeader(p - VarHeaderSize)^.threadState; + if Assigned(chunkTs) then + begin + { Despite atomic Push lock must be held as otherwise target thread might end and destroy chunkTs. + However, target thread won’t block to free p, so PushToFree instantly invalidates p. } + result := {$if sizeof(SizeUint) > 4} SizeUint(pVarHeader(p - VarHeaderSize)^.sizeHi) shl 32 or {$endif} pVarHeader(p - VarHeaderSize)^.ch.h and uint32(VarSizeMask) - VarHeaderSize; + chunkTs^.PushToFree(p); + LeaveCriticalSection(gs.lock); + exit; + end; + AdoptVarOwner(p); { ...And continue! } + LeaveCriticalSection(gs.lock); + end; + {$endif FPC_HAS_FEATURE_THREADING} + + fSizeFlags := {$if sizeof(SizeUint) > 4} SizeUint(pVarHeader(p - VarHeaderSize)^.sizeHi) shl 32 or {$endif} pVarHeader(p - VarHeaderSize)^.ch.h; + result := fSizeFlags and VarSizeMask; + dec(used, result); + + { If next/prev are free, remove them from varFree and merge with f — (f)uture (f)ree chunk that starts at p, has fSizeFlags, + and conveniently always inherits prevSize of its final location. } + if fSizeFlags and LastFlag = 0 then + begin + p2 := p + result; + if pVarHeader(p2 - VarHeaderSize)^.ch.h and UsedFlag = 0 then + begin + fSizeFlags := (fSizeFlags + pFreeVarChunk(p2)^.size) or pVarHeader(p2 - VarHeaderSize)^.ch.h and LastFlag; + + { Remove p2 from varFree. } + varPrev := pFreeVarChunk(p2)^.prev; + varNext := pFreeVarChunk(p2)^.next; + if Assigned(varPrev) then + varPrev^.next := varNext + else + varFree := varNext; + if Assigned(varNext) then + varNext^.prev := varPrev; + end; + end; + + if fSizeFlags and FirstFlag = 0 then + begin + p2 := p - pVarHeader(p - VarHeaderSize)^.prevSize; + if pVarHeader(p2 - VarHeaderSize)^.ch.h and UsedFlag = 0 then + begin + p := p2; + fSizeFlags := (fSizeFlags + pFreeVarChunk(p2)^.size) or pVarHeader(p2 - VarHeaderSize)^.ch.h and FirstFlag; + + { Remove p2 from varFree. } + varPrev := pFreeVarChunk(p2)^.prev; + varNext := pFreeVarChunk(p2)^.next; + if Assigned(varPrev) then + varPrev^.next := varNext + else + varFree := varNext; + if Assigned(varNext) then + varNext^.prev := varPrev; + end; + end; + + { Turn p into a free chunk and add it back to varFree... + unless it spans the entire OS chunk, in which case instead move the chunk from varOS to freeOS. } + if fSizeFlags and (FirstFlag or LastFlag) <> FirstFlag or LastFlag then + begin + if fSizeFlags and LastFlag = 0 then + pVarHeader(p + fSizeFlags and VarSizeMask - VarHeaderSize)^.prevSize := fSizeFlags and VarSizeMask; + + {$if sizeof(SizeUint) > 4} + pVarHeader(p - VarHeaderSize)^.sizeHi := fSizeFlags shr 32; + {$endif} + pVarHeader(p - VarHeaderSize)^.ch.h := uint32(fSizeFlags) xor UsedFlag; + pFreeVarChunk(p)^.size := fSizeFlags and VarSizeMask; + + { Add p to varFree. } + varNext := varFree; + pFreeVarChunk(p)^.prev := nil; + pFreeVarChunk(p)^.next := varNext; + if Assigned(varNext) then + varNext^.prev := p; + varFree := p; + end else + begin + osChunk := p - (VarOSChunkDataOffset + VarHeaderSize); + + { Remove osChunk from varOS. } + osPrev := osChunk^.prev; + osNext := osChunk^.next; + if Assigned(osPrev) then + osPrev^.next := osNext + else + varOS := osNext; + if Assigned(osNext) then + osNext^.prev := osPrev; + + { Instantly free if huge. } + {$ifdef HAS_SYSOSFREE} + if osChunk^.size > GrowHeapSize2 then + begin + dec(allocated, osChunk^.size); + SysOSFree(osChunk, osChunk^.size); + end else + {$endif} + begin + { Add to freeOS. } + freeOsNext := freeOS.first; + osChunk^.prev := nil; + osChunk^.next := freeOsNext; + if Assigned(freeOsNext) then + freeOsNext^.prev := osChunk + else + freeOS.last := pFreeOSChunk(osChunk); + freeOS.first := pFreeOSChunk(osChunk); + {$ifdef HAS_SYSOSFREE} + inc(freeOS.n); + if freeOS.n > MaxKeptOSChunks then + dec(allocated, freeOS.FreeOne); + {$endif} + end; + end; + dec(result, VarHeaderSize); + end; + + function HeapInc.ThreadState.TryResizeVar(p: pointer; size: SizeUint): pointer; + var + fp, p2: pointer; + oldpsize, fSizeFlags, growby: SizeUint; + varNext, varPrev: pFreeVarChunk; + begin + if (size < MinVarHeaderAndPayload - VarHeaderSize) or (size > MaxVarPayload) + {$ifdef FPC_HAS_FEATURE_THREADING} + or (pVarHeader(p - VarHeaderSize)^.threadState <> @self) + {$endif} + then + exit(nil); + size := (size + (VarHeaderSize + VarSizeQuant - 1)) and SizeUint(-VarSizeQuant); + result := p; { From now on use result instead of p (saves a register). } + + oldpsize := {$if sizeof(SizeUint) > 4} SizeUint(pVarHeader(result - VarHeaderSize)^.sizeHi) shl 32 or {$endif} pVarHeader(result - VarHeaderSize)^.ch.h and uint32(VarSizeMask); + p2 := result + oldpsize; + { (f)uture (f)ree chunk starting at p + size and having fSizeFlags will be created at the end, must exit before that if not required. } + if size <= oldpsize then + begin + { Shrink. Maybe. } + fSizeFlags := oldpsize - size; + + if pVarHeader(result - VarHeaderSize)^.ch.h and LastFlag <> 0 then + begin + { Has nothing to the right: create free chunk if > MaxFixedHeaderAndPayload, otherwise report success but change nothing. } + if fSizeFlags <= MaxFixedHeaderAndPayload then + exit; + dec(used, fSizeFlags); + fSizeFlags := fSizeFlags or LastFlag; + end + else if pVarHeader(p2 - VarHeaderSize)^.ch.h and UsedFlag <> 0 then + begin + { Has used chunk to the right: create free chunk if ≥ MinVarHeaderAndPayload, following the same logic as in AllocVar. } + if fSizeFlags < MinVarHeaderAndPayload then + exit; + dec(used, fSizeFlags); + end else + begin + dec(used, fSizeFlags); + { Has empty chunk to the right: extend with freed space. } + fSizeFlags := (fSizeFlags + pFreeVarChunk(p2)^.size) or pVarHeader(p2 - VarHeaderSize)^.ch.h and LastFlag; + + { Remove p2 from varFree. } + varPrev := pFreeVarChunk(p2)^.prev; + varNext := pFreeVarChunk(p2)^.next; + if Assigned(varPrev) then + varPrev^.next := varNext + else + varFree := varNext; + if Assigned(varNext) then + varNext^.prev := varPrev; + end; + + { Update p size. } + {$if sizeof(SizeUint) > 4} + pVarHeader(result - VarHeaderSize)^.sizeHi := size shr 32; + {$endif} + pVarHeader(result - VarHeaderSize)^.ch.h := uint32(size) or pVarHeader(result - VarHeaderSize)^.ch.h and (FirstFlag or UsedFlag); + end + { Grow if there is free space. } + else if (pVarHeader(result - VarHeaderSize)^.ch.h and LastFlag = 0) and (pVarHeader(p2 - VarHeaderSize)^.ch.h and UsedFlag = 0) and + (pFreeVarChunk(p2)^.size >= size - oldpsize) then + begin + fSizeFlags := pFreeVarChunk(p2)^.size - (size - oldpsize); + if pVarHeader(p2 - VarHeaderSize)^.ch.h and LastFlag = 0 then + begin + if fSizeFlags <= MaxFixedHeaderAndPayload then + fSizeFlags := 0; + end else + if fSizeFlags < MinVarHeaderAndPayload then + fSizeFlags := 0 + else + fSizeFlags := fSizeFlags or LastFlag; + + growby := pFreeVarChunk(p2)^.size - fSizeFlags and VarSizeMask; + size := oldpsize + growby; + inc(used, growby); + if used > maxUsed then + maxUsed := used; + + { Remove p2 from varFree. } + varPrev := pFreeVarChunk(p2)^.prev; + varNext := pFreeVarChunk(p2)^.next; + if Assigned(varPrev) then + varPrev^.next := varNext + else + varFree := varNext; + if Assigned(varNext) then + varNext^.prev := varPrev; + + { Update p size. } + {$if sizeof(SizeUint) > 4} + pVarHeader(result - VarHeaderSize)^.sizeHi := size shr 32; + {$endif} + pVarHeader(result - VarHeaderSize)^.ch.h := uint32(size) or pVarHeader(result - VarHeaderSize)^.ch.h and (FirstFlag or UsedFlag); + { No empty chunk? } + if fSizeFlags = 0 then + begin + if pVarHeader(p2 - VarHeaderSize)^.ch.h and LastFlag <> 0 then + pVarHeader(result - VarHeaderSize)^.ch.h := pVarHeader(result - VarHeaderSize)^.ch.h or LastFlag + else + pVarHeader(result + size - VarHeaderSize)^.prevSize := size; + exit; + end; + end + {$ifdef HAS_SYSOSREALLOC} + else if (oldpsize >= 64 * 1024) and { Don’t do SysOSRealloc if the source is under 64 Kb (arbitrary value). } + (pVarHeader(result - VarHeaderSize)^.ch.h and FirstFlag <> 0) and + ((pVarHeader(result - VarHeaderSize)^.ch.h and LastFlag <> 0) or (pVarHeader(p2 - VarHeaderSize)^.ch.h and (LastFlag or UsedFlag) = LastFlag)) then + exit(TrySysOSRealloc(result, oldpsize, size)) + {$endif} + else + exit(nil); + + { Format new free var chunk. } + fp := result + size; + pVarHeader(fp - VarHeaderSize)^.prevSize := size; + {$ifdef FPC_HAS_FEATURE_THREADING} + pVarHeader(fp - VarHeaderSize)^.threadState := @self; + {$endif} + {$if sizeof(SizeUint) > 4} + pVarHeader(fp - VarHeaderSize)^.sizeHi := fSizeFlags shr 32; + {$endif} + pVarHeader(fp - VarHeaderSize)^.ch.h := uint32(fSizeFlags); + pFreeVarChunk(fp)^.size := fSizeFlags and VarSizeMask; + if fSizeFlags and LastFlag = 0 then + pVarHeader(fp + fSizeFlags and VarSizeMask - VarHeaderSize)^.prevSize := fSizeFlags and VarSizeMask; + + { Add fp to varFree. } + varNext := varFree; + pFreeVarChunk(fp)^.prev := nil; + pFreeVarChunk(fp)^.next := varNext; + if Assigned(varNext) then + varNext^.prev := fp; + varFree := fp; + end; + +{$ifdef HAS_SYSOSREALLOC} + function HeapInc.ThreadState.TrySysOSRealloc(p: pointer; oldSize, newSize: SizeUint): pointer; + var + newOSSize: SizeUint; + hasFreeChunkToTheRight: boolean; + vf, varPrev, varNext: pFreeVarChunk; + begin + { Either p is the only chunk or has last empty chunk to the right. } + hasFreeChunkToTheRight := pVarHeader(p - VarHeaderSize)^.ch.h and LastFlag = 0; + + { Don’t do SysOSRealloc if the source chunk is <12.5% (arbitrary value) of the empty chunk to the right. } + if hasFreeChunkToTheRight and (oldSize < pFreeVarChunk(p + oldSize)^.size div 8) then + exit(nil); + + newOSSize := (newSize + (VarOSChunkDataOffset + OSChunkVarSizeQuant - 1)) and SizeUint(-OSChunkVarSizeQuant); + p := SysOSRealloc(p - (VarOSChunkDataOffset + VarHeaderSize), pVarOSChunk(p - (VarOSChunkDataOffset + VarHeaderSize))^.size, newOSSize); + if not Assigned(p) then + exit(nil); + + inc(allocated, newOSSize - pVarOSChunk(p)^.size); + if allocated > maxAllocated then + maxAllocated := allocated; + pVarOSChunk(p)^.size := newOSSize; + { For simplicity, new chunk spans the entire OS chunk. } + newOSSize := (newOSSize - VarOSChunkDataOffset) and SizeUint(-VarSizeQuant); + inc(used, newOSSize - oldSize); + if used > maxUsed then + maxUsed := used; + + { Update p size. } + {$if sizeof(SizeUint) > 4} + pVarHeader(p + VarOSChunkDataOffset)^.sizeHi := newOSSize shr 32; + {$endif} + pVarHeader(p + VarOSChunkDataOffset)^.ch.h := uint32(newOSSize) or (FirstFlag or LastFlag or UsedFlag); + + { Careful! Old pointers into p are invalidated and must be fixed. + There are up to 3 invalidated pointers: OS chunk in varOS, old p itself (p is reused for new OS chunk pointer), maybe empty chunk to the right in varFree. } + if Assigned(pVarOSChunk(p)^.next) then + pVarOSChunk(pVarOSChunk(p)^.next)^.prev := p; + if Assigned(pVarOSChunk(p)^.prev) then + pVarOSChunk(pVarOSChunk(p)^.prev)^.next := p + else + varOS := p; + + result := p + (VarOSChunkDataOffset + VarHeaderSize); + if hasFreeChunkToTheRight then + begin + vf := result + oldSize; + + { Remove vf from varFree. } + varPrev := vf^.prev; + varNext := vf^.next; + if Assigned(varPrev) then + varPrev^.next := varNext + else + varFree := varNext; + if Assigned(varNext) then + varNext^.prev := varPrev; + end; + end; +{$endif HAS_SYSOSREALLOC} + +{$ifdef FPC_HAS_FEATURE_THREADING} + procedure HeapInc.ThreadState.PushToFree(p: pFreeChunk); + var + next: pFreeChunk; + begin + repeat + next := toFree; + p^.next := next; + WriteBarrier; { Write p after p^.next. } + until InterlockedCompareExchange(toFree, p, next) = next; + end; + + procedure HeapInc.ThreadState.FlushToFree; + var + tf, nx: pFreeChunk; + begin + tf := InterlockedExchange(toFree, nil); + while Assigned(tf) do + begin + ReadDependencyBarrier; { Read toFree^.next after toFree. } + nx := tf^.next; + if pCommonHeader(pointer(tf) - CommonHeaderSize)^.h and FixedFlag <> 0 then + FreeFixed(tf) + else + FreeVar(tf); + tf := nx; + end; + end; + + procedure HeapInc.ThreadState.Orphan; + var + sizeIndex: SizeUint; + lastFree, nextFree: pFreeOSChunk; + vOs, nextVOs, lastVOs: pVarOSChunk; + begin + FlushToFree; + Orphan(fullOS); + for sizeIndex := 0 to High(fixedPartialOS) do + Orphan(fixedPartialOS[sizeIndex]); + { Prepend freeOS to gs.freeOS. } + lastFree := freeOS.last; + if Assigned(lastFree) then + begin + nextFree := gs.freeOS.first; + lastFree^.next := nextFree; + if Assigned(nextFree) then + nextFree^.prev := lastFree + else + gs.freeOS.last := lastFree; + gs.freeOS.first := freeOS.first; + {$ifdef HAS_SYSOSFREE} + inc(gs.freeOS.n, freeOS.n); + while gs.freeOS.n > MaxKeptOSChunks do + gs.freeOS.FreeOne; + {$endif} + end; + { Prepend varOS to gs.varOS. } + vOs := varOS; + if Assigned(vOs) then + begin + nextVOs := gs.varOS; + gs.varOS := vOs; + repeat + lastVOs := vOs; + ChangeThreadState(vOs, nil); + vOs := vOs^.next; + until not Assigned(vOs); + lastVOs^.next := nextVOs; + if Assigned(nextVOs) then + nextVOs^.prev := lastVOs; + end; + + { Zeroing is probably required, because Orphan is called from FinalizeHeap which is called from DoneThread which can be called twice, according to this comment from syswin.inc: } + // DoneThread; { Assume everything is idempotent there } + FillChar(self, sizeof(self), 0); + end; + + class procedure HeapInc.ThreadState.Orphan(list: pFixedOSChunk); + var + last, osNext: pFixedOSChunk; + begin + if not Assigned(list) then + exit; + last := pFixedOSChunk(ChangeThreadStates(list, nil)); + { Prepend list to gs.fixedOS. } + osNext := gs.fixedOS; + last^.next := osNext; + if Assigned(osNext) then + osNext^.prev := last; + gs.fixedOS := list; + end; + + procedure HeapInc.ThreadState.Adopt(osChunk: pFixedOSChunk); + var + sizeIndex: SizeUint; + dest: ^pFixedOSChunk; + begin + sizeIndex := pCommonHeader(pointer(osChunk) + FixedOSChunkDataOffset)^.h and SizeIndexMask; + inc(used, osChunk^.usedSize); + if used > maxUsed then + maxUsed := used; + inc(allocated, osChunk^.size); + if allocated > maxAllocated then + maxAllocated := allocated; + + { Remove osChunk from gs.fixedOS, add to fullOS or fixedPartialOS[sizeIndex] as appropriate. } + dest := @fixedPartialOS[sizeIndex]; + if osChunk^.usedSize >= osChunk^.fullThreshold then + begin + inc(allocatedByFullFixed[sizeIndex], osChunk^.size); + dest := @fullOS; + end; + osChunk^.MoveTo(gs.fixedOS, dest^); + + osChunk^.threadState := @self; + end; + + procedure HeapInc.ThreadState.AdoptVarOwner(p: pointer); + var + prevSize, size: SizeUint; + h: uint32; + varFreeHead: pFreeVarChunk; + begin + repeat + prevSize := pVarHeader(p - VarHeaderSize)^.prevSize; + dec(p, prevSize); + until prevSize = 0; + + { Move OS chunk from gs.varOS to varOS. } + pOSChunk(p - (VarOSChunkDataOffset + VarHeaderSize))^.MoveTo(gs.varOS, varOS); + inc(allocated, pOSChunk(p - (VarOSChunkDataOffset + VarHeaderSize))^.size); + if allocated > maxAllocated then + maxAllocated := allocated; + + { Careful: even though VarHeaders have own threadState links, correct threadState in the OS chunk is required, + as the chunk might be orphaned, then adopted with this function, then become free, then be reused as fixed chunk. + GetOSChunk does not set threadState if it takes the chunk from local freeOS, assuming it is already set. } + pOSChunk(p - (VarOSChunkDataOffset + VarHeaderSize))^.threadState := @self; + + varFreeHead := varFree; + repeat + pVarHeader(p - VarHeaderSize)^.threadState := @self; + h := pVarHeader(p - VarHeaderSize)^.ch.h; + size := {$if sizeof(SizeUint) > 4} SizeUint(pVarHeader(p - VarHeaderSize)^.sizeHi) shl 32 or {$endif} h and uint32(VarSizeMask); + if h and UsedFlag = 0 then + begin + { Add free chunk to varFree. } + pFreeVarChunk(p)^.prev := nil; + pFreeVarChunk(p)^.next := varFreeHead; + if Assigned(varFreeHead) then + varFreeHead^.prev := pFreeVarChunk(p); + varFreeHead := p; + end else + inc(used, size); { maxUsed is updated after the loop. } + inc(p, size); + until h and LastFlag <> 0; + varFree := varFreeHead; + if used > maxUsed then + maxUsed := used; + end; + + class function HeapInc.ThreadState.ChangeThreadStates(list: pOSChunk; ts: pThreadState): pOSChunk; static; { Returns the last item of list. } + begin + if not Assigned(list) then + exit(nil); + repeat + list^.threadState := ts; + result := list; + list := list^.next; + until not Assigned(list); + end; + + class procedure HeapInc.ThreadState.ChangeThreadState(vOs: pVarOSChunk; ts: pThreadState); + var + h: uint32; + p: pointer; + begin + vOs^.threadState := ts; { Not really required (for now), but done for symmetry; also see the comment on setting OSChunk.threadState in AdoptVarOwner. } + p := pointer(vOs) + (VarOSChunkDataOffset + VarHeaderSize); + repeat + pVarHeader(p - VarHeaderSize)^.threadState := ts; + h := pVarHeader(p - VarHeaderSize)^.ch.h; + inc(p, {$if sizeof(SizeUint) > 4} SizeUint(pVarHeader(p - VarHeaderSize)^.sizeHi) shl 32 or {$endif} h and uint32(VarSizeMask)); + until h and LastFlag <> 0; + end; + +{$ifndef FPC_SECTION_THREADVARS} + procedure HeapInc.ThreadState.FixupSelfPtr; + var + sizeIndex: SizeUint; + vOs: pVarOSChunk; + begin + ChangeThreadStates(fullOS, @self); + for sizeIndex := 0 to High(fixedPartialOS) do + ChangeThreadStates(fixedPartialOS[sizeIndex], @self); + ChangeThreadStates(freeOS.first, @self); + vOs := varOS; + while Assigned(vOs) do + begin + ChangeThreadState(vOs, @self); + vOs := vOs^.next; + end; + end; +{$endif ndef FPC_SECTION_THREADVARS} +{$endif FPC_HAS_FEATURE_THREADING} function SysGetFPCHeapStatus:TFPCHeapStatus; var - status: pfpcheapstatus; + ts: HeapInc.pThreadState; begin - status := @freelists.internal_status; - status^.CurrHeapFree := status^.CurrHeapSize - status^.CurrHeapUsed; - result := status^; + ts := @HeapInc.thisTs; + result.MaxHeapSize := ts^.maxAllocated; + result.MaxHeapUsed := ts^.maxUsed; + result.CurrHeapSize := ts^.allocated; + result.CurrHeapUsed := ts^.used; + result.CurrHeapFree := result.CurrHeapSize - result.CurrHeapUsed; end; function SysGetHeapStatus :THeapStatus; var - status: pfpcheapstatus; + ts: HeapInc.pThreadState; begin - status := @freelists.internal_status; - status^.CurrHeapFree := status^.CurrHeapSize - status^.CurrHeapUsed; - result.TotalAllocated :=status^.CurrHeapUsed; - result.TotalFree :=status^.CurrHeapFree; - result.TotalAddrSpace :=status^.CurrHeapSize; - result.TotalUncommitted :=0; - result.TotalCommitted :=0; - result.FreeSmall :=0; - result.FreeBig :=0; - result.Unused :=0; - result.Overhead :=0; - result.HeapErrorCode :=0; -end; - - -{$ifdef DUMPBLOCKS} // TODO -procedure DumpBlocks(loc_freelists: pfreelists); -var - s,i,j : ptruint; - hpfixed : pmemchunk_fixed; - hpvar : pmemchunk_var; -begin - { fixed freelist } - for i := 1 to maxblockindex do - begin - hpfixed := loc_freelists^.fixedlists[i]; - j := 0; - while assigned(hpfixed) do - begin - inc(j); - hpfixed := hpfixed^.next_fixed; - end; - writeln('Block ',i*blocksize,': ',j); - end; - { var freelist } - hpvar := loc_freelists^.varlist; - j := 0; - s := 0; - while assigned(hpvar) do - begin - inc(j); - if hpvar^.size>s then - s := hpvar^.size; - hpvar := hpvar^.next_var; - end; - writeln('Variable: ',j,' maxsize: ',s); -end; -{$endif} - - -{***************************************************************************** - Forwards -*****************************************************************************} - -procedure finish_waitfixedlist(loc_freelists: pfreelists); forward; -procedure finish_waitvarlist(loc_freelists: pfreelists); forward; -function try_finish_waitfixedlist(loc_freelists: pfreelists): boolean; forward; -procedure try_finish_waitvarlist(loc_freelists: pfreelists); forward; - -{***************************************************************************** - List adding/removal -*****************************************************************************} - -procedure append_to_list_var(pmc: pmemchunk_var); inline; -var - varlist: ppmemchunk_var; -begin - varlist := @pmc^.freelists^.varlist; - pmc^.prev_var := nil; - pmc^.next_var := varlist^; - if varlist^<>nil then - varlist^^.prev_var := pmc; - varlist^ := pmc; -end; - -{$ifdef HEAP_DEBUG} - -function find_fixed_mc(loc_freelists: pfreelists; chunkindex: ptruint; - pmc: pmemchunk_fixed): boolean; -var - pmc_temp: pmemchunk_fixed; -begin - pmc_temp := loc_freelists^.fixedlists[chunkindex]; - while pmc_temp <> nil do - begin - if pmc_temp = pmc then exit(true); - pmc_temp := pmc_temp^.next_fixed; - end; - result := false; -end; - -{$endif} - -procedure remove_from_list_fixed(pmc: pmemchunk_fixed; fixedlist: ppmemchunk_fixed); inline; -begin - if assigned(pmc^.next_fixed) then - pmc^.next_fixed^.prev_fixed := pmc^.prev_fixed; - if assigned(pmc^.prev_fixed) then - pmc^.prev_fixed^.next_fixed := pmc^.next_fixed - else - fixedlist^ := pmc^.next_fixed; -end; - -procedure remove_from_list_var(pmc: pmemchunk_var); inline; -begin - if assigned(pmc^.next_var) then - pmc^.next_var^.prev_var := pmc^.prev_var; - if assigned(pmc^.prev_var) then - pmc^.prev_var^.next_var := pmc^.next_var - else - pmc^.freelists^.varlist := pmc^.next_var; -end; - -procedure remove_freed_fixed_chunks(poc: poschunk); - { remove all fixed chunks from the fixed free list, as this os chunk - is going to be used for other purpose } -var - pmc, pmc_end: pmemchunk_fixed; - fixedlist: ppmemchunk_fixed; - chunksize: ptruint; -begin - { exit if this is a var size os chunk, function only applicable to fixed size } - if poc^.used < 0 then - exit; - pmc := pmemchunk_fixed(pointer(poc)+fixedfirstoffset); - chunksize := pmc^.size and fixedsizemask; - pmc_end := pmemchunk_fixed(pointer(poc)+(poc^.size and sizemask)-chunksize); - fixedlist := @poc^.freelists^.fixedlists[chunksize shr blockshift]; - repeat - remove_from_list_fixed(pmc, fixedlist); - pmc := pointer(pmc)+chunksize; - until pmc > pmc_end; -end; - -procedure free_oschunk(loc_freelists: pfreelists; poc: poschunk); -var - pocsize: ptruint; -begin - remove_freed_fixed_chunks(poc); - if assigned(poc^.prev_any) then - poc^.prev_any^.next_any := poc^.next_any - else - loc_freelists^.oslist_all := poc^.next_any; - if assigned(poc^.next_any) then - poc^.next_any^.prev_any := poc^.prev_any; - if poc^.used >= 0 then - dec(loc_freelists^.fixedallocated); - pocsize := poc^.size and sizemask; - dec(loc_freelists^.internal_status.currheapsize, pocsize); - SysOSFree(poc, pocsize); -end; - -procedure append_to_oslist(poc: poschunk); -var - loc_freelists: pfreelists; -begin - loc_freelists := poc^.freelists; - { check if already on list } - if (poc^.size and ocrecycleflag) <> 0 then - begin - inc(loc_freelists^.oscount); - poc^.size := poc^.size and not ocrecycleflag; - exit; - end; - { decide whether to free block or add to list } -{$ifdef HAS_SYSOSFREE} - if (loc_freelists^.oscount >= MaxKeptOSChunks) or - ((poc^.size and sizemask) > growheapsize2) then - begin - free_oschunk(loc_freelists, poc); - end - else - begin -{$endif} - poc^.next_free := loc_freelists^.oslist; - loc_freelists^.oslist := poc; - inc(loc_freelists^.oscount); -{$ifdef HAS_SYSOSFREE} - end; -{$endif} -end; - -procedure append_to_oslist_var(pmc: pmemchunk_var); -var - poc: poschunk; -begin - // block eligable for freeing - poc := pointer(pmc)-varfirstoffset; - remove_from_list_var(pmc); - append_to_oslist(poc); -end; - -procedure modify_oschunk_freelists(poc: poschunk; new_freelists: pfreelists); -var - pmcv: pmemchunk_var; -begin - poc^.freelists := new_freelists; - { only if oschunk contains var memchunks, we need additional assignments } - if poc^.used <> -1 then exit; - pmcv := pmemchunk_var(pointer(poc)+varfirstoffset); - repeat - pmcv^.freelists := new_freelists; - if (pmcv^.size and lastblockflag) <> 0 then - break; - pmcv := pmemchunk_var(pointer(pmcv)+(pmcv^.size and sizemask)); - until false; -end; - -function modify_freelists(loc_freelists, new_freelists: pfreelists): poschunk; -var - poc: poschunk; -begin - poc := loc_freelists^.oslist_all; - if assigned(poc) then - begin - repeat - { fixed and var freelist for orphaned freelists do not need maintenance } - { we assume the heap is not severely fragmented at thread exit } - modify_oschunk_freelists(poc, new_freelists); - if not assigned(poc^.next_any) then - exit(poc); - poc := poc^.next_any; - until false; - end; - modify_freelists := nil; -end; - -{***************************************************************************** - Split block -*****************************************************************************} - -function split_block(pcurr: pmemchunk_var; size: ptruint): ptruint; -var - pcurr_tmp : pmemchunk_var; - size_flags, oldsize, sizeleft: ptruint; -begin - size_flags := pcurr^.size; - oldsize := size_flags and sizemask; - sizeleft := oldsize-size; - if sizeleft>=sizeof(tmemchunk_var) then - begin - pcurr_tmp := pmemchunk_var(pointer(pcurr)+size); - { update prevsize of block to the right } - if (size_flags and lastblockflag) = 0 then - pmemchunk_var(pointer(pcurr)+oldsize)^.prevsize := sizeleft; - { inherit the lastblockflag } - pcurr_tmp^.size := sizeleft or (size_flags and lastblockflag); - pcurr_tmp^.prevsize := size; - pcurr_tmp^.freelists := pcurr^.freelists; - { the block we return is not the last one anymore (there's now a block after it) } - { decrease size of block to new size } - pcurr^.size := size or (size_flags and (not sizemask and not lastblockflag)); - { insert the block in the freelist } - append_to_list_var(pcurr_tmp); - result := size; - end - else - result := oldsize; -end; - - -{***************************************************************************** - Try concat freerecords -*****************************************************************************} - -procedure concat_two_blocks(mc_left, mc_right: pmemchunk_var); -var - mc_tmp : pmemchunk_var; - size_right : ptruint; -begin - // mc_right can't be a fixed size block - if mc_right^.size and fixedsizeflag<>0 then - HandleError(204); - // left block free, concat with right-block - size_right := mc_right^.size and sizemask; - inc(mc_left^.size, size_right); - // if right-block was last block, copy flag - if (mc_right^.size and lastblockflag) <> 0 then - begin - mc_left^.size := mc_left^.size or lastblockflag; - end - else - begin - // there is a block to the right of the right-block, adjust it's prevsize - mc_tmp := pmemchunk_var(pointer(mc_right)+size_right); - mc_tmp^.prevsize := mc_left^.size and sizemask; - end; - // remove right-block from doubly linked list - remove_from_list_var(mc_right); -end; - -function try_concat_free_chunk_forward(mc: pmemchunk_var): boolean; -var - mc_tmp : pmemchunk_var; -begin - { try concat forward } - result := false; - if (mc^.size and lastblockflag) = 0 then - begin - mc_tmp := pmemchunk_var(pointer(mc)+(mc^.size and sizemask)); - if (mc_tmp^.size and usedflag) = 0 then - begin - // next block free: concat - concat_two_blocks(mc, mc_tmp); - result := true; - end; - end; -end; - -function try_concat_free_chunk(mc: pmemchunk_var): pmemchunk_var; -var - mc_tmp : pmemchunk_var; -begin - try_concat_free_chunk_forward(mc); - - { try concat backward } - if (mc^.size and firstblockflag) = 0 then - begin - mc_tmp := pmemchunk_var(pointer(mc)-mc^.prevsize); - if (mc_tmp^.size and usedflag) = 0 then - begin - // prior block free: concat - concat_two_blocks(mc_tmp, mc); - mc := mc_tmp; - end; - end; - - result := mc; -end; - - -{***************************************************************************** - Grow Heap -*****************************************************************************} - -function find_free_oschunk(loc_freelists: pfreelists; - minsize, maxsize: ptruint; var size: ptruint): poschunk; -var - prev_poc, poc: poschunk; - pocsize: ptruint; -begin - poc := loc_freelists^.oslist; - prev_poc := nil; - while poc <> nil do - begin - if (poc^.size and ocrecycleflag) <> 0 then - begin - { oops! we recycled this chunk; remove it from list } - poc^.size := poc^.size and not ocrecycleflag; - poc := poc^.next_free; - if prev_poc = nil then - loc_freelists^.oslist := poc - else - prev_poc^.next_free := poc; - continue; - end; - pocsize := poc^.size and sizemask; - if (pocsize >= minsize) and - (pocsize <= maxsize) then - begin - size := pocsize; - if prev_poc = nil then - loc_freelists^.oslist := poc^.next_free - else - prev_poc^.next_free := poc^.next_free; - dec(loc_freelists^.oscount); - remove_freed_fixed_chunks(poc); - break; - end; - prev_poc := poc; - poc := poc^.next_free; - end; - result := poc; -end; - -function alloc_oschunk(loc_freelists: pfreelists; chunkindex, size: ptruint): pointer; -var - pmc, - pmc_next : pmemchunk_fixed; - pmcv : pmemchunk_var; - poc : poschunk; - minsize, - maxsize, - i : ptruint; - chunksize : ptruint; - status : pfpcheapstatus; -begin - { increase size by size needed for os block header } - minsize := size + varfirstoffset; - { for fixed size chunks we keep offset from os chunk to mem chunk in - upper bits, so maximum os chunk size is 64K on 32bit for fixed size } - if chunkindex<>0 then - maxsize := 1 shl (32-fixedoffsetshift) - else - maxsize := high(ptruint); - poc:=nil; - { blocks available in freelist? } - { do not reformat fixed size chunks too quickly } - if loc_freelists^.oscount >= MaxKeptOSChunks then - poc := find_free_oschunk(loc_freelists, minsize, maxsize, size); - { if none available, try to recycle orphaned os chunks } - if not assigned(poc) and (assigned(orphaned_freelists.waitfixed) - or assigned(orphaned_freelists.waitvar) or (orphaned_freelists.oscount > 0)) then - begin -{$ifdef FPC_HAS_FEATURE_THREADING} - EnterCriticalSection(heap_lock); -{$endif} - finish_waitfixedlist(@orphaned_freelists); - finish_waitvarlist(@orphaned_freelists); - if orphaned_freelists.oscount > 0 then - begin - { blocks available in orphaned freelist ? } - poc := find_free_oschunk(@orphaned_freelists, minsize, maxsize, size); - if assigned(poc) then - begin - { adopt this os chunk } - poc^.freelists := loc_freelists; - if assigned(poc^.prev_any) then - poc^.prev_any^.next_any := poc^.next_any - else - orphaned_freelists.oslist_all := poc^.next_any; - if assigned(poc^.next_any) then - poc^.next_any^.prev_any := poc^.prev_any; - poc^.next_any := loc_freelists^.oslist_all; - if assigned(loc_freelists^.oslist_all) then - loc_freelists^.oslist_all^.prev_any := poc; - poc^.prev_any := nil; - loc_freelists^.oslist_all := poc; - end; - end; -{$ifdef FPC_HAS_FEATURE_THREADING} - LeaveCriticalSection(heap_lock); -{$endif} - end; - if poc = nil then - begin -{$ifdef DUMPGROW} - writeln('growheap(',size,') allocating ',(size+sizeof(toschunk)+$ffff) and not $ffff); - DumpBlocks(loc_freelists); -{$endif} - { allocate by 64K size } - size := (size+varfirstoffset+$ffff) and not $ffff; - { allocate smaller blocks for fixed-size chunks } - if chunkindex<>0 then - begin - poc := SysOSAlloc(loc_freelists^.LocGrowHeapSizeSmall); - if poc<>nil then - size := loc_freelists^.LocGrowHeapSizeSmall; - end - { first try 256K (default) } - else if size<=GrowHeapSize1 then - begin - poc := SysOSAlloc(GrowHeapSize1); - if poc<>nil then - size := GrowHeapSize1; - end - { second try 1024K (default) } - else if size<=GrowHeapSize2 then - begin - poc := SysOSAlloc(GrowHeapSize2); - if poc<>nil then - size := GrowHeapSize2; - end - { else allocate the needed bytes } - else - poc := SysOSAlloc(size); - { try again } - if poc=nil then - begin - poc := SysOSAlloc(size); - if poc=nil then - begin - if ReturnNilIfGrowHeapFails then - begin - result := nil; - exit - end - else - HandleError(203); - end; - end; - poc^.freelists := loc_freelists; - poc^.prev_any := nil; - poc^.next_any := loc_freelists^.oslist_all; - if assigned(loc_freelists^.oslist_all) then - loc_freelists^.oslist_all^.prev_any := poc; - loc_freelists^.oslist_all := poc; - { set the total new heap size } - status := @loc_freelists^.internal_status; - inc(status^.currheapsize, size); - if status^.currheapsize > status^.maxheapsize then - status^.maxheapsize := status^.currheapsize; - end; - { initialize os-block } - poc^.size := size; - if chunkindex<>0 then - begin - poc^.used := 0; - { chop os chunk in fixedsize parts, - maximum of $ffff elements are allowed, otherwise - there will be an overflow } - chunksize := chunkindex shl blockshift; - if ptruint(size-chunksize)>maxsize then - HandleError(204); - { we need to align the user pointers to 8 byte at least for - mmx/sse and doubles on sparc, align to 16 bytes } - i := fixedfirstoffset; - result := pointer(poc) + i; - pmc := pmemchunk_fixed(result); - pmc^.prev_fixed := nil; - repeat - pmc^.size := fixedsizeflag or chunksize or (i shl fixedoffsetshift); - inc(i, chunksize); - if i > ptruint(size - chunksize) then break; - pmc_next := pmemchunk_fixed(pointer(pmc)+chunksize); - pmc^.next_fixed := pmc_next; - pmc_next^.prev_fixed := pmc; - pmc := pmc_next; - until false; - pmc_next := loc_freelists^.fixedlists[chunkindex]; - pmc^.next_fixed := pmc_next; - if pmc_next<>nil then - pmc_next^.prev_fixed := pmc; - loc_freelists^.fixedlists[chunkindex] := pmemchunk_fixed(result); - { check whether we should increase the size of the fixed freelist blocks } - inc(loc_freelists^.fixedallocated); - if loc_freelists^.fixedallocated > fixedallocthreshold then - begin - if loc_freelists^.locgrowheapsizesmall < maxgrowheapsizesmall then - inc(loc_freelists^.locgrowheapsizesmall, loc_freelists^.locgrowheapsizesmall); - { also set to zero in case we did not grow the blocksize to - prevent oveflows of this counter in case the rtl is compiled - range/overflow checking } - loc_freelists^.fixedallocated := 0; - end; - end - else - begin - poc^.used := -1; - { we need to align the user pointers to 8 byte at least for - mmx/sse and doubles on sparc, align to 16 bytes } - result := pointer(poc)+varfirstoffset; - pmcv := pmemchunk_var(result); - pmcv^.size := (ptruint(size-varfirstoffset) and sizemask) or (firstblockflag or lastblockflag); - pmcv^.prevsize := 0; - pmcv^.freelists := loc_freelists; - append_to_list_var(pmcv); - end; -end; - -{***************************************************************************** - SysGetMem -*****************************************************************************} - -function SysGetMem_Fixed(chunksize: ptruint): pointer; -var - pmc, pmc_next: pmemchunk_fixed; - poc: poschunk; - chunkindex: ptruint; - loc_freelists: pfreelists; -begin - { try to find a block in one of the freelists per size } - chunkindex := chunksize shr blockshift; - loc_freelists := @freelists; - pmc := loc_freelists^.fixedlists[chunkindex]; - { no free blocks ? } - if assigned(pmc) then - begin - { remove oschunk from free list in case we recycle it } - poc := poschunk(pointer(pmc) - (pmc^.size shr fixedoffsetshift)); - if poc^.used = 0 then - begin - poc^.size := poc^.size or ocrecycleflag; - dec(loc_freelists^.oscount); - end; - end - else if try_finish_waitfixedlist(loc_freelists) then - { freed some to-be freed chunks, retry allocation } - exit(SysGetMem_Fixed(chunksize)) - else - begin - pmc := alloc_oschunk(loc_freelists, chunkindex, chunksize); - if not assigned(pmc) then - exit(nil); - poc := poschunk(pointer(pmc)-fixedfirstoffset); - end; - prefetch(poc^.used); - { get a pointer to the block we should return } - result := pointer(pmc)+sizeof(tmemchunk_fixed_hdr); - { update freelist } - pmc_next := pmc^.next_fixed; - loc_freelists^.fixedlists[chunkindex] := pmc_next; - prefetch((pointer(@chunksize)-4)^); - if assigned(pmc_next) then - pmc_next^.prev_fixed := nil; - { statistics } - with loc_freelists^.internal_status do - begin - inc(currheapused, chunksize); - if currheapused > maxheapused then - begin - maxheapused := currheapused; -{$ifdef DUMP_MEM_USAGE} - maxsizeusage := sizeusage; -{$endif} - end; - end; - inc(poc^.used); -end; - -function SysGetMem_Var(size: ptruint): pointer; -var - pcurr : pmemchunk_var; - pbest : pmemchunk_var; - loc_freelists : pfreelists; - iter : cardinal; -begin - result:=nil; - { check for maximum possible allocation (everything is rounded up to the - next multiple of 64k) } - if (size>high(ptruint)-$ffff) then - if ReturnNilIfGrowHeapFails then - exit - else - HandleError(204); - { free pending items } - loc_freelists := @freelists; - try_finish_waitvarlist(loc_freelists); - pbest := nil; - pcurr := loc_freelists^.varlist; - iter := high(iter); - while assigned(pcurr) and (iter>0) do - begin - if (pcurr^.size>=size) then - begin - if not assigned(pbest) or (pcurr^.size maxheapused then - begin - maxheapused := currheapused; -{$ifdef DUMP_MEM_USAGE} - maxsizeusage := sizeusage; -{$endif} - end; - end; -{$ifdef DEBUG_SYSOSREALLOC} - writeln('Allocated block at: $',hexstr(PtrUInt(pcurr),SizeOf(PtrUInt)*2),', size: ',hexstr(PtrUInt(pcurr^.size and sizemask),SizeOf(PtrUInt)*2)); -{$endif DEBUG_SYSOSREALLOC} + FillChar((@result)^, sizeof(result), 0); + ts := @HeapInc.thisTs; + result.TotalAllocated :=ts^.used; + result.TotalFree :=ts^.allocated - ts^.used; + result.TotalAddrSpace :=ts^.allocated; end; function SysGetMem(size : ptruint):pointer; -begin -{ SysGetMem(0) is expected to return something freeable and non-nil. No need in explicit handling, presently. } -{ calc to multiple of 16 after adding the needed bytes for memchunk header } - if size <= (maxblocksize - sizeof(tmemchunk_fixed_hdr)) then - begin - size := (size+(sizeof(tmemchunk_fixed_hdr)+(blocksize-1))) and fixedsizemask; - result := sysgetmem_fixed(size); - end - else - begin - if size < high(ptruint)-((sizeof(tmemchunk_var_hdr)+(blocksize-1))) then - size := (size+(sizeof(tmemchunk_var_hdr)+(blocksize-1))) and sizemask; - result := sysgetmem_var(size); - end; - -{$ifdef DUMP_MEM_USAGE} - size := sysmemsize(result); - if size > sizeusagesize then - inc(sizeusage[sizeusageindex]) - else - inc(sizeusage[size shr sizeusageshift]); -{$endif} -end; - - -{***************************************************************************** - SysFreeMem -*****************************************************************************} - -procedure waitfree_fixed(pmc: pmemchunk_fixed; poc: poschunk); -begin -{$ifdef FPC_HAS_FEATURE_THREADING} - EnterCriticalSection(heap_lock); -{$endif} - pmc^.next_fixed := poc^.freelists^.waitfixed; - poc^.freelists^.waitfixed := pmc; -{$ifdef FPC_HAS_FEATURE_THREADING} - LeaveCriticalSection(heap_lock); -{$endif} -end; - -procedure waitfree_var(pmcv: pmemchunk_var); -begin -{$ifdef FPC_HAS_FEATURE_THREADING} - EnterCriticalSection(heap_lock); -{$endif} - pmcv^.next_var := pmcv^.freelists^.waitvar; - pmcv^.freelists^.waitvar := pmcv; -{$ifdef FPC_HAS_FEATURE_THREADING} - LeaveCriticalSection(heap_lock); -{$endif} -end; - -function SysFreeMem_Fixed(loc_freelists: pfreelists; pmc: pmemchunk_fixed): ptruint; var - chunkindex, - chunksize: ptruint; - poc: poschunk; - pmc_next: pmemchunk_fixed; - pocfreelists: pfreelists; + ts: HeapInc.pThreadState; begin - poc := poschunk(pointer(pmc)-(pmc^.size shr fixedoffsetshift)); - { start memory access to poc^.freelists already } - pocfreelists := poc^.freelists; - chunksize := pmc^.size and fixedsizemask; - if loc_freelists = pocfreelists then - begin - { decrease used blocks count (well in advance of poc^.used check below, - to avoid stalling due to a dependency) } - dec(poc^.used); - - { insert the block in its freelist } - chunkindex := chunksize shr blockshift; - pmc_next := loc_freelists^.fixedlists[chunkindex]; - pmc^.prev_fixed := nil; - pmc^.next_fixed := pmc_next; - if assigned(pmc_next) then - pmc_next^.prev_fixed := pmc; - loc_freelists^.fixedlists[chunkindex] := pmc; - - dec(loc_freelists^.internal_status.currheapused, chunksize); - - if poc^.used <= 0 then - begin - { decrease used blocks count } - if poc^.used<0 then - HandleError(204); - { osblock can be freed? } - append_to_oslist(poc); - end; - end + ts := @HeapInc.thisTs; + if size <= HeapInc.MaxFixedHeaderAndPayload - HeapInc.CommonHeaderSize then + result := ts^.AllocFixed(size) else - begin - { deallocated in wrong thread! add to to-be-freed list of correct thread } - waitfree_fixed(pmc, poc); - end; - result := chunksize-sizeof(tmemchunk_fixed_hdr); + result := ts^.AllocVar(size); end; -function SysFreeMem_Var(loc_freelists: pfreelists; pmcv: pmemchunk_var): ptruint; -var - chunksize: ptruint; -begin - chunksize := pmcv^.size and sizemask; - if loc_freelists = pmcv^.freelists then - begin -{$ifdef DEBUG_SYSOSREALLOC} - writeln('Releasing block at: $',hexstr(PtrUInt(pmcv),SizeOf(PtrUInt)*2)); -{$endif DEBUG_SYSOSREALLOC} - { insert the block in its freelist } - pmcv^.size := pmcv^.size and (not usedflag); - append_to_list_var(pmcv); - pmcv := try_concat_free_chunk(pmcv); - if (pmcv^.size and (firstblockflag or lastblockflag)) = (firstblockflag or lastblockflag) then - append_to_oslist_var(pmcv); - dec(loc_freelists^.internal_status.currheapused, chunksize); - end else - { deallocated in wrong thread! add to to-be-freed list of correct thread } - waitfree_var(pmcv); - result:=chunksize-sizeof(tmemchunk_var_hdr); -end; - - function SysFreeMem(p: pointer): ptruint; var - pmc: pmemchunk_fixed; - loc_freelists: pfreelists; -{$ifdef DUMP_MEM_USAGE} - size: sizeint; -{$endif} + ts: HeapInc.pThreadState; begin - pmc := pmemchunk_fixed(p-sizeof(tmemchunk_fixed_hdr)); - prefetch(pmc^.size); - if p=nil then + result := 0; + if Assigned(p) then begin - result:=0; - exit; + ts := @HeapInc.thisTs; + if HeapInc.pCommonHeader(p - HeapInc.CommonHeaderSize)^.h and HeapInc.FixedFlag <> 0 then + result := ts^.FreeFixed(p) + else + result := ts^.FreeVar(p); end; -{$ifdef DUMP_MEM_USAGE} - size := sysmemsize(p); - if size > sizeusagesize then - dec(sizeusage[sizeusageindex]) - else - dec(sizeusage[size shr sizeusageshift]); -{$endif} - { loc_freelists is a threadvar, so it can be worth it to prefetch } - loc_freelists := @freelists; - prefetch(loc_freelists^.internal_status.currheapused); - { check if this is a fixed- or var-sized chunk } - if (pmc^.size and fixedsizeflag) = 0 then - result := sysfreemem_var(loc_freelists, pmemchunk_var(p-sizeof(tmemchunk_var_hdr))) - else - result := sysfreemem_fixed(loc_freelists, pmc); end; -procedure finish_waitfixedlist(loc_freelists: pfreelists); - { free to-be-freed chunks, return whether we freed anything } +function SysTryResizeMem(var p: pointer; size: ptruint): boolean; var - pmc: pmemchunk_fixed; + ts: HeapInc.pThreadState; + h: uint32; + newp: pointer; begin - while loc_freelists^.waitfixed <> nil do + h := HeapInc.pCommonHeader(p - HeapInc.CommonHeaderSize)^.h; + if h and HeapInc.FixedFlag <> 0 then + { Don’t shrink fixed chunk. } + result := size <= SizeUint(HeapInc.IndexToSize(h and HeapInc.SizeIndexMask) - HeapInc.CommonHeaderSize) + else begin - { keep next_fixed, might be destroyed } - pmc := loc_freelists^.waitfixed; - loc_freelists^.waitfixed := pmc^.next_fixed; - SysFreeMem_Fixed(loc_freelists, pmc); + ts := @HeapInc.thisTs; + {$ifdef FPC_HAS_FEATURE_THREADING} + if Assigned(ts^.toFree) then + ts^.FlushToFree; + {$endif FPC_HAS_FEATURE_THREADING} + newp := ts^.TryResizeVar(p, size); + result := Assigned(newp); + if result then + p := newp; end; end; -function try_finish_waitfixedlist(loc_freelists: pfreelists): boolean; -begin - if loc_freelists^.waitfixed = nil then - exit(false); -{$ifdef FPC_HAS_FEATURE_THREADING} - EnterCriticalSection(heap_lock); -{$endif} - finish_waitfixedlist(loc_freelists); -{$ifdef FPC_HAS_FEATURE_THREADING} - LeaveCriticalSection(heap_lock); -{$endif} - result := true; -end; - -procedure finish_waitvarlist(loc_freelists: pfreelists); - { free to-be-freed chunks, return whether we freed anything } +function SysMemSize(p: pointer): ptruint; var - pmcv: pmemchunk_var; + h: uint32; begin - while loc_freelists^.waitvar <> nil do - begin - { keep next_var, might be destroyed } - pmcv := loc_freelists^.waitvar; - loc_freelists^.waitvar := pmcv^.next_var; - SysFreeMem_Var(loc_freelists, pmcv); - end; + if not Assigned(p) then + exit(0); + h := HeapInc.pCommonHeader(p - HeapInc.CommonHeaderSize)^.h; + if h and HeapInc.FixedFlag <> 0 then + result := HeapInc.IndexToSize(h and HeapInc.SizeIndexMask) - HeapInc.CommonHeaderSize + else + result := {$if sizeof(SizeUint) > 4} SizeUint(HeapInc.pVarHeader(p - HeapInc.VarHeaderSize)^.sizeHi) shl 32 or {$endif} + HeapInc.pVarHeader(p - HeapInc.VarHeaderSize)^.ch.h and uint32(HeapInc.VarSizeMask) + - HeapInc.VarHeaderSize; end; -procedure try_finish_waitvarlist(loc_freelists: pfreelists); +function SysReAllocMem(var p: pointer; size: ptruint):pointer; +var + oldsize, newsize, tocopy: SizeUint; begin - if loc_freelists^.waitvar = nil then - exit; -{$ifdef FPC_HAS_FEATURE_THREADING} - EnterCriticalSection(heap_lock); -{$endif} - finish_waitvarlist(loc_freelists); -{$ifdef FPC_HAS_FEATURE_THREADING} - LeaveCriticalSection(heap_lock); -{$endif} + if size = 0 then + begin + SysFreeMem(p); + result := nil; + p := nil; + end + else if not Assigned(p) then + begin + result := SysGetMem(size); + p := result; + end + else if SysTryResizeMem(p, size) then + result := p + else + begin + oldsize := SysMemSize(p); + newsize := size; + result := SysGetMem(newsize); + if not Assigned(result) then + begin + if size <= oldsize then + { Don’t fail if shrinking. } + result := p; + exit; { If growing failed, return nil, but keep the old p. } + end; + tocopy := oldsize; + if tocopy > newsize then + tocopy := newsize; + Move(p^, result^, tocopy); + SysFreeMem(p); + p := result; + end; end; -{***************************************************************************** - SysFreeMemSize -*****************************************************************************} - Function SysFreeMemSize(p: pointer; size: ptruint):ptruint; begin -// if size=0 then -// exit(0); { can't free partial blocks, ignore size } result := SysFreeMem(p); end; - -{***************************************************************************** - SysMemSize -*****************************************************************************} - -function SysMemSize(p: pointer): ptruint; -begin - if not assigned(p) then - exit(0); - result := pmemchunk_fixed(pointer(p)-sizeof(tmemchunk_fixed_hdr))^.size; - if (result and fixedsizeflag) = 0 then - result := result and sizemask-sizeof(tmemchunk_var_hdr) - else - result := result and fixedsizemask-sizeof(tmemchunk_fixed_hdr); -end; - - -{***************************************************************************** - SysAllocMem -*****************************************************************************} - function SysAllocMem(size: ptruint): pointer; begin result := SysGetMem(size); - if result<>nil then - FillChar(result^,SysMemSize(result),0); -end; - - -{***************************************************************************** - SysResizeMem -*****************************************************************************} - -function SysTryResizeMem(var p: pointer; size: ptruint): boolean; -var - chunksize, - newsize, - oldsize, - currsize : ptruint; - pcurr : pmemchunk_var; - loc_freelists : pfreelists; - poc : poschunk; - pmcv : pmemchunk_var; -begin - SysTryResizeMem := false; - -{$ifdef DEBUG_SYSOSREALLOC} - writeln('Resize block at: $',hexstr(PtrUInt(pcurr),SizeOf(PtrUInt)*2), - ', from: ',hexstr(SysMemSize(p),SizeOf(PtrUInt)*2), - ', to: ',hexstr(size,SizeOf(PtrUInt)*2)); -{$endif DEBUG_SYSOSREALLOC} - { fix p to point to the heaprecord } - chunksize := pmemchunk_fixed(p-sizeof(tmemchunk_fixed_hdr))^.size; - - { handle fixed memchuncks separate. Only allow resizes when the - new size fits in the same block } - if (chunksize and fixedsizeflag) <> 0 then - begin - currsize := chunksize and fixedsizemask; - - { 1. Resizing to smaller sizes will never allocate a new block. We just keep the current block. This - is needed for the expectations that resizing to a small block will not move the contents of - a memory block - 2. For resizing to greater size first check if the size fits in the fixed block range to prevent - "truncating" the size by the fixedsizemask } - if ((size <= (maxblocksize - sizeof(tmemchunk_fixed_hdr))) and - ((size+(sizeof(tmemchunk_fixed_hdr)+(blocksize-1))) and sizemask <= currsize)) then - begin - systryresizemem:=true; - exit; - end; - - { we need to allocate a new fixed or var memchunck } - exit; - end; - - { var memchunk } - - { do not fragment the heap with small shrinked blocks } - { also solves problem with var sized chunks smaller than sizeof(tmemchunk_var) } - if size < maxblocksize div 2 then - exit(false); - - currsize := chunksize and sizemask; - size := (size+sizeof(tmemchunk_var_hdr)+(blocksize-1)) and sizemask; - - { is the allocated block still correct? } - if (currsize>=size) and (size>ptruint(currsize-blocksize)) then - begin - SysTryResizeMem := true; - exit; - end; - - { get pointer to block } - loc_freelists := @freelists; - pcurr := pmemchunk_var(pointer(p)-sizeof(tmemchunk_var_hdr)); - if pcurr^.freelists <> loc_freelists then - exit; - oldsize := currsize; - - { do we need to allocate more memory ? } - if try_concat_free_chunk_forward(pcurr) then - currsize := pcurr^.size and sizemask; - if size>currsize then - begin -{$ifdef FPC_SYSTEM_HAS_SYSOSREALLOC} - { if the os block is only occupied by the memory block which shall be resized, - it can be tried if the OS can reallocate the block. On linux, the OS often does - not need to move the data but it can just remap the memory pages } - if ((pcurr^.size and firstblockflag) <> 0) and ((pcurr^.size and lastblockflag) <> 0) then - begin - newsize:=(size+varfirstoffset+sizeof(tmemchunk_var_hdr)+$ffff) and not $ffff; - poc:=SysOSRealloc(pointer(pcurr)-varfirstoffset,poschunk(pointer(pcurr)-varfirstoffset)^.size,newsize); - if poc<>nil then - begin - with loc_freelists^.internal_status do - begin - inc(currheapsize,newsize-poc^.size); - if currheapsize > maxheapsize then - maxheapsize := currheapsize; - end; -{$ifdef DEBUG_SYSOSREALLOC} - writeln('Block successfully resized by SysOSRealloc to: ',hexstr(qword(poc),sizeof(pointer)*2),' new size: $',hexstr(newsize,sizeof(ptruint)*2)); -{$endif DEBUG_SYSOSREALLOC} - poc^.size:=newsize; - { remove old os block from list, while it is already moved, the data is still the same } - if assigned(poc^.prev_any) then - poc^.prev_any^.next_any := poc^.next_any - else - loc_freelists^.oslist_all := poc^.next_any; - if assigned(poc^.next_any) then - poc^.next_any^.prev_any := poc^.prev_any; - - { insert the block with the new data into oslist_all } - poc^.prev_any := nil; - poc^.next_any := loc_freelists^.oslist_all; - if assigned(loc_freelists^.oslist_all) then - loc_freelists^.oslist_all^.prev_any := poc; - loc_freelists^.oslist_all := poc; - - { setup new block location } - p:=pointer(poc)+varfirstoffset+sizeof(tmemchunk_var_hdr); - - { setup the block data } - pmcv:=pmemchunk_var(p-sizeof(tmemchunk_var_hdr)); - pmcv^.size:=(ptruint(newsize-varfirstoffset) and sizemask) or (firstblockflag or lastblockflag); - pmcv^.prevsize:=0; - - currsize:=size; - - { create the left over freelist block as we rounded up, if at least 16 bytes are free } - size:=split_block(pmcv,size); - - { the block is used } - pmcv^.size:=pmcv^.size or usedflag; - - { TryResizeMem is successful } - SysTryResizeMem:=true; - end; - end; -{$endif FPC_SYSTEM_HAS_SYSOSREALLOC} - { adjust statistics (try_concat_free_chunk_forward may have merged a free - block into the current block, which we will subsequently free (so the - combined size will be freed -> make sure the combined size is marked as - used) } - with loc_freelists^.internal_status do - begin - inc(currheapused, currsize-oldsize); - if currheapused > maxheapused then - maxheapused := currheapused; - end; - { the size is bigger than the previous size, we need to allocate more mem - but we could not concatenate with next block or not big enough } - exit; - end - else - { is the size smaller then we can adjust the block to that size and insert - the other part into the freelist } - if currsize>size then - currsize := split_block(pcurr, size); - - with loc_freelists^.internal_status do - begin - inc(currheapused, currsize-oldsize); - if currheapused > maxheapused then - maxheapused := currheapused; - end; - SysTryResizeMem := true; -end; - - -{***************************************************************************** - SysResizeMem -*****************************************************************************} - -function SysReAllocMem(var p: pointer; size: ptruint):pointer; -var - newsize, - oldsize, - minsize : ptruint; - p2 : pointer; -begin - { Free block? } - if size=0 then - begin - if p<>nil then - begin - SysFreeMem(p); - p := nil; - end; - end - else - { Allocate a new block? } - if p=nil then - begin - p := SysGetMem(size); - end - else - begin - { Resize block } -{$ifdef DUMP_MEM_USAGE} - oldsize:=SysMemSize(p); -{$endif} - if not SysTryResizeMem(p,size) then - begin - oldsize:=SysMemSize(p); - { Grow with bigger steps to prevent the need for - multiple getmem/freemem calls for fixed blocks. It might cost a bit - of extra memory, but in most cases a reallocmem is done multiple times. } - if oldsizenewsize then - newsize:=size; - end - else - newsize:=size; - { calc size of data to move } - minsize:=oldsize; - if newsize < minsize then - minsize := newsize; - p2 := SysGetMem(newsize); - if p2<>nil then - Move(p^,p2^,minsize); - SysFreeMem(p); - p := p2; -{$ifdef DUMP_MEM_USAGE} - end else begin - size := sysmemsize(p); - if size <> oldsize then - begin - if oldsize > sizeusagesize then - dec(sizeusage[sizeusageindex]) - else if oldsize >= 0 then - dec(sizeusage[oldsize shr sizeusageshift]); - if size > sizeusagesize then - inc(sizeusage[sizeusageindex]) - else if size >= 0 then - inc(sizeusage[size shr sizeusageshift]); - end; -{$endif} - end; - end; - SysReAllocMem := p; + if Assigned(result) then + FillChar(result^, SysMemSize(result), 0); end; {$endif FPC_NO_DEFAULT_HEAP} @@ -1575,141 +1699,64 @@ end; the initialization of the system unit } {$ifdef FPC_HAS_FEATURE_THREADING} procedure InitHeapThread; -var - loc_freelists: pfreelists; begin - if heap_lock_use > 0 then - begin - EnterCriticalSection(heap_lock); - inc(heap_lock_use); - LeaveCriticalSection(heap_lock); - end; - loc_freelists := @freelists; - fillchar(loc_freelists^,sizeof(tfreelists),0); - { initialise the local blocksize for allocating oschunks for fixed - freelists with the default starting value } - loc_freelists^.locgrowheapsizesmall:=growheapsizesmall; -{$ifdef DUMP_MEM_USAGE} - fillchar(sizeusage,sizeof(sizeusage),0); - fillchar(maxsizeusage,sizeof(sizeusage),0); -{$endif} + if HeapInc.gs.lockUse>0 then + InterlockedIncrement(HeapInc.gs.lockUse); end; {$endif} procedure InitHeap; public name '_FPC_InitHeap'; -var - loc_freelists: pfreelists; begin -{$ifdef FPC_HAS_FEATURE_THREADING} { we cannot initialize the locks here yet, thread support is not loaded yet } - heap_lock_use := 0; -{$endif} - loc_freelists := @freelists; - fillchar(loc_freelists^,sizeof(tfreelists),0); - { initialise the local blocksize for allocating oschunks for fixed - freelists with the default starting value } - loc_freelists^.locgrowheapsizesmall:=growheapsizesmall; - fillchar(orphaned_freelists,sizeof(orphaned_freelists),0); end; procedure RelocateHeap; -var - loc_freelists: pfreelists; begin - { this function should be called in main thread context } {$ifdef FPC_HAS_FEATURE_THREADING} - if heap_lock_use > 0 then + if HeapInc.gs.lockUse > 0 then exit; - heap_lock_use := 1; - initcriticalsection(heap_lock); -{$endif} - + HeapInc.gs.lockUse := 1; + InitCriticalSection(HeapInc.gs.lock); {$ifndef FPC_SECTION_THREADVARS} - { even if section threadvars are used, this shouldn't cause problems as loc_freelists simply - does not change but we do not need it } - loc_freelists := @freelists; - { loc_freelists still points to main thread's freelists, but they - have a reference to the global main freelists, fix them to point - to the main thread specific variable } - modify_freelists(loc_freelists, loc_freelists); + { threadState pointers still point to main thread's thisTs, but they + have a reference to the global main thisTs, fix them to point + to the main thread specific variable. + even if section threadvars are used, this shouldn't cause problems as threadState pointers simply + do not change but we do not need it } + HeapInc.thisTs.FixupSelfPtr; {$endif FPC_SECTION_THREADVARS} if MemoryManager.RelocateHeap <> nil then MemoryManager.RelocateHeap(); +{$endif FPC_HAS_FEATURE_THREADING} end; procedure FinalizeHeap; -var - poc, poc_next: poschunk; - loc_freelists: pfreelists; -{$ifdef FPC_HAS_FEATURE_THREADING} - last_thread: boolean; -{$endif} -{$ifdef DUMP_MEM_USAGE} - i : longint; -{$endif} begin { Do not try to do anything if the heap manager already reported an error } if (errorcode=203) or (errorcode=204) then exit; - loc_freelists := @freelists; {$ifdef FPC_HAS_FEATURE_THREADING} - if heap_lock_use > 0 then - begin - EnterCriticalSection(heap_lock); - finish_waitfixedlist(loc_freelists); - finish_waitvarlist(loc_freelists); - end; -{$endif} -{$ifdef HAS_SYSOSFREE} - poc := loc_freelists^.oslist; - while assigned(poc) do - begin - poc_next := poc^.next_free; - { check if this os chunk was 'recycled' i.e. taken in use again } - if (poc^.size and ocrecycleflag) = 0 then - free_oschunk(loc_freelists, poc) - else - poc^.size := poc^.size and not ocrecycleflag; - poc := poc_next; - end; - loc_freelists^.oslist := nil; - loc_freelists^.oscount := 0; -{$endif HAS_SYSOSFREE} -{$ifdef FPC_HAS_FEATURE_THREADING} - if heap_lock_use > 0 then - begin - poc := modify_freelists(loc_freelists, @orphaned_freelists); - if assigned(poc) then + if HeapInc.gs.lockUse > 0 then + EnterCriticalSection(HeapInc.gs.lock); + HeapInc.thisTs.Orphan; + if HeapInc.gs.lockUse > 0 then begin - poc^.next_any := orphaned_freelists.oslist_all; - if assigned(orphaned_freelists.oslist_all) then - orphaned_freelists.oslist_all^.prev_any := poc; - orphaned_freelists.oslist_all := loc_freelists^.oslist_all; + LeaveCriticalSection(HeapInc.gs.lock); + if InterlockedDecrement(HeapInc.gs.lockUse) = 0 then + begin + DoneCriticalSection(HeapInc.gs.lock); + {$ifdef HAS_SYSOSFREE} + HeapInc.gs.freeOS.FreeAll; + {$endif} + end; end; - dec(heap_lock_use); - last_thread := heap_lock_use = 0; - LeaveCriticalSection(heap_lock); - if last_thread then - DoneCriticalSection(heap_lock); - end; -{$endif} -{$ifdef SHOW_MEM_USAGE} - writeln('Max heap used/size: ', loc_freelists^.internal_status.maxheapused, '/', - loc_freelists^.internal_status.maxheapsize); - flush(output); -{$endif} -{$ifdef DUMP_MEM_USAGE} - for i := 0 to sizeusageindex-1 do - if maxsizeusage[i] <> 0 then - writeln('size ', i shl sizeusageshift, ' usage ', maxsizeusage[i]); - writeln('size >', sizeusagesize, ' usage ', maxsizeusage[sizeusageindex]); - flush(output); -{$endif} +{$else FPC_HAS_FEATURE_THREADING} + HeapInc.thisTs.freeOS.FreeAll; +{$endif FPC_HAS_FEATURE_THREADING} end; {$endif ndef HAS_MEMORYMANAGER} {$endif ndef FPC_NO_DEFAULT_MEMORYMANAGER} {$endif defined(FPC_HAS_FEATURE_HEAP) or defined(FPC_IN_HEAPMGR)} - diff --git a/rtl/inc/heaph.inc b/rtl/inc/heaph.inc index 12c681d5dd..1137835e9e 100644 --- a/rtl/inc/heaph.inc +++ b/rtl/inc/heaph.inc @@ -97,12 +97,12 @@ Procedure Freememory(p:pointer;Size:ptruint); Function MemSize(p:pointer):ptruint; { Delphi functions } -function GetMem(size:ptruint):pointer; +function GetMem(size:ptruint):pointer; inline; function GetMemory(size:ptruint):pointer; cdecl; -function Freemem(p:pointer):ptruint; +function Freemem(p:pointer):ptruint; inline; function Freememory(p:pointer):ptruint; cdecl; function AllocMem(Size:ptruint):pointer; -function ReAllocMem(var p:pointer;Size:ptruint):pointer; +function ReAllocMem(var p:pointer;Size:ptruint):pointer; inline; function ReAllocMemory(p:pointer;Size:ptruint):pointer; cdecl; function GetHeapStatus:THeapStatus; function GetFPCHeapStatus:TFPCHeapStatus;