summaryrefslogtreecommitdiffstats
path: root/src/VBox/Devices/Storage/IOBufMgmt.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/VBox/Devices/Storage/IOBufMgmt.cpp')
-rw-r--r--src/VBox/Devices/Storage/IOBufMgmt.cpp543
1 files changed, 543 insertions, 0 deletions
diff --git a/src/VBox/Devices/Storage/IOBufMgmt.cpp b/src/VBox/Devices/Storage/IOBufMgmt.cpp
new file mode 100644
index 00000000..808141da
--- /dev/null
+++ b/src/VBox/Devices/Storage/IOBufMgmt.cpp
@@ -0,0 +1,543 @@
+/* $Id: IOBufMgmt.cpp $ */
+/** @file
+ * VBox storage devices: I/O buffer management API.
+ */
+
+/*
+ * Copyright (C) 2016-2023 Oracle and/or its affiliates.
+ *
+ * This file is part of VirtualBox base platform packages, as
+ * available from https://www.virtualbox.org.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation, in version 3 of the
+ * License.
+ *
+ * This program is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, see <https://www.gnu.org/licenses>.
+ *
+ * SPDX-License-Identifier: GPL-3.0-only
+ */
+#define LOG_GROUP LOG_GROUP_IOBUFMGMT
+#include <VBox/cdefs.h>
+#include <iprt/errcore.h>
+#include <VBox/log.h>
+#include <iprt/assert.h>
+#include <iprt/critsect.h>
+#include <iprt/mem.h>
+#include <iprt/memsafer.h>
+#include <iprt/sg.h>
+#include <iprt/string.h>
+#include <iprt/asm.h>
+
+/** Set to verify the allocations for distinct memory areas. */
+//#define IOBUFMGR_VERIFY_ALLOCATIONS 1
+
+/** The minimum bin size to create - power of two!. */
+#define IOBUFMGR_BIN_SIZE_MIN _4K
+/** The maximum bin size to create - power of two!. */
+#define IOBUFMGR_BIN_SIZE_MAX _1M
+
+/** Pointer to the internal I/O buffer manager data. */
+typedef struct IOBUFMGRINT *PIOBUFMGRINT;
+
+/**
+ * Internal I/O buffer descriptor data.
+ */
+typedef struct IOBUFDESCINT
+{
+ /** Data segments. */
+ RTSGSEG aSegs[10];
+ /** Data segments used for the current allocation. */
+ unsigned cSegsUsed;
+ /** Pointer to I/O buffer manager. */
+ PIOBUFMGRINT pIoBufMgr;
+} IOBUFDESCINT;
+
+/**
+ * A
+ */
+typedef struct IOBUFMGRBIN
+{
+ /** Index of the next free entry. */
+ unsigned iFree;
+ /** Pointer to the array of free objects for this bin. */
+ void **papvFree;
+} IOBUFMGRBIN;
+typedef IOBUFMGRBIN *PIOBUFMGRBIN;
+
+/**
+ * Internal I/O buffer manager data.
+ */
+typedef struct IOBUFMGRINT
+{
+ /** Critical section protecting the allocation path. */
+ RTCRITSECT CritSectAlloc;
+ /** Flags the manager was created with. */
+ uint32_t fFlags;
+ /** Maximum size of I/O memory to allocate. */
+ size_t cbMax;
+ /** Amount of free memory. */
+ size_t cbFree;
+ /** The order of smallest bin. */
+ uint32_t u32OrderMin;
+ /** The order of largest bin. */
+ uint32_t u32OrderMax;
+ /** Pointer to the base memory of the allocation. */
+ void *pvMem;
+ /** Number of bins for free objects. */
+ uint32_t cBins;
+ /** Flag whether allocation is on hold waiting for everything to be free
+ * to be able to defragment the memory. */
+ bool fAllocSuspended;
+ /** Array of bins. */
+ PIOBUFMGRBIN paBins;
+#ifdef IOBUFMGR_VERIFY_ALLOCATIONS
+ /** Pointer to the object state (allocated/free) bitmap. */
+ void *pbmObjState;
+#endif
+ /** Array of pointer entries for the various bins - variable in size. */
+ void *apvObj[1];
+} IOBUFMGRINT;
+
+/* Must be included after IOBUFDESCINT was defined. */
+#define IOBUFDESCINT_DECLARED
+#include "IOBufMgmt.h"
+
+/**
+ * Gets the number of bins required between the given minimum and maximum size
+ * to have a bin for every power of two size inbetween.
+ *
+ * @returns The number of bins required.
+ * @param cbMin The size of the smallest bin.
+ * @param cbMax The size of the largest bin.
+ */
+DECLINLINE(uint32_t) iobufMgrGetBinCount(uint32_t cbMin, uint32_t cbMax)
+{
+ uint32_t u32Max = ASMBitLastSetU32(cbMax);
+ uint32_t u32Min = ASMBitLastSetU32(cbMin);
+
+ Assert(cbMax >= cbMin && cbMax != 0 && cbMin != 0);
+ return u32Max - u32Min + 1;
+}
+
+/**
+ * Returns the number of entries required in the object array to cover all bins.
+ *
+ * @returns Number of entries required in the object array.
+ * @param cbMem Size of the memory buffer.
+ * @param cBins Number of bins available.
+ * @param cbMinBin Minimum object size.
+ */
+DECLINLINE(uint32_t) iobufMgrGetObjCount(size_t cbMem, unsigned cBins, size_t cbMinBin)
+{
+ size_t cObjs = 0;
+ size_t cbBin = cbMinBin;
+
+ while (cBins-- > 0)
+ {
+ cObjs += cbMem / cbBin;
+ cbBin <<= 1; /* The size doubles for every bin. */
+ }
+
+ Assert((uint32_t)cObjs == cObjs);
+ return (uint32_t)cObjs;
+}
+
+DECLINLINE(void) iobufMgrBinObjAdd(PIOBUFMGRBIN pBin, void *pvObj)
+{
+ LogFlowFunc(("pBin=%#p{.iFree=%u} pvObj=%#p\n", pBin, pBin->iFree, pvObj));
+ AssertPtr(pvObj);
+ pBin->papvFree[pBin->iFree] = pvObj;
+ pBin->iFree++;
+ LogFlowFunc(("return pBin=%#p{.iFree=%u}\n", pBin, pBin->iFree));
+}
+
+DECLINLINE(void *) iobufMgrBinObjRemove(PIOBUFMGRBIN pBin)
+{
+ LogFlowFunc(("pBin=%#p{.iFree=%u}\n", pBin, pBin->iFree));
+ Assert(pBin->iFree > 0);
+
+ pBin->iFree--;
+ void *pvObj = pBin->papvFree[pBin->iFree];
+ AssertPtr(pvObj);
+
+ LogFlowFunc(("returns pvObj=%#p pBin=%#p{.iFree=%u}\n", pvObj, pBin, pBin->iFree));
+ return pvObj;
+}
+
+/**
+ * Resets the bins to factory default (memory resigin in the largest bin).
+ *
+ * @param pThis The I/O buffer manager instance.
+ */
+static void iobufMgrResetBins(PIOBUFMGRINT pThis)
+{
+ /* Init the bins. */
+ size_t cbMax = pThis->cbMax;
+ size_t iObj = 0;
+ uint32_t cbBin = IOBUFMGR_BIN_SIZE_MIN;
+ for (unsigned i = 0; i < pThis->cBins; i++)
+ {
+ PIOBUFMGRBIN pBin = &pThis->paBins[i];
+ pBin->iFree = 0;
+ pBin->papvFree = &pThis->apvObj[iObj];
+ iObj += cbMax / cbBin;
+
+ /* Init the biggest possible bin with the free objects. */
+ if ( (cbBin << 1) > cbMax
+ || i == pThis->cBins - 1)
+ {
+ uint8_t *pbMem = (uint8_t *)pThis->pvMem;
+ while (cbMax)
+ {
+ iobufMgrBinObjAdd(pBin, pbMem);
+ cbMax -= cbBin;
+ pbMem += cbBin;
+
+ if (cbMax < cbBin) /** @todo Populate smaller bins and don't waste memory. */
+ break;
+ }
+
+ /* Limit the number of available bins. */
+ pThis->cBins = i + 1;
+ break;
+ }
+
+ cbBin <<= 1;
+ }
+}
+
+/**
+ * Allocate one segment from the manager.
+ *
+ * @returns Number of bytes allocated, 0 if there is no free memory.
+ * @param pThis The I/O buffer manager instance.
+ * @param pSeg The segment to fill in on success.
+ * @param cb Maximum number of bytes to allocate.
+ */
+static size_t iobufMgrAllocSegment(PIOBUFMGRINT pThis, PRTSGSEG pSeg, size_t cb)
+{
+ size_t cbAlloc = 0;
+
+ /* Round to the next power of two and get the bin to try first. */
+ uint32_t u32Order = ASMBitLastSetU32((uint32_t)cb) - 1;
+ if (cb & (RT_BIT_32(u32Order) - 1))
+ u32Order++;
+
+ u32Order = RT_CLAMP(u32Order, pThis->u32OrderMin, pThis->u32OrderMax);
+ unsigned iBin = u32Order - pThis->u32OrderMin;
+
+ /*
+ * Check whether the bin can satisfy the request. If not try the next bigger
+ * bin and so on. If there is nothing to find try the smaller bins.
+ */
+ Assert(iBin < pThis->cBins);
+
+ PIOBUFMGRBIN pBin = &pThis->paBins[iBin];
+ /* Reset the bins if there is nothing in the current one but all the memory is marked as free. */
+ if ( pThis->cbFree == pThis->cbMax
+ && pBin->iFree == 0)
+ iobufMgrResetBins(pThis);
+
+ if (pBin->iFree == 0)
+ {
+ unsigned iBinCur = iBin;
+ PIOBUFMGRBIN pBinCur = &pThis->paBins[iBinCur];
+
+ while (iBinCur < pThis->cBins)
+ {
+ if (pBinCur->iFree != 0)
+ {
+ uint8_t *pbMem = (uint8_t *)iobufMgrBinObjRemove(pBinCur);
+ AssertPtr(pbMem);
+
+ /* Always split into half. */
+ while (iBinCur > iBin)
+ {
+ iBinCur--;
+ pBinCur = &pThis->paBins[iBinCur];
+ iobufMgrBinObjAdd(pBinCur, pbMem + RT_BIT_Z(iBinCur + pThis->u32OrderMin));
+ }
+
+ /* For the last bin we will get two new memory blocks. */
+ iobufMgrBinObjAdd(pBinCur, pbMem);
+ Assert(pBin == pBinCur);
+ break;
+ }
+
+ pBinCur++;
+ iBinCur++;
+ }
+ }
+
+ /*
+ * If we didn't find something in the higher bins try to accumulate as much as possible from the smaller bins.
+ */
+ if ( pBin->iFree == 0
+ && iBin > 0)
+ {
+#if 1
+ pThis->fAllocSuspended = true;
+#else
+ do
+ {
+ iBin--;
+ pBin = &pThis->paBins[iBin];
+
+ if (pBin->iFree != 0)
+ {
+ pBin->iFree--;
+ pSeg->pvSeg = pBin->papvFree[pBin->iFree];
+ pSeg->cbSeg = (size_t)RT_BIT_32(iBin + pThis->u32OrderMin);
+ AssertPtr(pSeg->pvSeg);
+ cbAlloc = pSeg->cbSeg;
+ break;
+ }
+ }
+ while (iBin > 0);
+#endif
+ }
+ else if (pBin->iFree != 0)
+ {
+ pSeg->pvSeg = iobufMgrBinObjRemove(pBin);
+ pSeg->cbSeg = RT_BIT_Z(u32Order);
+ cbAlloc = pSeg->cbSeg;
+ AssertPtr(pSeg->pvSeg);
+
+ pThis->cbFree -= cbAlloc;
+
+#ifdef IOBUFMGR_VERIFY_ALLOCATIONS
+ /* Mark the objects as allocated. */
+ uint32_t iBinStart = ((uintptr_t)pSeg->pvSeg - (uintptr_t)pThis->pvMem) / IOBUFMGR_BIN_SIZE_MIN;
+ Assert( !(((uintptr_t)pSeg->pvSeg - (uintptr_t)pThis->pvMem) % IOBUFMGR_BIN_SIZE_MIN)
+ && !(pSeg->cbSeg % IOBUFMGR_BIN_SIZE_MIN));
+ uint32_t iBinEnd = iBinStart + (pSeg->cbSeg / IOBUFMGR_BIN_SIZE_MIN);
+ while (iBinStart < iBinEnd)
+ {
+ bool fState = ASMBitTestAndSet(pThis->pbmObjState, iBinStart);
+ //LogFlowFunc(("iBinStart=%u fState=%RTbool -> true\n", iBinStart, fState));
+ AssertMsg(!fState, ("Trying to allocate an already allocated object\n"));
+ iBinStart++;
+ }
+#endif
+ }
+
+ return cbAlloc;
+}
+
+DECLHIDDEN(int) IOBUFMgrCreate(PIOBUFMGR phIoBufMgr, size_t cbMax, uint32_t fFlags)
+{
+ int rc = VINF_SUCCESS;
+
+ AssertPtrReturn(phIoBufMgr, VERR_INVALID_POINTER);
+ AssertReturn(cbMax, VERR_NOT_IMPLEMENTED);
+
+ /* Allocate the basic structure in one go. */
+ unsigned cBins = iobufMgrGetBinCount(IOBUFMGR_BIN_SIZE_MIN, IOBUFMGR_BIN_SIZE_MAX);
+ uint32_t cObjs = iobufMgrGetObjCount(cbMax, cBins, IOBUFMGR_BIN_SIZE_MIN);
+ PIOBUFMGRINT pThis = (PIOBUFMGRINT)RTMemAllocZ(RT_UOFFSETOF_DYN(IOBUFMGRINT, apvObj[cObjs]) + cBins * sizeof(IOBUFMGRBIN));
+ if (RT_LIKELY(pThis))
+ {
+ pThis->fFlags = fFlags;
+ pThis->cbMax = cbMax;
+ pThis->cbFree = cbMax;
+ pThis->cBins = cBins;
+ pThis->fAllocSuspended = false;
+ pThis->u32OrderMin = ASMBitLastSetU32(IOBUFMGR_BIN_SIZE_MIN) - 1;
+ pThis->u32OrderMax = ASMBitLastSetU32(IOBUFMGR_BIN_SIZE_MAX) - 1;
+ pThis->paBins = (PIOBUFMGRBIN)((uint8_t *)pThis + RT_UOFFSETOF_DYN(IOBUFMGRINT, apvObj[cObjs]));
+
+#ifdef IOBUFMGR_VERIFY_ALLOCATIONS
+ pThis->pbmObjState = RTMemAllocZ((cbMax / IOBUFMGR_BIN_SIZE_MIN / 8) + 1);
+ if (!pThis->pbmObjState)
+ rc = VERR_NO_MEMORY;
+#endif
+
+ if (RT_SUCCESS(rc))
+ rc = RTCritSectInit(&pThis->CritSectAlloc);
+ if (RT_SUCCESS(rc))
+ {
+ if (pThis->fFlags & IOBUFMGR_F_REQUIRE_NOT_PAGABLE)
+ rc = RTMemSaferAllocZEx(&pThis->pvMem, RT_ALIGN_Z(pThis->cbMax, _4K),
+ RTMEMSAFER_F_REQUIRE_NOT_PAGABLE);
+ else
+ pThis->pvMem = RTMemPageAllocZ(RT_ALIGN_Z(pThis->cbMax, _4K));
+
+ if ( RT_LIKELY(pThis->pvMem)
+ && RT_SUCCESS(rc))
+ {
+ iobufMgrResetBins(pThis);
+
+ *phIoBufMgr = pThis;
+ return VINF_SUCCESS;
+ }
+ else
+ rc = VERR_NO_MEMORY;
+
+ RTCritSectDelete(&pThis->CritSectAlloc);
+ }
+
+ RTMemFree(pThis);
+ }
+ else
+ rc = VERR_NO_MEMORY;
+
+ return rc;
+}
+
+DECLHIDDEN(int) IOBUFMgrDestroy(IOBUFMGR hIoBufMgr)
+{
+ PIOBUFMGRINT pThis = hIoBufMgr;
+
+ AssertPtrReturn(pThis, VERR_INVALID_HANDLE);
+
+ int rc = RTCritSectEnter(&pThis->CritSectAlloc);
+ if (RT_SUCCESS(rc))
+ {
+ if (pThis->cbFree == pThis->cbMax)
+ {
+ if (pThis->fFlags & IOBUFMGR_F_REQUIRE_NOT_PAGABLE)
+ RTMemSaferFree(pThis->pvMem, RT_ALIGN_Z(pThis->cbMax, _4K));
+ else
+ RTMemPageFree(pThis->pvMem, RT_ALIGN_Z(pThis->cbMax, _4K));
+
+#ifdef IOBUFMGR_VERIFY_ALLOCATIONS
+ AssertPtr(pThis->pbmObjState);
+ RTMemFree(pThis->pbmObjState);
+ pThis->pbmObjState = NULL;
+#endif
+
+ RTCritSectLeave(&pThis->CritSectAlloc);
+ RTCritSectDelete(&pThis->CritSectAlloc);
+ RTMemFree(pThis);
+ }
+ else
+ {
+ rc = VERR_INVALID_STATE;
+ RTCritSectLeave(&pThis->CritSectAlloc);
+ }
+ }
+
+ return rc;
+}
+
+DECLHIDDEN(int) IOBUFMgrAllocBuf(IOBUFMGR hIoBufMgr, PIOBUFDESC pIoBufDesc, size_t cbIoBuf, size_t *pcbIoBufAllocated)
+{
+ PIOBUFMGRINT pThis = hIoBufMgr;
+
+ LogFlowFunc(("pThis=%#p pIoBufDesc=%#p cbIoBuf=%zu pcbIoBufAllocated=%#p\n",
+ pThis, pIoBufDesc, cbIoBuf, pcbIoBufAllocated));
+
+ AssertPtrReturn(pThis, VERR_INVALID_HANDLE);
+ AssertReturn(cbIoBuf > 0, VERR_INVALID_PARAMETER);
+
+ if ( !pThis->cbFree
+ || pThis->fAllocSuspended)
+ return VERR_NO_MEMORY;
+
+ int rc = RTCritSectEnter(&pThis->CritSectAlloc);
+ if (RT_SUCCESS(rc))
+ {
+ unsigned iSeg = 0;
+ size_t cbLeft = cbIoBuf;
+ size_t cbIoBufAlloc = 0;
+ PRTSGSEG pSeg = &pIoBufDesc->Int.aSegs[0];
+
+ while ( iSeg < RT_ELEMENTS(pIoBufDesc->Int.aSegs)
+ && cbLeft)
+ {
+ size_t cbAlloc = iobufMgrAllocSegment(pThis, pSeg, cbLeft);
+ if (!cbAlloc)
+ break;
+
+ iSeg++;
+ pSeg++;
+ cbLeft -= RT_MIN(cbAlloc, cbLeft);
+ cbIoBufAlloc += cbAlloc;
+ }
+
+ if (iSeg)
+ RTSgBufInit(&pIoBufDesc->SgBuf, &pIoBufDesc->Int.aSegs[0], iSeg);
+ else
+ rc = VERR_NO_MEMORY;
+
+ pIoBufDesc->Int.cSegsUsed = iSeg;
+ pIoBufDesc->Int.pIoBufMgr = pThis;
+ *pcbIoBufAllocated = cbIoBufAlloc;
+ Assert( (RT_SUCCESS(rc) && *pcbIoBufAllocated > 0)
+ || RT_FAILURE(rc));
+
+ RTCritSectLeave(&pThis->CritSectAlloc);
+ }
+
+ return rc;
+}
+
+DECLHIDDEN(void) IOBUFMgrFreeBuf(PIOBUFDESC pIoBufDesc)
+{
+ PIOBUFMGRINT pThis = pIoBufDesc->Int.pIoBufMgr;
+
+ LogFlowFunc(("pIoBufDesc=%#p{.cSegsUsed=%u}\n", pIoBufDesc, pIoBufDesc->Int.cSegsUsed));
+
+ AssertPtr(pThis);
+
+ int rc = RTCritSectEnter(&pThis->CritSectAlloc);
+ AssertRC(rc);
+
+ if (RT_SUCCESS(rc))
+ {
+ for (unsigned i = 0; i < pIoBufDesc->Int.cSegsUsed; i++)
+ {
+ PRTSGSEG pSeg = &pIoBufDesc->Int.aSegs[i];
+
+ uint32_t u32Order = ASMBitLastSetU32((uint32_t)pSeg->cbSeg) - 1;
+ unsigned iBin = u32Order - pThis->u32OrderMin;
+
+ Assert(iBin < pThis->cBins);
+ PIOBUFMGRBIN pBin = &pThis->paBins[iBin];
+ iobufMgrBinObjAdd(pBin, pSeg->pvSeg);
+ pThis->cbFree += pSeg->cbSeg;
+
+#ifdef IOBUFMGR_VERIFY_ALLOCATIONS
+ /* Mark the objects as free. */
+ uint32_t iBinStart = ((uintptr_t)pSeg->pvSeg - (uintptr_t)pThis->pvMem) / IOBUFMGR_BIN_SIZE_MIN;
+ Assert( !(((uintptr_t)pSeg->pvSeg - (uintptr_t)pThis->pvMem) % IOBUFMGR_BIN_SIZE_MIN)
+ && !(pSeg->cbSeg % IOBUFMGR_BIN_SIZE_MIN));
+ uint32_t iBinEnd = iBinStart + (pSeg->cbSeg / IOBUFMGR_BIN_SIZE_MIN);
+ while (iBinStart < iBinEnd)
+ {
+ bool fState = ASMBitTestAndClear(pThis->pbmObjState, iBinStart);
+ //LogFlowFunc(("iBinStart=%u fState=%RTbool -> false\n", iBinStart, fState));
+ AssertMsg(fState, ("Trying to free a non allocated object\n"));
+ iBinStart++;
+ }
+
+ /* Poison the state. */
+ pSeg->cbSeg = ~0;
+ pSeg->pvSeg = (void *)~(uintptr_t)0;
+#endif
+ }
+
+ if ( pThis->cbFree == pThis->cbMax
+ && pThis->fAllocSuspended)
+ {
+ iobufMgrResetBins(pThis);
+ pThis->fAllocSuspended = false;
+ }
+
+ RTCritSectLeave(&pThis->CritSectAlloc);
+ }
+
+ pIoBufDesc->Int.cSegsUsed = 0;
+#ifdef IOBUFMGR_VERIFY_ALLOCATIONS
+ memset(&pIoBufDesc->SgBuf, 0xff, sizeof(pIoBufDesc->SgBuf));
+#endif
+}
+