From 8d9f77cfe3486fc5766d99e883e28f7d0d47ca81 Mon Sep 17 00:00:00 2001 From: Richard Chapman Date: Wed, 11 Oct 2023 13:06:41 +0100 Subject: [PATCH] HPCC-30475 Roxie disk read calls size() too often Signed-off-by: Richard Chapman --- roxie/ccd/ccdfile.cpp | 22 +++++++++++++++++++--- roxie/ccd/ccdkey.cpp | 7 ++++--- roxie/ccd/ccdstate.hpp | 1 + 3 files changed, 24 insertions(+), 6 deletions(-) diff --git a/roxie/ccd/ccdfile.cpp b/roxie/ccd/ccdfile.cpp index d7762aafc86..6c64951bc7e 100644 --- a/roxie/ccd/ccdfile.cpp +++ b/roxie/ccd/ccdfile.cpp @@ -2353,6 +2353,7 @@ class CFileIOArray : implements IFileIOArray, public CInterface UnsignedArray subfiles; StringArray filenames; Int64Array bases; + mutable Int64Array sizes; // Lazy-evaluated and cached int actualCrc = 0; unsigned valid = 0; bool multipleFormatsSeen = false; @@ -2418,6 +2419,7 @@ class CFileIOArray : implements IFileIOArray, public CInterface valid++; files.append(f); bases.append(base); + sizes.append(-1); // Calculated if/when needed if (_actualCrc) { if (actualCrc && actualCrc != _actualCrc) @@ -2468,14 +2470,28 @@ class CFileIOArray : implements IFileIOArray, public CInterface totalSize = 0; ForEachItemIn(idx, files) { - IFileIO *file = files.item(idx); - if (file) - totalSize += file->size(); + totalSize += partSize(idx); } } return totalSize; } + virtual unsigned __int64 partSize(unsigned idx) const override + { + CriticalBlock b(crit); + __int64 fsize = sizes.item(idx); + if (fsize == -1) + { + IFileIO *file = files.item(idx); + if (file) + fsize = file->size(); + else + fsize = 0; + sizes.replace(fsize, idx); + } + return (unsigned __int64) fsize; + } + virtual StringBuffer &getId(StringBuffer &ret) const override { CriticalBlock b(crit); diff --git a/roxie/ccd/ccdkey.cpp b/roxie/ccd/ccdkey.cpp index c24ad3e2b49..dc21d4fa752 100644 --- a/roxie/ccd/ccdkey.cpp +++ b/roxie/ccd/ccdkey.cpp @@ -691,10 +691,11 @@ class BufferedDirectReader : public CDirectReaderBase while (!_partNo && !thisPart && ++thisPartIdx < maxParts) // MORE { thisPart.setown(f->getFilePart(thisPartIdx, thisFileStartPos)); - if (thisPart && _startPos >= thisPart->size()) + offset_t thisPartSize = f->partSize(thisPartIdx); + if (thisPart && _startPos >= thisPartSize) { - _startPos -= thisPart->size(); - completedStreamsSize += thisPart->size(); + _startPos -= thisPartSize; + completedStreamsSize += thisPartSize; thisPart.clear(); } } diff --git a/roxie/ccd/ccdstate.hpp b/roxie/ccd/ccdstate.hpp index 44340aa9e70..6d8bc4452bc 100644 --- a/roxie/ccd/ccdstate.hpp +++ b/roxie/ccd/ccdstate.hpp @@ -93,6 +93,7 @@ interface IFileIOArray : extends IInterface virtual unsigned numValid() const = 0; virtual bool isValid(unsigned partNo) const = 0; virtual unsigned __int64 size() const = 0; + virtual unsigned __int64 partSize(unsigned partNo) const = 0; virtual StringBuffer &getId(StringBuffer &) const = 0; virtual const char *queryLogicalFilename(unsigned partNo) const = 0; virtual int queryActualFormatCrc() const = 0; // Actual format on disk