beegfs/fsck/source/components/worker/RetrieveFsIDsWork.cpp
2025-08-10 01:34:16 +02:00

126 lines
4.1 KiB
C++

#include "RetrieveFsIDsWork.h"
#include <common/net/message/fsck/RetrieveFsIDsMsg.h>
#include <common/net/message/fsck/RetrieveFsIDsRespMsg.h>
#include <common/toolkit/MessagingTk.h>
#include <common/toolkit/MetaStorageTk.h>
#include <database/FsckDBException.h>
#include <toolkit/FsckException.h>
#include <program/Program.h>
/**
 * Sets up a work package that retrieves fsid entries from one node for a range of first-level
 * hash directories.
 *
 * @param db database whose FsIDs table receives the retrieved entries; a new bulk handle is
 *    requested from that table here
 * @param node the node that will be queried
 * @param counter incremented once by process() when the package is done (successfully or not)
 * @param errors increased for every fsid entry that is dropped because of invalid entry IDs;
 *    only its address is stored, so it has to outlive this object
 * @param hashDirStart first first-level hash directory to process (inclusive)
 * @param hashDirEnd last first-level hash directory to process (inclusive)
 */
RetrieveFsIDsWork::RetrieveFsIDsWork(
   FsckDB* db,
   Node& node,
   SynchronizedCounter* counter,
   AtomicUInt64& errors,
   unsigned hashDirStart,
   unsigned hashDirEnd)
   : log("RetrieveFsIDsWork"),
     node(node),
     counter(counter),
     errors(&errors),
     hashDirStart(hashDirStart),
     hashDirEnd(hashDirEnd),
     table(db->getFsIDsTable()),
     bulkHandle(table->newBulkHandle())
{
   // everything is set up by the member initializers above
}
// Nothing to release explicitly here; members clean up through their own destructors.
RetrieveFsIDsWork::~RetrieveFsIDsWork() = default;
/**
 * Executes this work package: retrieves the fsid entries with isBuddyMirrored=false, then with
 * isBuddyMirrored=true, and finally flushes the bulk handle into the table.
 *
 * The counter is incremented exactly once per call, no matter whether the work succeeded or
 * an exception was thrown. Exceptions are re-thrown to the caller after the counter has been
 * incremented.
 *
 * @param bufIn unused by this work package
 * @param bufInLen unused by this work package
 * @param bufOut unused by this work package
 * @param bufOutLen unused by this work package
 * @throw whatever doWork() or the table flush throws (e.g. FsckException on communication
 *    errors)
 */
void RetrieveFsIDsWork::process(char* bufIn, unsigned bufInLen, char* bufOut,
   unsigned bufOutLen)
{
   log.log(4, "Processing RetrieveFsIDsWork");

   try
   {
      doWork(false);
      doWork(true);

      table->flush(bulkHandle);
   }
   catch (...)
   {
      // Exception thrown, but the work package is finished nonetheless => increment counter.
      // Catch everything (not only std::exception), otherwise an exception of a foreign type
      // would leave this package uncounted.
      this->counter->incCount();

      // after incrementing counter, re-throw the original exception unchanged
      throw;
   }

   // work package finished => increment counter
   // (kept outside of the try block so that a failing increment is not attempted twice)
   this->counter->incCount();

   log.log(4, "Processed RetrieveFsIDsWork");
}
void RetrieveFsIDsWork::doWork(bool isBuddyMirrored)
{
for ( unsigned firstLevelhashDirNum = hashDirStart; firstLevelhashDirNum <= hashDirEnd;
firstLevelhashDirNum++ )
{
for ( unsigned secondLevelhashDirNum = 0;
secondLevelhashDirNum < META_DENTRIES_LEVEL2_SUBDIR_NUM; secondLevelhashDirNum++ )
{
unsigned hashDirNum = StorageTk::mergeHashDirs(firstLevelhashDirNum,
secondLevelhashDirNum);
int64_t hashDirOffset = 0;
int64_t contDirOffset = 0;
std::string currentContDirID;
int resultCount = 0;
do
{
RetrieveFsIDsMsg retrieveFsIDsMsg(hashDirNum, isBuddyMirrored, currentContDirID,
RETRIEVE_FSIDS_PACKET_SIZE, hashDirOffset, contDirOffset);
const auto respMsg = MessagingTk::requestResponse(node, retrieveFsIDsMsg,
NETMSGTYPE_RetrieveFsIDsResp);
if (respMsg)
{
auto* retrieveFsIDsRespMsg = (RetrieveFsIDsRespMsg*) respMsg.get();
// set new parameters
currentContDirID = retrieveFsIDsRespMsg->getCurrentContDirID();
hashDirOffset = retrieveFsIDsRespMsg->getNewHashDirOffset();
contDirOffset = retrieveFsIDsRespMsg->getNewContDirOffset();
// parse FS-IDs
FsckFsIDList& fsIDs = retrieveFsIDsRespMsg->getFsIDs();
// this is the actual result count we are interested in, because if no fsIDs
// were read, there is nothing left on the server
resultCount = fsIDs.size();
// check entry IDs
for (auto it = fsIDs.begin(); it != fsIDs.end(); )
{
if (db::EntryID::tryFromStr(it->getID()).first
&& db::EntryID::tryFromStr(it->getParentDirID()).first)
{
++it;
continue;
}
LOG(GENERAL, ERR, "Found fsid file with invalid entry IDs.",
("node", it->getSaveNodeID()),
("isBuddyMirrored", it->getIsBuddyMirrored()),
("entryID", it->getID()),
("parentEntryID", it->getParentDirID()));
++it;
errors->increase();
fsIDs.erase(std::prev(it));
}
this->table->insert(fsIDs, this->bulkHandle);
}
else
{
throw FsckException("Communication error occured with node " + node.getAlias());
}
// if any of the worker threads threw an exception, we should stop now!
if ( Program::getApp()->getShallAbort() )
return;
} while ( resultCount > 0 );
}
}
}