You've already forked UnrealEngineUWP
mirror of
https://github.com/izzy2lost/UnrealEngineUWP.git
synced 2026-03-26 18:15:20 -07:00
The async cache hierarchy:
- Is required to add compression to the legacy cache by forwarding LegacyPut/LegacyGet to PutValue/GetValue.
- Is always present in the graph, unlike the previous cache hierarchy, which will allow significant simplification of leaf cache stores.
- Allows the leaf cache store nodes to operate asynchronously without blocking a worker thread, as the previous cache hierarchy did.
- Shifts from controlling cache behavior by speed class to controlling cache behavior by local/remote classification, which is a critical distinction for a cache like Zen that can identify as both local and remote.
- Respects the local/remote and query/store flags in the cache policy.
- Does not fully implement the partial record cache policy at this time.
- Does not propagate records or values in GetChunks, which will be added in a future release.

The verify wrapper was previously missing an implementation for the new cache interface. This version is more efficient than the previous because requests through the new cache interface can compare data without loading it from storage, and load it only when a mismatch has been detected, to dump it to disk.

#jira UE-134381
#lockdown Mark.Lintott
#preflight 61fc32ac0a50c2606f266388
#rb Zousar.Shaker
#rnx
#ROBOMERGE-AUTHOR: devin.doucette
#ROBOMERGE-SOURCE: CL 18851861 in //UE5/Release-5.0/... via CL 18851943 via CL 18852169
#ROBOMERGE-BOT: UE5 (Release-Engine-Test -> Main) (v910-18824042)
[CL 18852184 by devin doucette in ue5-main branch]
266 lines
7.9 KiB
C++
266 lines
7.9 KiB
C++
// Copyright Epic Games, Inc. All Rights Reserved.
|
|
|
|
#include "Algo/Find.h"
|
|
#include "Algo/Transform.h"
|
|
#include "DerivedDataCachePrivate.h"
|
|
#include "DerivedDataCacheRecord.h"
|
|
#include "DerivedDataLegacyCacheStore.h"
|
|
#include "HAL/PlatformProcess.h"
|
|
#include "HAL/PlatformTime.h"
|
|
#include <atomic>
|
|
|
|
namespace UE::DerivedData
|
|
{
|
|
|
|
/**
|
|
* A cache store that increases the latency and reduces the throughput of another cache store.
|
|
* 1. Reproduce timings for a remote cache with a local cache, to reduce both network usage and measurement noise.
|
|
* 2. Reproduce HDD latency and throughput even when data is stored on SSD.
|
|
*/
|
|
class FCacheStoreThrottle final : public ILegacyCacheStore
|
|
{
|
|
public:
|
|
FCacheStoreThrottle(ILegacyCacheStore* InInnerCache, uint32 InLatencyMS, uint32 InMaxBytesPerSecond)
|
|
: InnerCache(InInnerCache)
|
|
, Latency(float(InLatencyMS) / 1000.0f)
|
|
, MaxBytesPerSecond(InMaxBytesPerSecond)
|
|
{
|
|
check(InnerCache);
|
|
}
|
|
|
|
void Put(
|
|
const TConstArrayView<FCachePutRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnCachePutComplete&& OnComplete) final
|
|
{
|
|
struct FRecordSize
|
|
{
|
|
FCacheKey Key;
|
|
uint64 Size;
|
|
};
|
|
TArray<FRecordSize, TInlineAllocator<1>> RecordSizes;
|
|
RecordSizes.Reserve(Requests.Num());
|
|
Algo::Transform(Requests, RecordSizes, [](const FCachePutRequest& Request) -> FRecordSize
|
|
{
|
|
return {Request.Record.GetKey(), Private::GetCacheRecordCompressedSize(Request.Record)};
|
|
});
|
|
|
|
InnerCache->Put(Requests, Owner,
|
|
[this, RecordSizes = MoveTemp(RecordSizes), State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FCachePutResponse&& Response)
|
|
{
|
|
const FRecordSize* Size = Algo::FindBy(RecordSizes, Response.Key, &FRecordSize::Key);
|
|
CloseThrottlingScope(State, FThrottlingState(this, Size ? Size->Size : 0));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
}
|
|
|
|
void Get(
|
|
const TConstArrayView<FCacheGetRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnCacheGetComplete&& OnComplete) final
|
|
{
|
|
InnerCache->Get(Requests, Owner,
|
|
[this, State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FCacheGetResponse&& Response)
|
|
{
|
|
CloseThrottlingScope(State, FThrottlingState(this, Private::GetCacheRecordCompressedSize(Response.Record)));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
}
|
|
|
|
void PutValue(
|
|
const TConstArrayView<FCachePutValueRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnCachePutValueComplete&& OnComplete) final
|
|
{
|
|
struct FValueSize
|
|
{
|
|
FCacheKey Key;
|
|
uint64 Size;
|
|
};
|
|
TArray<FValueSize, TInlineAllocator<1>> ValueSizes;
|
|
ValueSizes.Reserve(Requests.Num());
|
|
Algo::Transform(Requests, ValueSizes, [](const FCachePutValueRequest& Request) -> FValueSize
|
|
{
|
|
return {Request.Key, Request.Value.GetData().GetCompressedSize()};
|
|
});
|
|
|
|
InnerCache->PutValue(Requests, Owner,
|
|
[this, ValueSizes = MoveTemp(ValueSizes), State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FCachePutValueResponse&& Response)
|
|
{
|
|
const FValueSize* Size = Algo::FindBy(ValueSizes, Response.Key, &FValueSize::Key);
|
|
CloseThrottlingScope(State, FThrottlingState(this, Size ? Size->Size : 0));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
}
|
|
|
|
void GetValue(
|
|
const TConstArrayView<FCacheGetValueRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnCacheGetValueComplete&& OnComplete) final
|
|
{
|
|
InnerCache->GetValue(Requests, Owner,
|
|
[this, State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FCacheGetValueResponse&& Response)
|
|
{
|
|
CloseThrottlingScope(State, FThrottlingState(this, Response.Value.GetData().GetCompressedSize()));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
}
|
|
|
|
void GetChunks(
|
|
const TConstArrayView<FCacheGetChunkRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnCacheGetChunkComplete&& OnComplete) final
|
|
{
|
|
InnerCache->GetChunks(Requests, Owner,
|
|
[this, State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FCacheGetChunkResponse&& Response)
|
|
{
|
|
CloseThrottlingScope(State, FThrottlingState(this, Response.RawData.GetSize()));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
|
|
}
|
|
|
|
void LegacyPut(
|
|
const TConstArrayView<FLegacyCachePutRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnLegacyCachePutComplete&& OnComplete) final
|
|
{
|
|
struct FValueSize
|
|
{
|
|
FCacheKey Key;
|
|
uint64 Size;
|
|
};
|
|
TArray<FValueSize, TInlineAllocator<1>> ValueSizes;
|
|
ValueSizes.Reserve(Requests.Num());
|
|
Algo::Transform(Requests, ValueSizes, [](const FLegacyCachePutRequest& Request) -> FValueSize
|
|
{
|
|
return {Request.Key.GetKey(), Request.Value.GetSize()};
|
|
});
|
|
|
|
InnerCache->LegacyPut(Requests, Owner,
|
|
[this, ValueSizes = MoveTemp(ValueSizes), State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FLegacyCachePutResponse&& Response)
|
|
{
|
|
const FValueSize* Size = Algo::FindBy(ValueSizes, Response.Key.GetKey(), &FValueSize::Key);
|
|
CloseThrottlingScope(State, FThrottlingState(this, Size ? Size->Size : 0));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
}
|
|
|
|
void LegacyGet(
|
|
const TConstArrayView<FLegacyCacheGetRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnLegacyCacheGetComplete&& OnComplete) final
|
|
{
|
|
InnerCache->LegacyGet(Requests, Owner,
|
|
[this, State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FLegacyCacheGetResponse&& Response)
|
|
{
|
|
CloseThrottlingScope(State, FThrottlingState(this, Response.Value.GetSize()));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
}
|
|
|
|
void LegacyDelete(
|
|
const TConstArrayView<FLegacyCacheDeleteRequest> Requests,
|
|
IRequestOwner& Owner,
|
|
FOnLegacyCacheDeleteComplete&& OnComplete) final
|
|
{
|
|
InnerCache->LegacyDelete(Requests, Owner,
|
|
[this, State = EnterThrottlingScope(), OnComplete = MoveTemp(OnComplete)](FLegacyCacheDeleteResponse&& Response)
|
|
{
|
|
CloseThrottlingScope(State, FThrottlingState(this, 0));
|
|
if (OnComplete)
|
|
{
|
|
OnComplete(MoveTemp(Response));
|
|
}
|
|
});
|
|
}
|
|
|
|
void LegacyStats(FDerivedDataCacheStatsNode& OutNode) final
|
|
{
|
|
InnerCache->LegacyStats(OutNode);
|
|
}
|
|
|
|
bool LegacyDebugOptions(FBackendDebugOptions& Options) final
|
|
{
|
|
return InnerCache->LegacyDebugOptions(Options);
|
|
}
|
|
|
|
private:
|
|
struct FThrottlingState
|
|
{
|
|
double Time;
|
|
uint64 TotalBytesTransferred;
|
|
|
|
explicit FThrottlingState(FCacheStoreThrottle* ThrottleWrapper)
|
|
: Time(FPlatformTime::Seconds())
|
|
, TotalBytesTransferred(ThrottleWrapper->TotalBytesTransferred.load(std::memory_order_relaxed))
|
|
{
|
|
}
|
|
|
|
explicit FThrottlingState(FCacheStoreThrottle* ThrottleWrapper, uint64 BytesTransferred)
|
|
: Time(FPlatformTime::Seconds())
|
|
, TotalBytesTransferred(ThrottleWrapper->TotalBytesTransferred.fetch_add(BytesTransferred, std::memory_order_relaxed) + BytesTransferred)
|
|
{
|
|
}
|
|
};
|
|
|
|
FThrottlingState EnterThrottlingScope()
|
|
{
|
|
if (Latency > 0)
|
|
{
|
|
TRACE_CPUPROFILER_EVENT_SCOPE(ThrottlingLatency);
|
|
FPlatformProcess::Sleep(Latency);
|
|
}
|
|
return FThrottlingState(this);
|
|
}
|
|
|
|
void CloseThrottlingScope(FThrottlingState PreviousState, FThrottlingState CurrentState)
|
|
{
|
|
if (MaxBytesPerSecond)
|
|
{
|
|
// Take into account any other transfer that might have happened during that time from any other thread so we have a global limit
|
|
const double ExpectedTime = double(CurrentState.TotalBytesTransferred - PreviousState.TotalBytesTransferred) / MaxBytesPerSecond;
|
|
const double ActualTime = CurrentState.Time - PreviousState.Time;
|
|
if (ExpectedTime > ActualTime)
|
|
{
|
|
TRACE_CPUPROFILER_EVENT_SCOPE(ThrottlingBandwidth);
|
|
FPlatformProcess::Sleep(ExpectedTime - ActualTime);
|
|
}
|
|
}
|
|
}
|
|
|
|
/** Backend to use for storage, my responsibilities are about throttling **/
|
|
ILegacyCacheStore* InnerCache;
|
|
float Latency;
|
|
uint32 MaxBytesPerSecond;
|
|
std::atomic<uint64> TotalBytesTransferred{0};
|
|
};
|
|
|
|
/**
 * Wraps InnerCache in a throttling cache store.
 *
 * @param InnerCache          Cache store to wrap.
 * @param LatencyMS           Latency, in milliseconds, passed to the throttle.
 * @param MaxBytesPerSecond   Bandwidth limit, in bytes per second, passed to the throttle.
 * @return The new throttle, allocated with new. NOTE(review): nothing visible here deletes it; confirm who owns the result.
 */
ILegacyCacheStore* CreateCacheStoreThrottle(ILegacyCacheStore* InnerCache, uint32 LatencyMS, uint32 MaxBytesPerSecond)
{
	ILegacyCacheStore* const Throttle = new FCacheStoreThrottle(InnerCache, LatencyMS, MaxBytesPerSecond);
	return Throttle;
}
|
|
|
|
} // UE::DerivedData
|