Skip to content

Commit 4a8d8b6

Browse files
committed
Add to TTreePerfStats details caching/read info for each basket
1 parent 43cf893 commit 4a8d8b6

File tree

7 files changed

+200
-2
lines changed

7 files changed

+200
-2
lines changed

core/base/inc/TVirtualPerfStats.h

+7
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,7 @@
2626

2727

2828
class TFile;
29+
class TBranch;
2930

3031

3132
class TVirtualPerfStats : public TObject {
@@ -71,6 +72,12 @@ class TVirtualPerfStats : public TObject {
7172
virtual void SetNumEvents(Long64_t num) = 0;
7273
virtual Long64_t GetNumEvents() const = 0;
7374

75+
virtual void PrintBasketInfo(Option_t * option = "") const = 0;
76+
virtual void SetLoaded(TBranch *b, size_t basketNumber) = 0;
77+
virtual void SetLoadedMiss(TBranch *b, size_t basketNumber) = 0;
78+
virtual void SetMissed(TBranch *b, size_t basketNumber) = 0;
79+
virtual void SetUsed(TBranch *b, size_t basketNumber) = 0;
80+
7481
static const char *EventType(EEventType type);
7582

7683
ClassDef(TVirtualPerfStats,0) // ABC for collecting PROOF statistics

proof/proofplayer/inc/TPerfStats.h

+6
Original file line numberDiff line numberDiff line change
@@ -131,6 +131,12 @@ friend class TProofMonSender;
131131
void SetNumEvents(Long64_t num) { fNumEvents = num; }
132132
Long64_t GetNumEvents() const { return fNumEvents; }
133133

134+
void PrintBasketInfo(Option_t * = "") const {}
135+
void SetLoaded(TBranch *, size_t) {}
136+
void SetLoadedMiss(TBranch *, size_t) {}
137+
void SetMissed(TBranch *, size_t) {}
138+
void SetUsed(TBranch *, size_t) {}
139+
134140
static void Start(TList *input, TList *output);
135141
static void Stop();
136142
static void Setup(TList *input);

tree/tree/inc/TBranch.h

+2
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,7 @@ class TDirectory;
4343
class TFile;
4444
class TClonesArray;
4545
class TTreeCloner;
46+
class TTreeCache;
4647

4748
const Int_t kDoNotProcess = BIT(10); // Active bit for branches
4849
const Int_t kIsClone = BIT(11); // to indicate a TBranchClones
@@ -60,6 +61,7 @@ class TBranch : public TNamed , public TAttFill {
6061
using TIOFeatures = ROOT::TIOFeatures;
6162

6263
protected:
64+
friend class TTreeCache;
6365
friend class TTreeCloner;
6466
friend class TTree;
6567

tree/tree/src/TBranch.cxx

+6
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,7 @@
3939
#include "TTreeCacheUnzip.h"
4040
#include "TVirtualMutex.h"
4141
#include "TVirtualPad.h"
42+
#include "TVirtualPerfStats.h"
4243

4344
#include "TBranchIMTHelper.h"
4445

@@ -1234,6 +1235,11 @@ TBasket* TBranch::GetBasket(Int_t basketnumber)
12341235
}
12351236

12361237
++fNBaskets;
1238+
1239+
auto perfStats = GetTree()->GetPerfStats();
1240+
if (perfStats)
1241+
perfStats->SetUsed(this, basketnumber);
1242+
12371243
fBaskets.AddAt(basket,basketnumber);
12381244
return basket;
12391245
}

tree/tree/src/TTreeCache.cxx

+54-1
Original file line numberDiff line numberDiff line change
@@ -256,6 +256,7 @@ of effective system reads for a given file with a code like
256256
#include "TFriendElement.h"
257257
#include "TFile.h"
258258
#include "TMath.h"
259+
#include "TVirtualPerfStats.h"
259260
#include <limits.h>
260261

261262
Int_t TTreeCache::fgLearnEntries = 100;
@@ -714,6 +715,10 @@ TBranch *TTreeCache::CalculateMissEntries(Long64_t pos, Int_t len, Bool_t all)
714715
Bool_t found_request = kFALSE;
715716
TBranch *resultBranch = nullptr;
716717
Long64_t entry = fTree->GetReadEntry();
718+
719+
std::vector<std::pair<TBranch*,Int_t>> basketsInfo;
720+
auto perfStats = GetTree()->GetPerfStats();
721+
717722
// printf("Will search %d branches for basket at %ld.\n", count, pos);
718723
for (int i = 0; i < count; i++) {
719724
TBranch *b =
@@ -730,12 +735,30 @@ TBranch *TTreeCache::CalculateMissEntries(Long64_t pos, Int_t len, Bool_t all)
730735
}
731736
// At this point, we are ready to push back a new offset
732737
fMissCache->fEntries.emplace_back(std::move(iopos));
738+
739+
if (R__unlikely(perfStats)) {
740+
Int_t blistsize = b->GetWriteBasket();
741+
Int_t basketNumber = -1;
742+
for(Int_t bn = 0; bn < blistsize; ++bn) {
743+
if (iopos.fPos == b->GetBasketSeek(bn)) {
744+
basketNumber = bn;
745+
break;
746+
}
747+
}
748+
if (basketNumber >= 0)
749+
basketsInfo.emplace_back(b, basketNumber);
750+
}
733751
}
734752
if (R__unlikely(!found_request)) {
735753
// We have gone through all the branches in this file and the requested basket
736754
// doesn't appear to be in any of them. Likely a logic error / bug.
737755
fMissCache->fEntries.clear();
738756
}
757+
if (R__unlikely(perfStats)) {
758+
for(auto &info : basketsInfo) {
759+
perfStats->SetLoadedMiss(info.first, info.second);
760+
}
761+
}
739762
return resultBranch;
740763
}
741764

@@ -1011,6 +1034,7 @@ Bool_t TTreeCache::FillBuffer()
10111034
Int_t prevNtot;
10121035
Int_t minBasket = 0; // We will use this to avoid re-checking the first baskets in the 2nd (or more) run in the while loop.
10131036
Long64_t maxReadEntry = minEntry; // If we are stopped before the end of the 2nd pass, this marker will where we need to start next time.
1037+
auto perfStats = GetTree()->GetPerfStats();
10141038
do {
10151039
prevNtot = fNtotCurrentBuf;
10161040
Int_t nextMinBasket = INT_MAX;
@@ -1101,6 +1125,11 @@ Bool_t TTreeCache::FillBuffer()
11011125
}
11021126
}
11031127
}
1128+
1129+
if (R__unlikely(perfStats)) {
1130+
perfStats->SetLoaded(b, j);
1131+
}
1132+
11041133
if (fEnablePrefetching){
11051134
if (fFirstBuffer) {
11061135
TFileCacheRead::Prefetch(pos,len);
@@ -1337,23 +1366,47 @@ Int_t TTreeCache::ReadBufferNormal(char *buf, Long64_t pos, Int_t len){
13371366
return 1;
13381367
}
13391368

1369+
static const auto recordMiss = [](TVirtualPerfStats *perfStats, TObjArray *branches, Bool_t bufferFilled, Long64_t basketpos) {
1370+
if (gDebug > 6)
1371+
::Info("TTreeCache::ReadBufferNormal", "Cache miss after an %s FillBuffer: pos=%lld", bufferFilled ? "active" : "inactive", basketpos);
1372+
for (Int_t i=0; i<branches->GetEntries(); ++i) {
1373+
TBranch *b = (TBranch*)branches->UncheckedAt(i);
1374+
Int_t blistsize = b->GetListOfBaskets()->GetSize();
1375+
for(Int_t j = 0; j < blistsize; ++j) {
1376+
if (basketpos == b->GetBasketSeek(j)) {
1377+
if (gDebug > 6)
1378+
::Info("TTreeCache::ReadBufferNormal"," Missing basket: %d for %s", j, b->GetName());
1379+
perfStats->SetMissed(b, j);
1380+
}
1381+
}
1382+
}
1383+
};
1384+
13401385
//not found in cache. Do we need to fill the cache?
13411386
Bool_t bufferFilled = FillBuffer();
13421387
if (bufferFilled) {
13431388
Int_t res = TFileCacheRead::ReadBuffer(buf,pos,len);
13441389

13451390
if (res == 1)
13461391
fNReadOk++;
1347-
else if (res == 0)
1392+
else if (res == 0) {
13481393
fNReadMiss++;
1394+
auto perfStats = GetTree()->GetPerfStats();
1395+
if (perfStats)
1396+
recordMiss(perfStats, fBranches, bufferFilled, pos);
1397+
}
13491398

13501399
return res;
13511400
}
1401+
13521402
if (CheckMissCache(buf, pos, len)) {
13531403
return 1;
13541404
}
13551405

13561406
fNReadMiss++;
1407+
auto perfStats = GetTree()->GetPerfStats();
1408+
if (perfStats)
1409+
recordMiss(perfStats, fBranches, bufferFilled, pos);
13571410

13581411
return 0;
13591412
}

tree/treeplayer/inc/TTreePerfStats.h

+21-1
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,7 @@
2323

2424
#include "TVirtualPerfStats.h"
2525
#include "TString.h"
26+
#include <vector>
2627

2728

2829
class TBrowser;
@@ -35,6 +36,14 @@ class TGaxis;
3536
class TText;
3637
class TTreePerfStats : public TVirtualPerfStats {
3738

39+
public:
40+
struct BasketInfo {
41+
UInt_t fUsed = {0}; // Number of times the basket was requested from the disk.
42+
UInt_t fLoaded = {0}; // Number of times the basket was put in the primary TTreeCache
43+
UInt_t fLoadedMiss = {0}; // Number of times the basket was put in the secondary cache
44+
UInt_t fMissed = {0}; // Number of times the basket was read directly from the file.
45+
};
46+
3847
protected:
3948
Int_t fTreeCacheSize; //TTreeCache buffer size
4049
Int_t fNleaves; //Number of leaves in the tree
@@ -59,6 +68,11 @@ class TTreePerfStats : public TVirtualPerfStats {
5968
TGaxis *fRealTimeAxis; //pointer to TGaxis object showing real-time
6069
TText *fHostInfoText; //Graphics Text object with the fHostInfo data
6170

71+
72+
std::vector<std::vector<BasketInfo> > fBasketsInfo; // Details on which baskets was used, cached, 'miss-cached' or read uncached.Browse
73+
74+
BasketInfo& GetBasketInfo(TBranch *b, size_t basketNumber);
75+
6276
public:
6377
TTreePerfStats();
6478
TTreePerfStats(const char *name, TTree *T);
@@ -117,7 +131,13 @@ class TTreePerfStats : public TVirtualPerfStats {
117131
virtual void SetTreeCacheSize(Int_t nbytes) {fTreeCacheSize = nbytes;}
118132
virtual void SetUnzipTime(Double_t uztime) {fUnzipTime = uztime;}
119133

120-
ClassDef(TTreePerfStats,6) // TTree I/O performance measurement
134+
virtual void PrintBasketInfo(Option_t * option = "") const;
135+
virtual void SetLoaded(TBranch *b, size_t basketNumber) { ++GetBasketInfo(b, basketNumber).fLoaded; }
136+
virtual void SetLoadedMiss(TBranch *b, size_t basketNumber) { ++GetBasketInfo(b, basketNumber).fLoadedMiss; }
137+
virtual void SetMissed(TBranch *b, size_t basketNumber) { ++GetBasketInfo(b, basketNumber).fMissed; }
138+
virtual void SetUsed(TBranch *b, size_t basketNumber) { ++GetBasketInfo(b, basketNumber).fUsed; }
139+
140+
ClassDef(TTreePerfStats,7) // TTree I/O performance measurement
121141
};
122142

123143
#endif

tree/treeplayer/src/TTreePerfStats.cxx

+104
Original file line numberDiff line numberDiff line change
@@ -85,6 +85,7 @@ The Physical disk speed is DiskIO + DiskIO*ReadExtra/100.
8585
#include "Riostream.h"
8686
#include "TFile.h"
8787
#include "TTree.h"
88+
#include "TTreeCache.h"
8889
#include "TAxis.h"
8990
#include "TBrowser.h"
9091
#include "TVirtualPad.h"
@@ -338,6 +339,41 @@ void TTreePerfStats::Finish()
338339
}
339340
}
340341

342+
////////////////////////////////////////////////////////////////////////////////
343+
/// Return the BasketInfo corresponding to the given branch and basket.
344+
345+
TTreePerfStats::BasketInfo &TTreePerfStats::GetBasketInfo(TBranch *br, size_t basketNumber)
346+
{
347+
static BasketInfo fallback;
348+
349+
// First find the branch index.
350+
TFile *file = fTree->GetCurrentFile();
351+
if (!file)
352+
return fallback;
353+
354+
TTreeCache *cache = dynamic_cast<TTreeCache*>(file->GetCacheRead(fTree));
355+
if (!cache)
356+
return fallback;
357+
358+
auto branches = cache->GetCachedBranches();
359+
Int_t index = -1;
360+
for(Int_t i = 0; i < branches->GetEntries(); ++i) {
361+
if (br == branches->UncheckedAt(i)) {
362+
index = i;
363+
break;
364+
}
365+
}
366+
if (index < 0)
367+
return fallback;
368+
if (fBasketsInfo.size() <= (size_t)index)
369+
fBasketsInfo.resize(index+1);
370+
371+
auto &brvec(fBasketsInfo[index]);
372+
if (brvec.size() <= basketNumber)
373+
brvec.resize(basketNumber+1);
374+
375+
return brvec[basketNumber];
376+
}
341377

342378
////////////////////////////////////////////////////////////////////////////////
343379
/// Draw the TTree I/O perf graph.
@@ -429,6 +465,7 @@ void TTreePerfStats::Print(Option_t * option) const
429465
TString opts(option);
430466
opts.ToLower();
431467
Bool_t unzip = opts.Contains("unzip");
468+
Bool_t basket = opts.Contains("basket");
432469
TTreePerfStats *ps = (TTreePerfStats*)this;
433470
ps->Finish();
434471

@@ -457,8 +494,75 @@ void TTreePerfStats::Print(Option_t * option) const
457494
printf("ReadStrCP = %7.3f MBytes/s\n",1e-6*fCompress*fBytesRead/(fCpuTime-fUnzipTime));
458495
printf("ReadZipCP = %7.3f MBytes/s\n",1e-6*fCompress*fBytesRead/fUnzipTime);
459496
}
497+
if (basket)
498+
PrintBasketInfo(option);
460499
}
461500

501+
////////////////////////////////////////////////////////////////////////////////
502+
/// Print the TTree basket information
503+
504+
void TTreePerfStats::PrintBasketInfo(Option_t * option) const {
505+
506+
TString opts(option);
507+
opts.ToLower();
508+
Bool_t all = opts.Contains("allbasketinfo");
509+
510+
TFile *file = fTree->GetCurrentFile();
511+
if (!file)
512+
return;
513+
514+
TTreeCache *cache = dynamic_cast<TTreeCache*>(file->GetCacheRead(fTree));
515+
if (!cache)
516+
return;
517+
518+
auto branches = cache->GetCachedBranches();
519+
for(size_t i = 0; i < fBasketsInfo.size(); ++i) {
520+
const char *branchname = branches->At(i)->GetName();
521+
522+
printf(" br=%ld %s read not cached: ", i, branchname);
523+
if (fBasketsInfo[i].size() == 0) {
524+
printf("none");
525+
} else for(size_t j = 0; j < fBasketsInfo[i].size(); ++j) {
526+
if (fBasketsInfo[i][j].fMissed) printf("%ld ", j);
527+
}
528+
printf("\n");
529+
530+
printf(" br=%ld %s cached more than once: ", i, branchname);
531+
for(size_t j = 0; j < fBasketsInfo[i].size(); ++j) {
532+
auto &info( fBasketsInfo[i][j] );
533+
if ((info.fLoaded + info.fLoadedMiss) > 1)
534+
printf("%ld[%d,%d] ", j, info.fLoaded, info.fLoadedMiss);
535+
}
536+
printf("\n");
537+
538+
printf(" br=%ld %s cached but not used: ", i, branchname);
539+
for(size_t j = 0; j < fBasketsInfo[i].size(); ++j) {
540+
auto &info( fBasketsInfo[i][j] );
541+
if ( (info.fLoaded + info.fLoadedMiss) && !info.fUsed) {
542+
if (info.fLoadedMiss)
543+
printf("%ld[%d,%d] ", j, info.fLoaded, info.fLoadedMiss);
544+
else
545+
printf("%ld ", j);
546+
}
547+
}
548+
printf("\n");
549+
550+
if (all) {
551+
printf(" br=%ld %s: ", i, branchname);
552+
for(size_t j = 0; j < fBasketsInfo[i].size(); ++j) {
553+
auto &info( fBasketsInfo[i][j] );
554+
printf("%ld[%d,%d,%d,%d] ", j, info.fUsed, info.fLoaded, info.fLoadedMiss, info.fMissed);
555+
}
556+
printf("\n");
557+
}
558+
}
559+
for(Int_t i = fBasketsInfo.size(); i < branches->GetEntries(); ++i) {
560+
printf(" br=%d %s: no basket information\n", i, branches->At(i)->GetName());
561+
}
562+
563+
}
564+
565+
462566
////////////////////////////////////////////////////////////////////////////////
463567
/// Save this object to filename
464568

0 commit comments

Comments
 (0)