/**************************************************************************** ** TAU Portable Profiling Package ** ** http://www.cs.uoregon.edu/research/paracomp/tau ** ***************************************************************************** ** Copyright 2003 ** ** Department of Computer and Information Science, University of Oregon ** ** Advanced Computing Laboratory, Los Alamos National Laboratory ** ** Research Center Juelich, Germany ** ****************************************************************************/ /*************************************************************************** ** File : tau2vtf.cpp ** ** Description : TAU to VTF3 translator ** ** Author : Sameer Shende ** ** Contact : sameer@cs.uoregon.edu ** ***************************************************************************/ #include #include #include #include #include /* VTF3 header file */ #include #include #include #include #include #include using namespace std; int debugPrint = 0; bool multiThreaded = false; #define dprintf if (debugPrint) printf /* The choice of the following numbers is arbitrary */ #define TAU_SAMPLE_CLASS_TOKEN 71 #define TAU_DEFAULT_COMMUNICATOR 42 /* any unique id */ /* implementation of callback routines */ map< pair, int, less< pair > > EOF_Trace; map< int,int, less > numthreads; //map< int,int > nodename; map nodenum; map threadnum; map,int, less< pair > > GlobalId; int countthreads = 0; /* numthreads[k] is no. of threads in rank k */ int EndOfTrace = 0; /* false */ /* Define limits of sample data (user defined events) */ struct { unsigned long long umin; unsigned long long umax; } taulongbounds = { 0, (unsigned long long)~(unsigned long long)0 }; struct { double fmin; double fmax; } taufloatbounds = {-1.0e+300, +1.0e+300}; /* These structures are used in user defined event data */ /* Global data */ int sampgroupid = 0; int sampclassid = 0; vector > callstack; //int *offset = 0; /* FIX GlobalID so it takes into account numthreads */ /* utilities */ /* int GlobalId(int localnodeid, int localthreadid) { localnodeid=nodename[localnodeid]; if (multiThreaded) { if (offset == (int *) NULL) { printf("Error: offset vector is NULL in GlobalId()\n"); return localnodeid; }*/ /* for multithreaded programs, modify this routine */ // return offset[localnodeid]+localthreadid; /* for single node program */ /* } else { return localnodeid; } }*/ /* implementation of callback routines */ /*************************************************************************** * Description: EnterState is called at routine entry by trace input library * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int EnterState(void *userData, double time, unsigned int nodeid, unsigned int tid, unsigned int stateid) { dprintf("Entered state %d time %g nid %d tid %d\n", stateid, time, nodeid, tid); int cpuid = GlobalId[pair(nodeid, tid)]; if (cpuid >= callstack.size()) { fprintf(stderr, "ERROR: tau2vtf: EnterState() cpuid %d exceeds callstack size %d\n", cpuid, callstack.size()); exit(1); } callstack[cpuid].push(stateid); VTF3_WriteDownto(userData, time, stateid, cpuid, VTF3_SCLNONE); return 0; } /*************************************************************************** * Description: LeaveState is called at routine exit by trace input library * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int LeaveState(void *userData, double time, unsigned int nid, unsigned int tid, unsigned int stateid) { dprintf("Leaving state time %g nid %d tid %d\n", time, nid, tid); int cpuid = GlobalId[pair(nid, tid)]; if (callstack[cpuid].size()==0) { fprintf(stderr, "ERROR: tau2vtf: LeaveState() cpuid %d has state departure before entry\n", cpuid); exit(1); } int localstateid = callstack[cpuid].top(); callstack[cpuid].pop(); VTF3_WriteUpfrom(userData, time, localstateid, cpuid, VTF3_SCLNONE); return 0; } /*************************************************************************** * Description: ClockPeriod (in microseconds) is specified here. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int ClockPeriod( void* userData, double clkPeriod ) { dprintf("Clock period %g\n", clkPeriod); VTF3_WriteDefclkperiod(userData, clkPeriod); return 0; } /*************************************************************************** * Description: DefThread is called when a new nodeid/threadid is encountered. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int DefThread(void *userData, unsigned int nodeToken, unsigned int threadToken, const char *threadName ) { dprintf("DefThread nid %d tid %d, thread name %s\n", nodeToken, threadToken, threadName); EOF_Trace[pair (nodeToken,threadToken) ] = 0; /* initialize it */ countthreads++; numthreads[nodeToken] = numthreads[nodeToken] + 1; /*if(numthreads[nodeToken]==1) { nodename[nodeToken]=countnodes;//nodename.size(); nodenum[countnodes]=nodeToken; countnodes++; printf("Node: %d, ID: %d\n",nodeToken,nodename[nodeToken]); }*/ if (threadToken > 0) multiThreaded = true; return 0; } /*************************************************************************** * Description: EndTrace is called when an EOF is encountered in a tracefile. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int EndTrace( void *userData, unsigned int nodeToken, unsigned int threadToken) { dprintf("EndTrace nid %d tid %d\n", nodeToken, threadToken); EOF_Trace[pair (nodeToken,threadToken) ] = 1; /* flag it as over */ /* yes, it is over */ map < pair, int, less< pair > >::iterator it; EndOfTrace = 1; /* Lets assume that it is over */ for (it = EOF_Trace.begin(); it != EOF_Trace.end(); it++) { /* cycle through all pairs to see if it really over */ if ((*it).second == 0) { EndOfTrace = 0; /* not over! */ /* If there's any processor that is not over, then the trace is not over */ } } return 0; } /*************************************************************************** * Description: DefStateGroup registers a profile group name with its id. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int DefStateGroup( void *userData, unsigned int stateGroupToken, const char *stateGroupName ) { dprintf("StateGroup groupid %d, group name %s\n", stateGroupToken, stateGroupName); /* create a default activity (group) */ VTF3_WriteDefact(userData, stateGroupToken, stateGroupName); return 0; } /*************************************************************************** * Description: DefState is called to define a new symbol (event). It uses * the token used to define the group identifier. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int DefState( void *userData, unsigned int stateToken, const char *stateName, unsigned int stateGroupToken ) { dprintf("DefState stateid %d stateName %s stategroup id %d\n", stateToken, stateName, stateGroupToken); /* We need to remove the backslash and quotes from "\"funcname\"" */ char *name = strdup(stateName); int len = strlen(name); if ((name[0] == '"' ) && (name[len-1] == '"')) { name += 1; name[len-2] = '\0'; } /* create a state record */ VTF3_WriteDefstate(userData, stateGroupToken, stateToken, (const char *) name, VTF3_SCLNONE); return 0; } /*************************************************************************** * Description: DefUserEvent is called to register the name and a token of the * user defined event (or a sample event in Vampir terminology). * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int DefUserEvent( void *userData, unsigned int userEventToken, const char *userEventName , int monotonicallyIncreasing) { dprintf("DefUserEvent event id %d user event name %s\n", userEventToken, userEventName); /* VTF3_WriteDefsampclass(userData, userEventToken, userEventName); */ int iscpugrpsamp = 1; int dodifferentiation; /* We need to remove the backslash and quotes from "\"funcname\"" */ char *name = strdup(userEventName); int len = strlen(name); if ((name[0] == '"' ) && (name[len-1] == '"')) { name += 1; name[len-2] = '\0'; } /* create a state record */ if (monotonicallyIncreasing) { dodifferentiation = 1; /* for hw counter data */ VTF3_WriteDefsamp(userData, userEventToken, TAU_SAMPLE_CLASS_TOKEN, iscpugrpsamp, sampgroupid, VTF3_VALUETYPE_UINT, (void *) &taulongbounds, dodifferentiation, VTF3_DATAREPHINT_BEFORE, (const char *) name, "#/s"); } else { /* for non monotonically increasing data */ dodifferentiation = 0; /* for TAU user defined events */ VTF3_WriteDefsamp(userData, userEventToken, TAU_SAMPLE_CLASS_TOKEN, iscpugrpsamp, sampgroupid, VTF3_VALUETYPE_UINT, (void *) &taulongbounds, dodifferentiation, VTF3_DATAREPHINT_BEFORE, (const char *) name, "#"); } return 0; } /*************************************************************************** * Description: EventTrigger is called when a user defined event is triggered. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int EventTrigger( void *userData, double time, unsigned int nodeToken, unsigned int threadToken, unsigned int userEventToken, long long userEventValue) { dprintf("EventTrigger: time %g, nid %d tid %d event id %d triggered value %lld \n", time, nodeToken, threadToken, userEventToken, userEventValue); int type = VTF3_VALUETYPE_UINT; int cpuid = GlobalId[pair(nodeToken, threadToken)]; /* GID */ int samplearraydim = 1; /* write the sample data */ VTF3_WriteSamp(userData, time, cpuid, samplearraydim, (const int *) &userEventToken, &type, &userEventValue); return 0; } /*************************************************************************** * Description: SendMessage is called when a message is sent by a process. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int SendMessage( void *userData, double time, unsigned int sourceNodeToken, unsigned int sourceThreadToken, unsigned int destinationNodeToken, unsigned int destinationThreadToken, unsigned int messageSize, unsigned int messageTag, unsigned int messageComm) { dprintf("SendMessage: time %g, source nid %d tid %d, destination nid %d tid %d, size %d, tag %d\n", time, sourceNodeToken, sourceThreadToken, destinationNodeToken, destinationThreadToken, messageSize, messageTag); int source = GlobalId[pair(sourceNodeToken, sourceThreadToken)]; int dest = GlobalId[pair(destinationNodeToken, destinationThreadToken)]; VTF3_WriteSendmsg(userData, time, source, dest, TAU_DEFAULT_COMMUNICATOR, messageTag, messageSize, VTF3_SCLNONE); return 0; } /*************************************************************************** * Description: RecvMessage is called when a message is received by a process. * This is a callback routine which must be registered by the * trace converter. ***************************************************************************/ int RecvMessage( void *userData, double time, unsigned int sourceNodeToken, unsigned int sourceThreadToken, unsigned int destinationNodeToken, unsigned int destinationThreadToken, unsigned int messageSize, unsigned int messageTag, unsigned int messageComm) { dprintf("RecvMessage: time %g, source nid %d tid %d, destination nid %d tid %d, size %d, tag %d\n", time, sourceNodeToken, sourceThreadToken, destinationNodeToken, destinationThreadToken, messageSize, messageTag); int source = GlobalId[pair(sourceNodeToken, sourceThreadToken)]; int dest = GlobalId[pair(destinationNodeToken, destinationThreadToken)]; VTF3_WriteRecvmsg(userData, time, dest, source, TAU_DEFAULT_COMMUNICATOR, messageTag, messageSize, VTF3_SCLNONE); return 0; } /*************************************************************************** * Description: To clean up and reset the end of file marker, we invoke this. ***************************************************************************/ int ResetEOFTrace(void) { /* mark all entries of EOF_Trace to be false */ for (map< pair, int, less< pair > >:: iterator it = EOF_Trace.begin(); it != EOF_Trace.end(); it++) { /* Explicilty mark end of trace to be not over */ (*it).second = 0; } return 0; } void usage(char *s) { fprintf(stderr,"Usage: %s [-a|-fa] [-nomessage] [-v]\n", s); fprintf(stderr," -a : ASCII VTF3 file format\n"); fprintf(stderr," -fa : FAST ASCII VTF3 file format\n"); fprintf(stderr," -nomessage : Suppress printing of message information in the trace\n"); fprintf(stderr," -v : Verbose\n"); fprintf(stderr," Default trace format of is VTF3 binary\n"); fprintf(stderr," e.g.,\n"); fprintf(stderr," %s merged.trc tau.edf app.vpt.gz\n\n", s); } /*************************************************************************** * Description: The main entrypoint. ***************************************************************************/ int main(int argc, char **argv) { Ttf_FileHandleT fh; int recs_read, pos; char *trace_file; char *edf_file = NULL; char *out_file = NULL; int output_format = VTF3_FILEFORMAT_STD_BINARY; /* Binary by default */ int no_state_flag=0, no_message_flag=0; int i; /* main program: Usage app [-a] [-nomessage] */ if (argc < 4) { usage(argv[0]); exit(1); } /*************************************************************************** * -a stands for ASCII, -fa stands for FAST ASCII and -v is for verbose. ***************************************************************************/ for (i = 0; i < argc ; i++) { switch(i) { case 0: trace_file = argv[1]; break; case 1: edf_file = argv[2]; break; case 2: out_file = argv[3]; break; default: if (strcmp(argv[i], "-a")==0) { /* Use ASCII format */ output_format = VTF3_FILEFORMAT_STD_ASCII; } if (strcmp(argv[i], "-fa")==0) { /* Use FAST ASCII format */ output_format = VTF3_FILEFORMAT_FST_ASCII; } if (strcmp(argv[i], "-nomessage")==0) { no_message_flag = 1; } if (strcmp(argv[i], "-v") == 0) { debugPrint = 1; } break; } } /* Finished parsing commandline options, now open the trace file */ fh = Ttf_OpenFileForInput( argv[1], argv[2]); if (!fh) { fprintf(stderr,"ERROR:Ttf_OpenFileForInput failed\n"); exit(1); } if (out_file == NULL) { fprintf(stderr,"ERROR: Please specify an output file\n"); usage(argv[0]); exit(1); } /* Open VTF3 Trace file for output */ (void) VTF3_InitTables(); int write_unmerged_records ; /* Define the file control block for output trace file */ void *fcb = VTF3_OpenFileOutput(out_file, output_format, write_unmerged_records = 0); /* check and verify that it was opened properly */ if (fcb == 0) { perror(out_file); exit(1); } /* Write the trace file header */ VTF3_WriteDefversion(fcb, VTF3_GetVersionNumber()); VTF3_WriteDefcreator(fcb, "tau2vtf converter"); VTF3_WriteDefsampclass(fcb, TAU_SAMPLE_CLASS_TOKEN, "TAU counter data"); /* in the first pass, we determine the no. of cpus and other group related * information. In the second pass, we look at the function entry/exits */ Ttf_CallbacksT firstpass; /* In the first pass, we just look for node/thread ids and def records */ firstpass.UserData = fcb; firstpass.DefThread = DefThread; firstpass.EndTrace = EndTrace; firstpass.DefClkPeriod = ClockPeriod; //firstpass.DefThread = DefThread; firstpass.DefStateGroup = DefStateGroup; firstpass.DefState = DefState; firstpass.SendMessage = 0; /* Important to declare these as null! */ firstpass.RecvMessage = 0; /* Important to declare these as null! */ firstpass.DefUserEvent = 0; firstpass.EventTrigger = 0; /* these events are ignored in the first pass */ firstpass.EnterState = 0; /* these events are ignored in the first pass */ firstpass.LeaveState = 0; /* these events are ignored in the first pass */ /* Go through all trace records */ do { recs_read = Ttf_ReadNumEvents(fh,firstpass, 1024); #ifdef DEBUG if (recs_read != 0) cout <<"Read "<=0) && (!EndOfTrace)); /* reset the position of the trace to the first record Initialize global id map*/ int global = 0; for (map< pair, int, less< pair > >:: iterator it = EOF_Trace.begin(); it != EOF_Trace.end(); it++) { /* Explicilty mark end of trace to be not over */ GlobalId[pair((*it).first)]=global; nodenum[global]=((*it).first).first; threadnum[global]=((*it).first).second; //printf("nodenum: %d, nodeid: %d, threadid: %d\n",global, ((*it).first).first,((*it).first).second); global++; (*it).second = 0; } /* for (map< pair, int, less< pair > >:: iterator it = GlobalId.begin(); it != GlobalId.end(); it++) { // Explicilty mark end of trace to be not over GlobalId[*it] = global; global++; }*/ int totalnidtids = EOF_Trace.size(); /* This is ok for single threaded programs. For multi-threaded programs * we'll need to modify the way we describe the cpus/threads */ VTF3_WriteDefsyscpunums(fcb, 1, &totalnidtids); /* Then write out the thread names if it is multi-threaded */ if (multiThreaded) { /* create the thread ids */ unsigned int groupid = 0x1 << 31; /* Valid vampir group id nos */ int tid = 0; int nodes = numthreads.size(); /* total no. of nodes */ int *threadnumarray = new int[nodes]; //offset = new int[nodes+1]; //offset[0] = 0; /* no offset for node 0 */ for (i=0; i < nodes; i++) { // one for each node threadnumarray[i] = numthreads[i]; //offset[i+1] = offset[i] + numthreads[i]; } unsigned int *cpuidarray = new unsigned int[totalnidtids]; /* max */ /* next, we write the cpu name and a group name for node/threads */ char name[64]; int thisnode=-1; for (i=0; i < countthreads; i++) { //for (tid = 0; tid < threadnumarray[i]; tid++) //{ sprintf(name, "node %d, thread %d", nodenum[i], threadnum[i]); int cpuid = GlobalId[pair(nodenum[i],threadnum[i])]; VTF3_WriteDefcpuname(fcb, cpuid, name); //printf("i: %d, nodenum[i]: %d, threadnum[i]: %d, cpuid: %d, name: %s\n",i,nodenum[i],threadnum[i],cpuid,name); //} if(thisnode!=nodenum[i]) { thisnode=nodenum[i]; sprintf(name, "Node %d", nodenum[i]); groupid ++; /* let flat group for samples take the first one */ /* Define a group: threadnumarray[i] represents no. of threads in node */ for(int j=0;j(nodenum[i],threadnum[i+j])]; //printf("cpuidarray: %d",cpuidarray[j]); } //printf("name: %s, numthreads:",) VTF3_WriteDefcpugrp(fcb, groupid, numthreads[thisnode], (const unsigned int *) cpuidarray, name); } } delete[] cpuidarray; } else { int nodes = numthreads.size(); for(i=0;i(nodenum[i],0)]; //printf("id: %d, name: %d\n",cpuid, nodenum[i]); VTF3_WriteDefcpuname(fcb, cpuid, name); } } unsigned int *idarray = new unsigned int[totalnidtids]; for (i = 0; i < totalnidtids; i++) { /* assign i to each entry */ idarray[i] = i; } /* create a callstack on each thread/process id */ dprintf("totalnidtids = %d\n", totalnidtids); //callstack = new stack [totalnidtids](); callstack.resize(totalnidtids); /* Define group ids */ char name[1024]; strcpy(name, "TAU sample group name"); VTF3_WriteDefcpugrp(fcb, sampgroupid, totalnidtids, idarray, name); EndOfTrace = 0; /* now reset the position of the trace to the first record */ Ttf_CloseFile(fh); /* Re-open it for input */ fh = Ttf_OpenFileForInput( argv[1], argv[2]); if (!fh) { printf("ERROR:Ttf_OpenFileForInput fails the second time"); exit(1); } dprintf("Re-analyzing the trace file \n"); Ttf_CallbacksT cb; /* Fill the callback struct */ cb.UserData = fcb; cb.DefClkPeriod = 0; cb.DefThread = 0; cb.DefStateGroup = 0; cb.DefState = 0; cb.DefUserEvent = DefUserEvent; cb.EventTrigger = EventTrigger; cb.EndTrace = EndTrace; /* should state transitions be displayed? */ /* Of course! */ cb.EnterState = EnterState; cb.LeaveState = LeaveState; /* should messages be displayed? */ if (no_message_flag) { cb.SendMessage = 0; cb.RecvMessage = 0; } else { cb.SendMessage = SendMessage; cb.RecvMessage = RecvMessage; } int writtenchars; size_t writtenbytes; /* Go through each record until the end of the trace file */ do { recs_read = Ttf_ReadNumEvents(fh,cb, 1024); #ifdef DEBUG if (recs_read != 0) cout <<"Read "<=0) && (!EndOfTrace)); /* dummy records */ Ttf_CloseFile(fh); /* close VTF file */ VTF3_Close(fcb); return 0; } /* EOF tau2vtf.cpp */ /*************************************************************************** * $RCSfile: tau2vtf.cpp,v $ $Author: amorris $ * $Revision: 1.18 $ $Date: 2009/09/16 23:48:50 $ * VERSION_ID: $Id: tau2vtf.cpp,v 1.18 2009/09/16 23:48:50 amorris Exp $ ***************************************************************************/