123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539 |
/* StarPU --- Runtime system for heterogeneous multicore architectures.
 *
 * Copyright (C) 2011-2014,2016-2017 Inria
 * Copyright (C) 2012,2014,2017,2018 CNRS
 * Copyright (C) 2017 Universidade Federal do Rio Grande do Sul (UFRGS)
 * Copyright (C) 2010-2018 Université de Bordeaux
 *
 * StarPU is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation; either version 2.1 of the License, or (at
 * your option) any later version.
 *
 * StarPU is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 *
 * See the GNU Lesser General Public License in COPYING.LGPL for more details.
 */
- #include "starpu_fxt.h"
- #include <common/config.h>
- #ifdef STARPU_HAVE_POTI
- #include <poti.h>
- #endif
- #ifdef STARPU_USE_FXT
- #ifdef STARPU_HAVE_POTI
- #ifdef HAVE_POTI_INIT_CUSTOM
- int _starpu_poti_extendedSetState = -1;
- int _starpu_poti_semiExtendedSetState = -1;
- int _starpu_poti_MemoryEvent = -1;
- #endif
- #endif
- void _starpu_fxt_write_paje_header(FILE *file STARPU_ATTRIBUTE_UNUSED, struct starpu_fxt_options *options)
- {
- unsigned i;
- #ifdef STARPU_HAVE_POTI
- #ifdef HAVE_POTI_INIT_CUSTOM
- poti_header(); /* see poti_init_custom to customize the header */
- _starpu_poti_extendedSetState = poti_header_DeclareEvent (PAJE_SetState,
- 11,
- "Size string",
- "Params string",
- "Footprint string",
- "Tag string",
- "JobId string",
- "SubmitOrder string",
- "GFlop string",
- "X string",
- "Y string",
- /* "Z string", */
- "Iteration string",
- "Subiteration string");
- _starpu_poti_semiExtendedSetState = poti_header_DeclareEvent (PAJE_SetState,
- 6,
- "Size string",
- "Params string",
- "Footprint string",
- "Tag string",
- "JobId string",
- "SubmitOrder string"
- );
- #ifdef HAVE_POTI_USER_NEWEVENT
- if (options->memory_states)
- {
- _starpu_poti_MemoryEvent = poti_header_DeclareEvent (PAJE_NewEvent,
- 4,
- "Handle string",
- "Info string",
- "Size string",
- "Dest string");
- }
- #endif
- #else
- poti_header(1,1);
- #endif
- #else
- fprintf(file, "%%EventDef PajeDefineContainerType 1\n");
- fprintf(file, "%% Alias string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeDefineEventType 2\n");
- fprintf(file, "%% Alias string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeDefineStateType 3\n");
- fprintf(file, "%% Alias string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeDefineVariableType 4\n");
- fprintf(file, "%% Alias string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeDefineLinkType 5\n");
- fprintf(file, "%% Alias string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% StartContainerType string\n");
- fprintf(file, "%% EndContainerType string\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeDefineEntityValue 6\n");
- fprintf(file, "%% Alias string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%% Color color\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeCreateContainer 7\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Alias string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeDestroyContainer 8\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Name string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeNewEvent 9\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeSetState 10\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajePushState 11\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajePopState 12\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeSetVariable 13\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Value double\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeAddVariable 14\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Value double\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeSubVariable 15\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Value double\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeStartLink 18\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%% StartContainer string\n");
- fprintf(file, "%% Key string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeEndLink 19\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%% EndContainer string\n");
- fprintf(file, "%% Key string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeSetState 20\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%% Size string\n");
- fprintf(file, "%% Params string\n");
- fprintf(file, "%% Footprint string\n");
- fprintf(file, "%% Tag string\n");
- fprintf(file, "%% JobId string\n");
- fprintf(file, "%% SubmitOrder string\n");
- fprintf(file, "%% GFlop string\n");
- fprintf(file, "%% X string\n");
- fprintf(file, "%% Y string\n");
- /* fprintf(file, "%% Z string\n"); */
- fprintf(file, "%% Iteration string\n");
- fprintf(file, "%% Subiteration string\n");
- fprintf(file, "%%EndEventDef\n");
- fprintf(file, "%%EventDef PajeSetState 21\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%% Size string\n");
- fprintf(file, "%% Params string\n");
- fprintf(file, "%% Footprint string\n");
- fprintf(file, "%% Tag string\n");
- fprintf(file, "%% JobId string\n");
- fprintf(file, "%% SubmitOrder string\n");
- fprintf(file, "%%EndEventDef\n");
- if (options->memory_states)
- {
- fprintf(file, "%%EventDef PajeNewEvent 22\n");
- fprintf(file, "%% Time date\n");
- fprintf(file, "%% Type string\n");
- fprintf(file, "%% Container string\n");
- fprintf(file, "%% Value string\n");
- fprintf(file, "%% Handle string\n");
- fprintf(file, "%% Info string\n");
- fprintf(file, "%% Size string\n");
- fprintf(file, "%% Tid string\n");
- fprintf(file, "%%EndEventDef\n");
- }
- #endif
- #ifdef STARPU_HAVE_POTI
- poti_DefineContainerType("MPIP", "0", "MPI Program");
- poti_DefineContainerType("P", "MPIP", "Program");
- poti_DefineContainerType("Mn", "P", "Memory Node");
- poti_DefineContainerType("T", "Mn", "Thread");
- poti_DefineContainerType("UT", "P", "User Thread");
- poti_DefineContainerType("Mm", "Mn", "Memory Manager");
- poti_DefineContainerType("W", "T", "Worker");
- poti_DefineContainerType("MPICt", "P", "MPI Communication Thread");
- poti_DefineContainerType("Sc", "P", "Scheduler");
- poti_DefineEventType("prog_event", "P", "program event type");
- poti_DefineEventType("register", "P", "data registration");
- poti_DefineEventType("unregister", "P", "data unregistration");
- /* Types for the memory node */
- poti_DefineEventType("SI", "Mm", "data state invalid");
- poti_DefineEventType("SS", "Mm", "data state shared");
- poti_DefineEventType("SO", "Mm", "data state owner");
- poti_DefineEventType("WU", "Mm", "data wont use");
- poti_DefineEventType("Al", "Mm", "Allocating Start");
- poti_DefineEventType("AlE", "Mm", "Allocating End");
- poti_DefineEventType("Alr", "Mm", "Allocating Async Start");
- poti_DefineEventType("AlrE", "Mm", "Allocating Async End");
- poti_DefineEventType("Fe", "Mm", "Free Start");
- poti_DefineEventType("FeE", "Mm", "Free End");
- poti_DefineEventType("Wb", "Mm", "WritingBack Start");
- poti_DefineEventType("WbE", "Mm", "WritingBack End");
- poti_DefineEventType("DCo", "Mm", "DriverCopy Start");
- poti_DefineEventType("DCoE", "Mm", "DriverCopy End");
- poti_DefineEventType("DCoA", "Mm", "DriverCopyAsync Start");
- poti_DefineEventType("DCoAE", "Mm", "DriverCopyAsync End");
- poti_DefineVariableType("use", "Mm", "Used (MB)", "0 0 0");
- poti_DefineVariableType("bwi_mm", "Mm", "Bandwidth In (MB/s)", "0 0 0");
- poti_DefineVariableType("bwo_mm", "Mm", "Bandwidth Out (MB/s)", "0 0 0");
- poti_DefineStateType("MS", "Mm", "Memory Node State");
- poti_DefineEntityValue("A", "MS", "Allocating", ".4 .1 .0");
- poti_DefineEntityValue("Ar", "MS", "AllocatingReuse", ".1 .1 .8");
- poti_DefineEntityValue("F", "MS", "Freeing", ".6 .3 .0");
- poti_DefineEntityValue("W", "MS", "WritingBack", ".0 .0 .5");
- poti_DefineEntityValue("Wa", "MS", "WritingBackAsync", ".0 .0 .4");
- poti_DefineEntityValue("R", "MS", "Reclaiming", ".0 .1 .6");
- poti_DefineEntityValue("Co", "MS", "DriverCopy", ".3 .5 .1");
- poti_DefineEntityValue("CoA", "MS", "DriverCopyAsync", ".1 .3 .1");
- poti_DefineEntityValue("No", "MS", "Nothing", ".0 .0 .0");
- /* Types for the Worker of the Memory Node */
- poti_DefineEventType("user_event", "P", "user event type");
- poti_DefineEventType("thread_event", "T", "thread event type");
- poti_DefineVariableType("gf", "W", "GFlops", "0 0 0");
- poti_DefineStateType("S", "T", "Thread State");
- poti_DefineEntityValue("I", "S", "Idle", ".9 .1 0");
- poti_DefineEntityValue("In", "S", "Initializing", "0.0 .7 1.0");
- poti_DefineEntityValue("D", "S", "Deinitializing", "0.0 .1 .7");
- poti_DefineEntityValue("Fi", "S", "FetchingInput", "1.0 .1 1.0");
- poti_DefineEntityValue("Po", "S", "PushingOutput", "0.1 1.0 1.0");
- poti_DefineEntityValue("C", "S", "Callback", ".0 .3 .8");
- poti_DefineEntityValue("B", "S", "Overhead", ".5 .18 .0");
- poti_DefineEntityValue("E", "S", "Executing", ".0 .6 .5");
- poti_DefineEntityValue("Sc", "S", "Scheduling", ".7 .36 .0");
- poti_DefineEntityValue("Sl", "S", "Sleeping", ".9 .1 .0");
- poti_DefineEntityValue("P", "S", "Progressing", ".1 .3 .1");
- poti_DefineEntityValue("U", "S", "Unpartitioning", ".0 .0 1.0");
- poti_DefineEntityValue("H", "S", "Hypervisor", ".5 .18 .0");
- poti_DefineEntityValue("Bu", "S", "Building task", ".5 .18 .0");
- poti_DefineEntityValue("Su", "S", "Submitting task", ".3 .09 .0");
- poti_DefineEntityValue("Th", "S", "Throttling task submission", ".8 .6 .6");
- poti_DefineEntityValue("MD", "S", "Decoding task for MPI", ".5 .18 .2");
- poti_DefineEntityValue("MPr", "S", "Preparing task for MPI", ".4 .14 .2");
- poti_DefineEntityValue("MPo", "S", "Post-processing task for MPI", ".3 .09 .2");
- poti_DefineStateType("WS", "W", "Worker State");
- poti_DefineEntityValue("I", "WS", "Idle", ".9 .1 .0");
- poti_DefineEntityValue("In", "WS", "Initializing", "0.0 .7 1.0");
- poti_DefineEntityValue("D", "WS", "Deinitializing", "0.0 .1 .7");
- poti_DefineEntityValue("Fi", "WS", "FetchingInput", "1.0 .1 1.0");
- poti_DefineEntityValue("Po", "WS", "PushingOutput", "0.1 1.0 1.0");
- poti_DefineEntityValue("C", "WS", "Callback", ".0 .3 .8");
- poti_DefineEntityValue("B", "WS", "Overhead", ".5 .18 .0");
- poti_DefineEntityValue("E", "WS", "Executing", ".0 .6 .5");
- poti_DefineEntityValue("Sc", "WS", "Scheduling", ".7 .36 .0");
- poti_DefineEntityValue("Sl", "WS", "Sleeping", ".9 .1 .0");
- poti_DefineEntityValue("P", "WS", "Progressing", ".1 .3 .1");
- poti_DefineEntityValue("U", "WS", "Unpartitioning", ".0 .0 1.0");
- poti_DefineEntityValue("H", "WS", "Hypervisor", ".5 .18 .0");
- poti_DefineEntityValue("Bu", "WS", "Building task", ".5 .18 .0");
- poti_DefineEntityValue("Su", "WS", "Submitting task", ".3 .09 .0");
- poti_DefineEntityValue("Th", "WS", "Throttling task submission", ".8 .6 .6");
- /* Types for the MPI Communication Thread of the Memory Node */
- poti_DefineEventType("MPIev", "MPICt", "MPI event type");
- poti_DefineVariableType("bwi_mpi", "MPICt", "Bandwidth In (MB/s)", "0 0 0");
- poti_DefineVariableType("bwo_mpi", "MPICt", "Bandwidth Out (MB/s)", "0 0 0");
- poti_DefineStateType("CtS", "MPICt", "Communication Thread State");
- poti_DefineEntityValue("P", "CtS", "Processing", "0 0 0");
- poti_DefineEntityValue("Pl", "CtS", "Polling", "1.0 .5 0");
- poti_DefineEntityValue("Dr", "CtS", "DriverRun", ".1 .1 1.0");
- poti_DefineEntityValue("Sl", "CtS", "Sleeping", ".9 .1 .0");
- poti_DefineEntityValue("UT", "CtS", "UserTesting", ".2 .1 .6");
- poti_DefineEntityValue("UW", "CtS", "UserWaiting", ".4 .1 .3");
- poti_DefineEntityValue("SdS", "CtS", "SendSubmitted", "1.0 .1 1.0");
- poti_DefineEntityValue("RvS", "CtS", "ReceiveSubmitted", "0.1 1.0 1.0");
- poti_DefineEntityValue("SdC", "CtS", "SendCompleted", "1.0 .5 1.0");
- poti_DefineEntityValue("RvC", "CtS", "ReceiveCompleted", "0.5 1.0 1.0");
- poti_DefineEntityValue("TD", "CtS", "Testing Detached", ".0 .0 .6");
- poti_DefineEntityValue("MT", "CtS", "MPI Test", ".0 .0 .8");
- poti_DefineEntityValue("Bu", "CtS", "Building task", ".5 .18 .0");
- poti_DefineEntityValue("Su", "CtS", "Submitting task", ".3 .09 .0");
- poti_DefineEntityValue("Th", "CtS", "Throttling task submission", ".8 .6 .6");
- poti_DefineEntityValue("C", "CtS", "Callback", ".0 .3 .8");
- /* Type for other threads */
- poti_DefineEventType("user_user_event", "UT", "user event type");
- poti_DefineEventType("user_thread_event", "UT", "thread event type");
- poti_DefineStateType("US", "UT", "User Thread State");
- poti_DefineEntityValue("Bu", "US", "Building task", ".5 .18 .0");
- poti_DefineEntityValue("Su", "US", "Submitting task", ".3 .09 .0");
- poti_DefineEntityValue("C", "US", "Callback", ".0 .3 .8");
- poti_DefineEntityValue("Th", "US", "Throttling task submission", ".8 .6 .6");
- poti_DefineEntityValue("MD", "US", "Decoding task for MPI", ".5 .18 .2");
- poti_DefineEntityValue("MPr", "US", "Preparing task for MPI", ".4 .14 .2");
- poti_DefineEntityValue("MPo", "US", "Post-processing task for MPI", ".3 .09 .2");
- poti_DefineEntityValue("W", "US", "Waiting task", ".9 .1 .0");
- poti_DefineEntityValue("WA", "US", "Waiting all tasks", ".9 .1 .0");
- poti_DefineEntityValue("No", "US", "Nothing", ".0 .0 .0");
- for (i=1; i<STARPU_NMAX_SCHED_CTXS; i++)
- {
- char inctx[10];
- snprintf(inctx, sizeof(inctx), "InCtx%u", i);
- char *ctx = inctx+2;
- poti_DefineStateType(ctx, "W", inctx);
- poti_DefineEntityValue("I", ctx, "Idle", ".9 .1 .0");
- poti_DefineEntityValue("In", ctx, "Initializing", "0.0 .7 1.0");
- poti_DefineEntityValue("D", ctx, "Deinitializing", "0.0 .1 .7");
- poti_DefineEntityValue("Fi", ctx, "FetchingInput", "1.0 .1 1.0");
- poti_DefineEntityValue("Po", ctx, "PushingOutput", "0.1 1.0 1.0");
- poti_DefineEntityValue("C", ctx, "Callback", ".0 .3 .8");
- poti_DefineEntityValue("B", ctx, "Overhead", ".5 .18 .0");
- poti_DefineEntityValue("E", ctx, "Executing", ".0 .6 .5");
- poti_DefineEntityValue("Sc", ctx, "Scheduling", ".7 .36 .0");
- poti_DefineEntityValue("Sl", ctx, "Sleeping", ".9 .1 .0");
- poti_DefineEntityValue("P", ctx, "Progressing", ".1 .3 .1");
- poti_DefineEntityValue("U", ctx, "Unpartitioning", ".0 .0 1.0");
- poti_DefineEntityValue("H", ctx, "Hypervisor", ".5 .18 .0");
- }
- /* Types for the Scheduler */
- poti_DefineVariableType("nsubmitted", "Sc", "Number of Submitted Uncompleted Tasks", "0 0 0");
- poti_DefineVariableType("nready", "Sc", "Number of Ready Tasks", "0 0 0");
- poti_DefineVariableType("gft", "Sc", "Total GFlops", "0 0 0");
- /* Link types */
- poti_DefineLinkType("MPIL", "MPIP", "MPICt", "MPICt", "MPI communication");
- poti_DefineLinkType("F", "P", "Mm", "Mm", "Intra-node data Fetch");
- poti_DefineLinkType("PF", "P", "Mm", "Mm", "Intra-node data PreFetch");
- poti_DefineLinkType("IF", "P", "Mm", "Mm", "Intra-node data IdleFetch");
- poti_DefineLinkType("WSL", "P", "W", "W", "Work steal");
- /* Creating the MPI Program */
- poti_CreateContainer(0, "MPIroot", "MPIP", "0", "root");
- #else
- fprintf(file, " \n\
- 1 MPIP 0 \"MPI Program\" \n\
- 1 P MPIP \"Program\" \n\
- 1 Mn P \"Memory Node\" \n\
- 1 T Mn \"Thread\" \n\
- 1 UT P \"User Thread\" \n\
- 1 Mm Mn \"Memory Manager\" \n\
- 1 W T \"Worker\" \n\
- 1 MPICt P \"MPI Communication Thread\" \n\
- 1 Sc P \"Scheduler State\" \n\
- 2 prog_event P \"program event type\" \n\
- 2 register P \"data registration\" \n\
- 2 unregister P \"data unregistration\" \n\
- 2 user_event P \"user event type\" \n\
- 2 thread_event T \"thread event type\" \n\
- 2 user_user_event UT \"user event type\" \n\
- 2 user_thread_event UT \"thread event type\" \n\
- 2 MPIev MPICt \"MPI event type\" \n\
- 3 S T \"Thread State\" \n\
- 3 CtS MPICt \"Communication Thread State\" \n");
- for (i=1; i<STARPU_NMAX_SCHED_CTXS; i++)
- fprintf(file, "3 Ctx%u W \"InCtx%u\" \n", i, i);
- fprintf(file, "\
- 2 SI Mm \"data state invalid\" \n\
- 2 SS Mm \"data state shared\" \n\
- 2 SO Mm \"data state owner\" \n\
- 2 WU Mm \"data wont use\" \n\
- 2 Al Mm \"Allocating Start\" \n\
- 2 AlE Mm \"Allocating End\" \n\
- 2 Alr Mm \"Allocating Async Start\" \n\
- 2 AlrE Mm \"Allocating Async End\" \n\
- 2 Fe Mm \"Free Start\" \n\
- 2 FeE Mm \"Free End\" \n\
- 2 Wb Mm \"WritingBack Start\" \n\
- 2 WbE Mm \"WritingBack End\" \n\
- 2 DCo Mm \"DriverCopy Start\" \n\
- 2 DCoE Mm \"DriverCopy End\" \n\
- 2 DCoA Mm \"DriverCopyAsync Start\" \n\
- 2 DCoAE Mm \"DriverCopyAsync End\" \n\
- 3 MS Mm \"Memory Node State\" \n\
- 4 nsubmitted Sc \"Number of Submitted Uncompleted Tasks\" \n\
- 4 nready Sc \"Number of Ready Tasks\" \n\
- 4 gft Sc \"Total GFlops\" \n\
- 4 use Mm \"Used (MB)\" \n\
- 4 bwi_mm Mm \"Bandwidth In (MB/s)\" \n\
- 4 bwo_mm Mm \"Bandwidth Out (MB/s)\" \n\
- 4 bwi_mpi MPICt \"Bandwidth In (MB/s)\" \n\
- 4 bwo_mpi MPICt \"Bandwidth Out (MB/s)\" \n\
- 4 gf W \"GFlops\" \n\
- 6 I S Idle \".9 .1 .0\" \n\
- 6 In S Initializing \"0.0 .7 1.0\" \n\
- 6 D S Deinitializing \"0.0 .1 .7\" \n\
- 6 Fi S FetchingInput \"1.0 .1 1.0\" \n\
- 6 Po S PushingOutput \"0.1 1.0 1.0\" \n\
- 6 C S Callback \".0 .3 .8\" \n\
- 6 B S Overhead \".5 .18 .0\" \n\
- 6 E S Executing \".0 .6 .5\" \n\
- 6 Sc S Scheduling \".7 .36 .0\" \n\
- 6 Sl S Sleeping \".9 .1 .0\" \n\
- 6 P S Progressing \".1 .3 .1\" \n\
- 6 U S Unpartitioning \".0 .0 1.0\" \n\
- 6 H S Hypervisor \".5 .18 .0\" \n\
- 6 Bu S \"Building task\" \".5 .18 .0\" \n\
- 6 Su S \"Submitting task\" \".3 .09 .0\" \n\
- 6 Th S \"Throttling task submission\" \".8 .6 .6\" \n\
- 6 MD S \"Decoding task for MPI\" \".5 .18 .2\" \n\
- 6 MPr S \"Preparing task for MPI\" \".4 .14 .2\" \n\
- 6 MPo S \"Post-processing task for MPI\" \".3 .09 .2\" \n\
- 3 WS W \"Worker State\" \n\
- 6 I WS Idle \".9 .1 .0\" \n\
- 6 In WS Initializing \"0.0 .7 1.0\" \n\
- 6 D WS Deinitializing \"0.0 .1 .7\" \n\
- 6 Fi WS FetchingInput \"1.0 .1 1.0\" \n\
- 6 Po WS PushingOutput \"0.1 1.0 1.0\" \n\
- 6 C WS Callback \".0 .3 .8\" \n\
- 6 B WS Overhead \".5 .18 .0\" \n\
- 6 E WS Executing \".0 .6 .5\" \n\
- 6 Sc WS Scheduling \".7 .36 .0\" \n\
- 6 Sl WS Sleeping \".9 .1 .0\" \n\
- 6 P WS Progressing \".1 .3 .1\" \n\
- 6 U WS Unpartitioning \".0 .0 1.0\" \n\
- 6 H WS Hypervisor \".5 .18 .0\" \n\
- 6 Bu WS \"Building task\" \".5 .18 .0\" \n\
- 6 Su WS \"Submitting task\" \".3 .09 .0\" \n\
- 6 Th WS \"Throttling task submission\" \".8 .6 .6\" \n\
- 3 US UT \"User Thread State\" \n\
- 6 Bu US \"Building task\" \".5 .18 .0\" \n\
- 6 Su US \"Submitting task\" \".3 .09 .0\" \n\
- 6 C US \"Callback\" \".0 .3 .8\" \n\
- 6 Th US \"Throttling task submission\" \".8 .6 .6\" \n\
- 6 MD US \"Decoding task for MPI\" \".5 .18 .2\" \n\
- 6 MPr US \"Preparing task for MPI\" \".4 .14 .2\" \n\
- 6 MPo US \"Post-processing task for MPI\" \".3 .09 .2\" \n\
- 6 W US \"Waiting task\" \".9 .1 .0\" \n\
- 6 WA US \"Waiting all tasks\" \".9 .1 .0\" \n\
- 6 No US Nothing \".0 .0 .0\" \n\
- ");
- fprintf(file, "\
- 6 P CtS Processing \"0 0 0\" \n\
- 6 Pl CtS Polling \"1.0 .5 0\" \n\
- 6 Dr CtS DriverRun \".1 .1 1.0\" \n\
- 6 Sl CtS Sleeping \".9 .1 .0\" \n\
- 6 UT CtS UserTesting \".2 .1 .6\" \n\
- 6 UW CtS UserWaiting \".4 .1 .3\" \n\
- 6 SdS CtS SendSubmitted \"1.0 .1 1.0\" \n\
- 6 RvS CtS ReceiveSubmitted \"0.1 1.0 1.0\" \n\
- 6 SdC CtS SendCompleted \"1.0 .5 1.0\" \n\
- 6 RvC CtS ReceiveCompleted \"0.5 1.0 1.0\" \n\
- 6 TD CtS \"Testing Detached\" \".0 .0 .6\" \n\
- 6 MT CtS \"MPI Test\" \".0 .0 .8\" \n\
- 6 Bu CtS \"Building task\" \".5 .18 .0\" \n\
- 6 Su CtS \"Submitting task\" \".3 .09 .0\" \n\
- 6 Th CtS \"Throttling task submission\" \".8 .6 .6\" \n\
- 6 C CtS \"Callback\" \".0 .3 .8\" \n\
- ");
- for (i=1; i<STARPU_NMAX_SCHED_CTXS; i++)
- fprintf(file, "\
- 6 I Ctx%u Idle \".9 .1 .0\" \n\
- 6 In Ctx%u Initializing \"0.0 .7 1.0\" \n\
- 6 D Ctx%u Deinitializing \"0.0 .1 .7\" \n\
- 6 Fi Ctx%u FetchingInput \"1.0 .1 1.0\" \n\
- 6 Po Ctx%u PushingOutput \"0.1 1.0 1.0\" \n\
- 6 C Ctx%u Callback \".0 .3 .8\" \n\
- 6 B Ctx%u Overhead \".5 .18 .0\" \n\
- 6 E Ctx%u Executing \".0 .6 .5\" \n\
- 6 Sc Ctx%u Scheduling \".7 .36 .0\" \n\
- 6 Sl Ctx%u Sleeping \".9 .1 .0\" \n\
- 6 P Ctx%u Progressing \".1 .3 .1\" \n\
- 6 U Ctx%u Unpartitioning \".0 .0 1.0\" \n\
- 6 H Ctx%u Hypervisor \".5 .18 .0\" \n",
- i, i, i, i, i, i, i, i, i, i, i, i, i);
- fprintf(file, "\
- 6 A MS Allocating \".4 .1 .0\" \n\
- 6 Ar MS AllocatingReuse \".1 .1 .8\" \n\
- 6 F MS Freeing \".6 .3 .0\" \n\
- 6 W MS WritingBack \".0 .0 .5\" \n\
- 6 Wa MS WritingBackAsync \".0 .0 .4\" \n\
- 6 R MS Reclaiming \".0 .1 .6\" \n\
- 6 Co MS DriverCopy \".3 .5 .1\" \n\
- 6 CoA MS DriverCopyAsync \".1 .3 .1\" \n\
- 6 No MS Nothing \".0 .0 .0\" \n\
- 5 MPIL MPIP MPICt MPICt \"MPI communication\"\n\
- 5 F P Mm Mm \"Intra-node data Fetch\"\n\
- 5 PF P Mm Mm \"Intra-node data PreFetch\"\n\
- 5 IF P Mm Mm \"Intra-node data IdleFetch\"\n\
- 5 WSL P W W \"Work steal\"\n");
- fprintf(file, "7 0.0 MPIroot MPIP 0 root\n");
- #endif
- }
- #endif
|