Skip to content

Instantly share code, notes, and snippets.

Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save zbeekman/522f25d5eb5409871062ee6a2895a55a to your computer and use it in GitHub Desktop.
Save zbeekman/522f25d5eb5409871062ee6a2895a55a to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"To use the parser, we import it an then call the parse function on a directory containing profile.x.y.z files.\n",
"Note that the parser does not currently have any native support for MULTI_ directories, so if you have\n",
"those you'll have to call parse multiple times and then, if you wish, merge the resulting dataframes."
]
},
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"from tau_profile_parser import TauProfileParser"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"profile = TauProfileParser.parse('.')"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"The metric field contains the metric that values in this profile represent"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"b'TIME'"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"profile.metric"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"The metadata field contains the metadata as a Python dictionary."
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"{'Metric Name': 'TIME',\n",
" 'CPU Cores': '14',\n",
" 'CPU MHz': '1652.218',\n",
" 'CPU Type': 'Intel(R) Xeon(R) CPU E5-2690 v4 @ 2.60GHz',\n",
" 'CPU Vendor': 'GenuineIntel',\n",
" 'CWD': '/gpfs/projects/paratools/nchaimov/x-gups-shmem',\n",
" 'Cache Size': '35840 KB',\n",
" 'Command Line': './gups',\n",
" 'Ending Timestamp': '1527459525908470',\n",
" 'Executable': '/gpfs/projects/paratools/nchaimov/x-gups-shmem/gups',\n",
" 'Hostname': 'n005',\n",
" 'Local Time': '2018-05-27T15:18:39-07:00',\n",
" 'Memory Size': '131916412 kB',\n",
" 'Node Name': 'n005',\n",
" 'OS Machine': 'x86_64',\n",
" 'OS Name': 'Linux',\n",
" 'OS Release': '3.10.0-693.17.1.el7.x86_64',\n",
" 'OS Version': '#1 SMP Sun Jan 14 10:36:03 EST 2018',\n",
" 'Starting Timestamp': '1527459519414157',\n",
" 'TAU Architecture': 'default',\n",
" 'TAU Config': ' -bfd=download -unwind=download -pdt=/usr/local/packages/pdt/3.25 -otf=download -iowrapper -shmem -tag=openmpi-meminst',\n",
" 'TAU Makefile': '/usr/local/packages/tau/2.27.1/x86_64/lib/Makefile.tau-openmpi-meminst-shmem-pdt',\n",
" 'TAU Version': '2.27.1-git',\n",
" 'TAU_BFD_LOOKUP': 'on',\n",
" 'TAU_CALLPATH': 'off',\n",
" 'TAU_CALLPATH_DEPTH': '2',\n",
" 'TAU_CALLSITE_DEPTH': '1',\n",
" 'TAU_COMM_MATRIX': 'off',\n",
" 'TAU_COMPENSATE': 'off',\n",
" 'TAU_CUDA_BINARY_EXE': None,\n",
" 'TAU_CUPTI_API': 'runtime',\n",
" 'TAU_EBS_KEEP_UNRESOLVED_ADDR': 'off',\n",
" 'TAU_IBM_BG_HWP_COUNTERS': 'off',\n",
" 'TAU_MAX_THREADS': '1',\n",
" 'TAU_MEASURE_TAU': 'off',\n",
" 'TAU_MEMDBG_PROTECT_ABOVE': 'off',\n",
" 'TAU_MEMDBG_PROTECT_BELOW': 'off',\n",
" 'TAU_MEMDBG_PROTECT_FREE': 'off',\n",
" 'TAU_OPENMP_RUNTIME': 'on',\n",
" 'TAU_OPENMP_RUNTIME_EVENTS': 'on',\n",
" 'TAU_OPENMP_RUNTIME_STATES': 'off',\n",
" 'TAU_OUTPUT_CUDA_CSV': 'off',\n",
" 'TAU_PAPI_MULTIPLEXING': 'off',\n",
" 'TAU_PROFILE': 'on',\n",
" 'TAU_PROFILE_FORMAT': 'profile',\n",
" 'TAU_REGION_ADDRESSES': 'off',\n",
" 'TAU_SAMPLING': 'off',\n",
" 'TAU_SHOW_MEMORY_FUNCTIONS': 'off',\n",
" 'TAU_SIGNALS_GDB': 'off',\n",
" 'TAU_THROTTLE': 'on',\n",
" 'TAU_THROTTLE_NUMCALLS': '100000',\n",
" 'TAU_THROTTLE_PERCALL': '10',\n",
" 'TAU_TRACE': 'off',\n",
" 'TAU_TRACE_FORMAT': 'tau',\n",
" 'TAU_TRACK_CUDA_CDP': 'off',\n",
" 'TAU_TRACK_CUDA_INSTRUCTIONS': None,\n",
" 'TAU_TRACK_CUDA_SASS': 'off',\n",
" 'TAU_TRACK_HEADROOM': 'off',\n",
" 'TAU_TRACK_HEAP': 'off',\n",
" 'TAU_TRACK_IO_PARAMS': 'off',\n",
" 'TAU_TRACK_MEMORY_FOOTPRINT': 'off',\n",
" 'TAU_TRACK_MEMORY_LEAKS': 'off',\n",
" 'TAU_TRACK_MESSAGE': 'off',\n",
" 'TAU_TRACK_SIGNALS': 'off',\n",
" 'TAU_TRACK_UNIFIED_MEMORY': 'off',\n",
" 'Timestamp': '1527459519414278',\n",
" 'UTC Time': '2018-05-27T22:18:39Z',\n",
" 'pid': '71186',\n",
" 'tid': '71186',\n",
" 'username': 'nchaimov'}"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"profile.metadata"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"The indices field contains the list of (node, context, thread) values present."
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"[(0, 0, 0),\n",
" (1, 0, 0),\n",
" (2, 0, 0),\n",
" (3, 0, 0),\n",
" (4, 0, 0),\n",
" (5, 0, 0),\n",
" (6, 0, 0),\n",
" (7, 0, 0),\n",
" (8, 0, 0),\n",
" (9, 0, 0),\n",
" (10, 0, 0),\n",
" (11, 0, 0),\n",
" (12, 0, 0),\n",
" (13, 0, 0),\n",
" (14, 0, 0),\n",
" (15, 0, 0),\n",
" (16, 0, 0),\n",
" (17, 0, 0),\n",
" (18, 0, 0),\n",
" (19, 0, 0),\n",
" (20, 0, 0),\n",
" (21, 0, 0),\n",
" (22, 0, 0),\n",
" (23, 0, 0),\n",
" (24, 0, 0),\n",
" (25, 0, 0),\n",
" (26, 0, 0),\n",
" (27, 0, 0),\n",
" (28, 0, 0),\n",
" (29, 0, 0),\n",
" (30, 0, 0),\n",
" (31, 0, 0),\n",
" (32, 0, 0),\n",
" (33, 0, 0),\n",
" (34, 0, 0),\n",
" (35, 0, 0),\n",
" (36, 0, 0),\n",
" (37, 0, 0),\n",
" (38, 0, 0),\n",
" (39, 0, 0),\n",
" (40, 0, 0),\n",
" (41, 0, 0),\n",
" (42, 0, 0),\n",
" (43, 0, 0),\n",
" (44, 0, 0),\n",
" (45, 0, 0),\n",
" (46, 0, 0),\n",
" (47, 0, 0),\n",
" (48, 0, 0),\n",
" (49, 0, 0),\n",
" (50, 0, 0),\n",
" (51, 0, 0),\n",
" (52, 0, 0),\n",
" (53, 0, 0),\n",
" (54, 0, 0),\n",
" (55, 0, 0),\n",
" (56, 0, 0),\n",
" (57, 0, 0),\n",
" (58, 0, 0),\n",
" (59, 0, 0),\n",
" (60, 0, 0),\n",
" (61, 0, 0),\n",
" (62, 0, 0),\n",
" (63, 0, 0)]"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"profile.indices"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"The atomic_data() function returns a Pandas dataframe containing the atomic events (user and context events). This is a multi-index dataframe with Node, Context, Thread, and Timer as the indices."
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th>Count</th>\n",
" <th>Maximum</th>\n",
" <th>Minimum</th>\n",
" <th>Mean</th>\n",
" <th>SumSq</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Node</th>\n",
" <th>Context</th>\n",
" <th>Thread</th>\n",
" <th>Timer</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th rowspan=\"30\" valign=\"top\">0</th>\n",
" <th rowspan=\"30\" valign=\"top\">0</th>\n",
" <th rowspan=\"30\" valign=\"top\">0</th>\n",
" <th>alloc opal_thread_t</th>\n",
" <td>1</td>\n",
" <td>40</td>\n",
" <td>40</td>\n",
" <td>40.000000</td>\n",
" <td>1600</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_base_component_list_item_t</th>\n",
" <td>90</td>\n",
" <td>48</td>\n",
" <td>48</td>\n",
" <td>48.000000</td>\n",
" <td>207360</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_base_var_group_t</th>\n",
" <td>194</td>\n",
" <td>280</td>\n",
" <td>280</td>\n",
" <td>280.000000</td>\n",
" <td>15209600</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_base_var_t</th>\n",
" <td>945</td>\n",
" <td>168</td>\n",
" <td>168</td>\n",
" <td>168.000000</td>\n",
" <td>26671680</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_base_var_enum_t</th>\n",
" <td>19</td>\n",
" <td>88</td>\n",
" <td>88</td>\n",
" <td>88.000000</td>\n",
" <td>147136</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_dss_type_info_t</th>\n",
" <td>46</td>\n",
" <td>80</td>\n",
" <td>80</td>\n",
" <td>80.000000</td>\n",
" <td>294400</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_list_t</th>\n",
" <td>70</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>286720</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_base_component_repository_item_t</th>\n",
" <td>119</td>\n",
" <td>176</td>\n",
" <td>176</td>\n",
" <td>176.000000</td>\n",
" <td>3686144</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_if_t</th>\n",
" <td>3</td>\n",
" <td>224</td>\n",
" <td>224</td>\n",
" <td>224.000000</td>\n",
" <td>150528</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_schizo_base_active_module_t</th>\n",
" <td>2</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>8192</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_progress_tracker_t</th>\n",
" <td>1</td>\n",
" <td>256</td>\n",
" <td>256</td>\n",
" <td>256.000000</td>\n",
" <td>65536</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_pmix_proc_data_t</th>\n",
" <td>65</td>\n",
" <td>112</td>\n",
" <td>112</td>\n",
" <td>112.000000</td>\n",
" <td>815360</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_hash_table_t</th>\n",
" <td>6</td>\n",
" <td>72</td>\n",
" <td>72</td>\n",
" <td>72.000000</td>\n",
" <td>31104</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_value_t</th>\n",
" <td>1585</td>\n",
" <td>136</td>\n",
" <td>136</td>\n",
" <td>136.000000</td>\n",
" <td>29316160</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_state_t</th>\n",
" <td>2</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>8192</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_routed_base_active_t</th>\n",
" <td>4</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>16384</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_oob_ud_device_t</th>\n",
" <td>1</td>\n",
" <td>496</td>\n",
" <td>496</td>\n",
" <td>496.000000</td>\n",
" <td>246016</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_oob_ud_port_t</th>\n",
" <td>1</td>\n",
" <td>912</td>\n",
" <td>912</td>\n",
" <td>912.000000</td>\n",
" <td>831744</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_rml_pathway_t</th>\n",
" <td>1</td>\n",
" <td>176</td>\n",
" <td>176</td>\n",
" <td>176.000000</td>\n",
" <td>30976</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_attribute_t</th>\n",
" <td>5</td>\n",
" <td>112</td>\n",
" <td>112</td>\n",
" <td>112.000000</td>\n",
" <td>62720</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_rml_base_active_t</th>\n",
" <td>1</td>\n",
" <td>56</td>\n",
" <td>56</td>\n",
" <td>56.000000</td>\n",
" <td>3136</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_rml_posted_recv_t</th>\n",
" <td>4</td>\n",
" <td>80</td>\n",
" <td>80</td>\n",
" <td>80.000000</td>\n",
" <td>25600</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_rml_posted_recv_t &lt;= orte_rml_recv_request_t</th>\n",
" <td>4</td>\n",
" <td>80</td>\n",
" <td>80</td>\n",
" <td>80.000000</td>\n",
" <td>25600</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_rml_recv_request_t</th>\n",
" <td>4</td>\n",
" <td>168</td>\n",
" <td>168</td>\n",
" <td>168.000000</td>\n",
" <td>112896</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_grpcomm_base_active_t</th>\n",
" <td>1</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>4096</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_hwloc_topo_data_t</th>\n",
" <td>1</td>\n",
" <td>96</td>\n",
" <td>96</td>\n",
" <td>96.000000</td>\n",
" <td>9216</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_datatype_t</th>\n",
" <td>23</td>\n",
" <td>288</td>\n",
" <td>288</td>\n",
" <td>288.000000</td>\n",
" <td>1907712</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_convertor_t</th>\n",
" <td>2</td>\n",
" <td>248</td>\n",
" <td>248</td>\n",
" <td>248.000000</td>\n",
" <td>123008</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_proc_t</th>\n",
" <td>64</td>\n",
" <td>112</td>\n",
" <td>112</td>\n",
" <td>112.000000</td>\n",
" <td>802816</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_pointer_array_t</th>\n",
" <td>2</td>\n",
" <td>112</td>\n",
" <td>112</td>\n",
" <td>112.000000</td>\n",
" <td>25088</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <th>...</th>\n",
" <th>...</th>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th rowspan=\"30\" valign=\"top\">63</th>\n",
" <th rowspan=\"30\" valign=\"top\">0</th>\n",
" <th rowspan=\"30\" valign=\"top\">0</th>\n",
" <th>alloc orte_namelist_t</th>\n",
" <td>129</td>\n",
" <td>48</td>\n",
" <td>48</td>\n",
" <td>48.000000</td>\n",
" <td>297216</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc orte_namelist_t &lt;= oshmem_group_t</th>\n",
" <td>129</td>\n",
" <td>48</td>\n",
" <td>48</td>\n",
" <td>48.000000</td>\n",
" <td>297216</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_list_t &lt;= oshmem_group_t</th>\n",
" <td>4</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>16384</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_scoll_mpi_module_t</th>\n",
" <td>3</td>\n",
" <td>160</td>\n",
" <td>160</td>\n",
" <td>160.000000</td>\n",
" <td>76800</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_scoll_mpi_module_t &lt;= oshmem_group_t</th>\n",
" <td>2</td>\n",
" <td>160</td>\n",
" <td>160</td>\n",
" <td>160.000000</td>\n",
" <td>51200</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc avail_com_t</th>\n",
" <td>10</td>\n",
" <td>56</td>\n",
" <td>56</td>\n",
" <td>56.000000</td>\n",
" <td>31360</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc avail_com_t &lt;= oshmem_group_t</th>\n",
" <td>5</td>\n",
" <td>56</td>\n",
" <td>56</td>\n",
" <td>56.000000</td>\n",
" <td>15680</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_scoll_basic_module_t</th>\n",
" <td>5</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>20480</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_scoll_basic_module_t &lt;= oshmem_group_t</th>\n",
" <td>3</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>12288</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_atomic_mxm_module_t</th>\n",
" <td>1</td>\n",
" <td>32</td>\n",
" <td>32</td>\n",
" <td>32.000000</td>\n",
" <td>1024</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_atomic_basic_module_t</th>\n",
" <td>1</td>\n",
" <td>32</td>\n",
" <td>32</td>\n",
" <td>32.000000</td>\n",
" <td>1024</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_proc_t ** &lt;= ompi_group_t</th>\n",
" <td>1</td>\n",
" <td>512</td>\n",
" <td>512</td>\n",
" <td>512.000000</td>\n",
" <td>262144</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_comm_allreduce_context_t</th>\n",
" <td>6</td>\n",
" <td>80</td>\n",
" <td>80</td>\n",
" <td>80.000000</td>\n",
" <td>38400</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_buffer_t</th>\n",
" <td>1</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>4096</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_proc_t ** &lt;= oshmem_group_t &lt;= ompi_group_t</th>\n",
" <td>1</td>\n",
" <td>512</td>\n",
" <td>512</td>\n",
" <td>512.000000</td>\n",
" <td>262144</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_group_t &lt;= oshmem_group_t</th>\n",
" <td>1</td>\n",
" <td>72</td>\n",
" <td>72</td>\n",
" <td>72.000000</td>\n",
" <td>5184</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_communicator_t &lt;= oshmem_group_t</th>\n",
" <td>1</td>\n",
" <td>264</td>\n",
" <td>264</td>\n",
" <td>264.000000</td>\n",
" <td>69696</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc opal_hash_table_t &lt;= oshmem_group_t</th>\n",
" <td>1</td>\n",
" <td>72</td>\n",
" <td>72</td>\n",
" <td>72.000000</td>\n",
" <td>5184</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc attribute_value_t &lt;= oshmem_group_t</th>\n",
" <td>7</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>28672</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_comm_cid_context_t &lt;= oshmem_group_t</th>\n",
" <td>2</td>\n",
" <td>120</td>\n",
" <td>120</td>\n",
" <td>120.000000</td>\n",
" <td>28800</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_comm_request_item_t &lt;= oshmem_group_t</th>\n",
" <td>13</td>\n",
" <td>72</td>\n",
" <td>72</td>\n",
" <td>72.000000</td>\n",
" <td>67392</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_comm_allreduce_context_t &lt;= oshmem_group_t</th>\n",
" <td>3</td>\n",
" <td>80</td>\n",
" <td>80</td>\n",
" <td>80.000000</td>\n",
" <td>19200</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc ompi_coll_libnbc_module_t &lt;= oshmem_group_t</th>\n",
" <td>1</td>\n",
" <td>480</td>\n",
" <td>480</td>\n",
" <td>480.000000</td>\n",
" <td>230400</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc avail_coll_t &lt;= oshmem_group_t</th>\n",
" <td>3</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>12288</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_coll_tuned_module_t &lt;= oshmem_group_t</th>\n",
" <td>1</td>\n",
" <td>1024</td>\n",
" <td>1024</td>\n",
" <td>1024.000000</td>\n",
" <td>1048576</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_coll_basic_module_t &lt;= oshmem_group_t</th>\n",
" <td>1</td>\n",
" <td>408</td>\n",
" <td>408</td>\n",
" <td>408.000000</td>\n",
" <td>166464</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc mca_coll_base_comm_t &lt;= oshmem_group_t</th>\n",
" <td>2</td>\n",
" <td>136</td>\n",
" <td>136</td>\n",
" <td>136.000000</td>\n",
" <td>36992</td>\n",
" </tr>\n",
" <tr>\n",
" <th>alloc oshmem_group_cache_t</th>\n",
" <td>1</td>\n",
" <td>64</td>\n",
" <td>64</td>\n",
" <td>64.000000</td>\n",
" <td>4096</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Message size received from all nodes</th>\n",
" <td>65536</td>\n",
" <td>8</td>\n",
" <td>8</td>\n",
" <td>8.000000</td>\n",
" <td>4194304</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Message size sent to all nodes</th>\n",
" <td>131712</td>\n",
" <td>8208</td>\n",
" <td>8</td>\n",
" <td>47.844509</td>\n",
" <td>43125997568</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>6272 rows × 5 columns</p>\n",
"</div>"
],
"text/plain": [
" Count \\\n",
"Node Context Thread Timer \n",
"0 0 0 alloc opal_thread_t 1 \n",
" alloc mca_base_component_list_item_t 90 \n",
" alloc mca_base_var_group_t 194 \n",
" alloc mca_base_var_t 945 \n",
" alloc mca_base_var_enum_t 19 \n",
" alloc opal_dss_type_info_t 46 \n",
" alloc opal_list_t 70 \n",
" alloc mca_base_component_repository_item_t 119 \n",
" alloc opal_if_t 3 \n",
" alloc orte_schizo_base_active_module_t 2 \n",
" alloc opal_progress_tracker_t 1 \n",
" alloc opal_pmix_proc_data_t 65 \n",
" alloc opal_hash_table_t 6 \n",
" alloc opal_value_t 1585 \n",
" alloc orte_state_t 2 \n",
" alloc orte_routed_base_active_t 4 \n",
" alloc mca_oob_ud_device_t 1 \n",
" alloc mca_oob_ud_port_t 1 \n",
" alloc orte_rml_pathway_t 1 \n",
" alloc orte_attribute_t 5 \n",
" alloc orte_rml_base_active_t 1 \n",
" alloc orte_rml_posted_recv_t 4 \n",
" alloc orte_rml_posted_recv_t <= orte_rml_recv_r... 4 \n",
" alloc orte_rml_recv_request_t 4 \n",
" alloc orte_grpcomm_base_active_t 1 \n",
" alloc opal_hwloc_topo_data_t 1 \n",
" alloc ompi_datatype_t 23 \n",
" alloc opal_convertor_t 2 \n",
" alloc ompi_proc_t 64 \n",
" alloc opal_pointer_array_t 2 \n",
"... ... \n",
"63 0 0 alloc orte_namelist_t 129 \n",
" alloc orte_namelist_t <= oshmem_group_t 129 \n",
" alloc opal_list_t <= oshmem_group_t 4 \n",
" alloc mca_scoll_mpi_module_t 3 \n",
" alloc mca_scoll_mpi_module_t <= oshmem_group_t 2 \n",
" alloc avail_com_t 10 \n",
" alloc avail_com_t <= oshmem_group_t 5 \n",
" alloc mca_scoll_basic_module_t 5 \n",
" alloc mca_scoll_basic_module_t <= oshmem_group_t 3 \n",
" alloc mca_atomic_mxm_module_t 1 \n",
" alloc mca_atomic_basic_module_t 1 \n",
" alloc ompi_proc_t ** <= ompi_group_t 1 \n",
" alloc ompi_comm_allreduce_context_t 6 \n",
" alloc opal_buffer_t 1 \n",
" alloc ompi_proc_t ** <= oshmem_group_t <= ompi_... 1 \n",
" alloc ompi_group_t <= oshmem_group_t 1 \n",
" alloc ompi_communicator_t <= oshmem_group_t 1 \n",
" alloc opal_hash_table_t <= oshmem_group_t 1 \n",
" alloc attribute_value_t <= oshmem_group_t 7 \n",
" alloc ompi_comm_cid_context_t <= oshmem_group_t 2 \n",
" alloc ompi_comm_request_item_t <= oshmem_group_t 13 \n",
" alloc ompi_comm_allreduce_context_t <= oshmem_g... 3 \n",
" alloc ompi_coll_libnbc_module_t <= oshmem_group_t 1 \n",
" alloc avail_coll_t <= oshmem_group_t 3 \n",
" alloc mca_coll_tuned_module_t <= oshmem_group_t 1 \n",
" alloc mca_coll_basic_module_t <= oshmem_group_t 1 \n",
" alloc mca_coll_base_comm_t <= oshmem_group_t 2 \n",
" alloc oshmem_group_cache_t 1 \n",
" Message size received from all nodes 65536 \n",
" Message size sent to all nodes 131712 \n",
"\n",
" Maximum \\\n",
"Node Context Thread Timer \n",
"0 0 0 alloc opal_thread_t 40 \n",
" alloc mca_base_component_list_item_t 48 \n",
" alloc mca_base_var_group_t 280 \n",
" alloc mca_base_var_t 168 \n",
" alloc mca_base_var_enum_t 88 \n",
" alloc opal_dss_type_info_t 80 \n",
" alloc opal_list_t 64 \n",
" alloc mca_base_component_repository_item_t 176 \n",
" alloc opal_if_t 224 \n",
" alloc orte_schizo_base_active_module_t 64 \n",
" alloc opal_progress_tracker_t 256 \n",
" alloc opal_pmix_proc_data_t 112 \n",
" alloc opal_hash_table_t 72 \n",
" alloc opal_value_t 136 \n",
" alloc orte_state_t 64 \n",
" alloc orte_routed_base_active_t 64 \n",
" alloc mca_oob_ud_device_t 496 \n",
" alloc mca_oob_ud_port_t 912 \n",
" alloc orte_rml_pathway_t 176 \n",
" alloc orte_attribute_t 112 \n",
" alloc orte_rml_base_active_t 56 \n",
" alloc orte_rml_posted_recv_t 80 \n",
" alloc orte_rml_posted_recv_t <= orte_rml_recv_r... 80 \n",
" alloc orte_rml_recv_request_t 168 \n",
" alloc orte_grpcomm_base_active_t 64 \n",
" alloc opal_hwloc_topo_data_t 96 \n",
" alloc ompi_datatype_t 288 \n",
" alloc opal_convertor_t 248 \n",
" alloc ompi_proc_t 112 \n",
" alloc opal_pointer_array_t 112 \n",
"... ... \n",
"63 0 0 alloc orte_namelist_t 48 \n",
" alloc orte_namelist_t <= oshmem_group_t 48 \n",
" alloc opal_list_t <= oshmem_group_t 64 \n",
" alloc mca_scoll_mpi_module_t 160 \n",
" alloc mca_scoll_mpi_module_t <= oshmem_group_t 160 \n",
" alloc avail_com_t 56 \n",
" alloc avail_com_t <= oshmem_group_t 56 \n",
" alloc mca_scoll_basic_module_t 64 \n",
" alloc mca_scoll_basic_module_t <= oshmem_group_t 64 \n",
" alloc mca_atomic_mxm_module_t 32 \n",
" alloc mca_atomic_basic_module_t 32 \n",
" alloc ompi_proc_t ** <= ompi_group_t 512 \n",
" alloc ompi_comm_allreduce_context_t 80 \n",
" alloc opal_buffer_t 64 \n",
" alloc ompi_proc_t ** <= oshmem_group_t <= ompi_... 512 \n",
" alloc ompi_group_t <= oshmem_group_t 72 \n",
" alloc ompi_communicator_t <= oshmem_group_t 264 \n",
" alloc opal_hash_table_t <= oshmem_group_t 72 \n",
" alloc attribute_value_t <= oshmem_group_t 64 \n",
" alloc ompi_comm_cid_context_t <= oshmem_group_t 120 \n",
" alloc ompi_comm_request_item_t <= oshmem_group_t 72 \n",
" alloc ompi_comm_allreduce_context_t <= oshmem_g... 80 \n",
" alloc ompi_coll_libnbc_module_t <= oshmem_group_t 480 \n",
" alloc avail_coll_t <= oshmem_group_t 64 \n",
" alloc mca_coll_tuned_module_t <= oshmem_group_t 1024 \n",
" alloc mca_coll_basic_module_t <= oshmem_group_t 408 \n",
" alloc mca_coll_base_comm_t <= oshmem_group_t 136 \n",
" alloc oshmem_group_cache_t 64 \n",
" Message size received from all nodes 8 \n",
" Message size sent to all nodes 8208 \n",
"\n",
" Minimum \\\n",
"Node Context Thread Timer \n",
"0 0 0 alloc opal_thread_t 40 \n",
" alloc mca_base_component_list_item_t 48 \n",
" alloc mca_base_var_group_t 280 \n",
" alloc mca_base_var_t 168 \n",
" alloc mca_base_var_enum_t 88 \n",
" alloc opal_dss_type_info_t 80 \n",
" alloc opal_list_t 64 \n",
" alloc mca_base_component_repository_item_t 176 \n",
" alloc opal_if_t 224 \n",
" alloc orte_schizo_base_active_module_t 64 \n",
" alloc opal_progress_tracker_t 256 \n",
" alloc opal_pmix_proc_data_t 112 \n",
" alloc opal_hash_table_t 72 \n",
" alloc opal_value_t 136 \n",
" alloc orte_state_t 64 \n",
" alloc orte_routed_base_active_t 64 \n",
" alloc mca_oob_ud_device_t 496 \n",
" alloc mca_oob_ud_port_t 912 \n",
" alloc orte_rml_pathway_t 176 \n",
" alloc orte_attribute_t 112 \n",
" alloc orte_rml_base_active_t 56 \n",
" alloc orte_rml_posted_recv_t 80 \n",
" alloc orte_rml_posted_recv_t <= orte_rml_recv_r... 80 \n",
" alloc orte_rml_recv_request_t 168 \n",
" alloc orte_grpcomm_base_active_t 64 \n",
" alloc opal_hwloc_topo_data_t 96 \n",
" alloc ompi_datatype_t 288 \n",
" alloc opal_convertor_t 248 \n",
" alloc ompi_proc_t 112 \n",
" alloc opal_pointer_array_t 112 \n",
"... ... \n",
"63 0 0 alloc orte_namelist_t 48 \n",
" alloc orte_namelist_t <= oshmem_group_t 48 \n",
" alloc opal_list_t <= oshmem_group_t 64 \n",
" alloc mca_scoll_mpi_module_t 160 \n",
" alloc mca_scoll_mpi_module_t <= oshmem_group_t 160 \n",
" alloc avail_com_t 56 \n",
" alloc avail_com_t <= oshmem_group_t 56 \n",
" alloc mca_scoll_basic_module_t 64 \n",
" alloc mca_scoll_basic_module_t <= oshmem_group_t 64 \n",
" alloc mca_atomic_mxm_module_t 32 \n",
" alloc mca_atomic_basic_module_t 32 \n",
" alloc ompi_proc_t ** <= ompi_group_t 512 \n",
" alloc ompi_comm_allreduce_context_t 80 \n",
" alloc opal_buffer_t 64 \n",
" alloc ompi_proc_t ** <= oshmem_group_t <= ompi_... 512 \n",
" alloc ompi_group_t <= oshmem_group_t 72 \n",
" alloc ompi_communicator_t <= oshmem_group_t 264 \n",
" alloc opal_hash_table_t <= oshmem_group_t 72 \n",
" alloc attribute_value_t <= oshmem_group_t 64 \n",
" alloc ompi_comm_cid_context_t <= oshmem_group_t 120 \n",
" alloc ompi_comm_request_item_t <= oshmem_group_t 72 \n",
" alloc ompi_comm_allreduce_context_t <= oshmem_g... 80 \n",
" alloc ompi_coll_libnbc_module_t <= oshmem_group_t 480 \n",
" alloc avail_coll_t <= oshmem_group_t 64 \n",
" alloc mca_coll_tuned_module_t <= oshmem_group_t 1024 \n",
" alloc mca_coll_basic_module_t <= oshmem_group_t 408 \n",
" alloc mca_coll_base_comm_t <= oshmem_group_t 136 \n",
" alloc oshmem_group_cache_t 64 \n",
" Message size received from all nodes 8 \n",
" Message size sent to all nodes 8 \n",
"\n",
" Mean \\\n",
"Node Context Thread Timer \n",
"0 0 0 alloc opal_thread_t 40.000000 \n",
" alloc mca_base_component_list_item_t 48.000000 \n",
" alloc mca_base_var_group_t 280.000000 \n",
" alloc mca_base_var_t 168.000000 \n",
" alloc mca_base_var_enum_t 88.000000 \n",
" alloc opal_dss_type_info_t 80.000000 \n",
" alloc opal_list_t 64.000000 \n",
" alloc mca_base_component_repository_item_t 176.000000 \n",
" alloc opal_if_t 224.000000 \n",
" alloc orte_schizo_base_active_module_t 64.000000 \n",
" alloc opal_progress_tracker_t 256.000000 \n",
" alloc opal_pmix_proc_data_t 112.000000 \n",
" alloc opal_hash_table_t 72.000000 \n",
" alloc opal_value_t 136.000000 \n",
" alloc orte_state_t 64.000000 \n",
" alloc orte_routed_base_active_t 64.000000 \n",
" alloc mca_oob_ud_device_t 496.000000 \n",
" alloc mca_oob_ud_port_t 912.000000 \n",
" alloc orte_rml_pathway_t 176.000000 \n",
" alloc orte_attribute_t 112.000000 \n",
" alloc orte_rml_base_active_t 56.000000 \n",
" alloc orte_rml_posted_recv_t 80.000000 \n",
" alloc orte_rml_posted_recv_t <= orte_rml_recv_r... 80.000000 \n",
" alloc orte_rml_recv_request_t 168.000000 \n",
" alloc orte_grpcomm_base_active_t 64.000000 \n",
" alloc opal_hwloc_topo_data_t 96.000000 \n",
" alloc ompi_datatype_t 288.000000 \n",
" alloc opal_convertor_t 248.000000 \n",
" alloc ompi_proc_t 112.000000 \n",
" alloc opal_pointer_array_t 112.000000 \n",
"... ... \n",
"63 0 0 alloc orte_namelist_t 48.000000 \n",
" alloc orte_namelist_t <= oshmem_group_t 48.000000 \n",
" alloc opal_list_t <= oshmem_group_t 64.000000 \n",
" alloc mca_scoll_mpi_module_t 160.000000 \n",
" alloc mca_scoll_mpi_module_t <= oshmem_group_t 160.000000 \n",
" alloc avail_com_t 56.000000 \n",
" alloc avail_com_t <= oshmem_group_t 56.000000 \n",
" alloc mca_scoll_basic_module_t 64.000000 \n",
" alloc mca_scoll_basic_module_t <= oshmem_group_t 64.000000 \n",
" alloc mca_atomic_mxm_module_t 32.000000 \n",
" alloc mca_atomic_basic_module_t 32.000000 \n",
" alloc ompi_proc_t ** <= ompi_group_t 512.000000 \n",
" alloc ompi_comm_allreduce_context_t 80.000000 \n",
" alloc opal_buffer_t 64.000000 \n",
" alloc ompi_proc_t ** <= oshmem_group_t <= ompi_... 512.000000 \n",
" alloc ompi_group_t <= oshmem_group_t 72.000000 \n",
" alloc ompi_communicator_t <= oshmem_group_t 264.000000 \n",
" alloc opal_hash_table_t <= oshmem_group_t 72.000000 \n",
" alloc attribute_value_t <= oshmem_group_t 64.000000 \n",
" alloc ompi_comm_cid_context_t <= oshmem_group_t 120.000000 \n",
" alloc ompi_comm_request_item_t <= oshmem_group_t 72.000000 \n",
" alloc ompi_comm_allreduce_context_t <= oshmem_g... 80.000000 \n",
" alloc ompi_coll_libnbc_module_t <= oshmem_group_t 480.000000 \n",
" alloc avail_coll_t <= oshmem_group_t 64.000000 \n",
" alloc mca_coll_tuned_module_t <= oshmem_group_t 1024.000000 \n",
" alloc mca_coll_basic_module_t <= oshmem_group_t 408.000000 \n",
" alloc mca_coll_base_comm_t <= oshmem_group_t 136.000000 \n",
" alloc oshmem_group_cache_t 64.000000 \n",
" Message size received from all nodes 8.000000 \n",
" Message size sent to all nodes 47.844509 \n",
"\n",
" SumSq \n",
"Node Context Thread Timer \n",
"0 0 0 alloc opal_thread_t 1600 \n",
" alloc mca_base_component_list_item_t 207360 \n",
" alloc mca_base_var_group_t 15209600 \n",
" alloc mca_base_var_t 26671680 \n",
" alloc mca_base_var_enum_t 147136 \n",
" alloc opal_dss_type_info_t 294400 \n",
" alloc opal_list_t 286720 \n",
" alloc mca_base_component_repository_item_t 3686144 \n",
" alloc opal_if_t 150528 \n",
" alloc orte_schizo_base_active_module_t 8192 \n",
" alloc opal_progress_tracker_t 65536 \n",
" alloc opal_pmix_proc_data_t 815360 \n",
" alloc opal_hash_table_t 31104 \n",
" alloc opal_value_t 29316160 \n",
" alloc orte_state_t 8192 \n",
" alloc orte_routed_base_active_t 16384 \n",
" alloc mca_oob_ud_device_t 246016 \n",
" alloc mca_oob_ud_port_t 831744 \n",
" alloc orte_rml_pathway_t 30976 \n",
" alloc orte_attribute_t 62720 \n",
" alloc orte_rml_base_active_t 3136 \n",
" alloc orte_rml_posted_recv_t 25600 \n",
" alloc orte_rml_posted_recv_t <= orte_rml_recv_r... 25600 \n",
" alloc orte_rml_recv_request_t 112896 \n",
" alloc orte_grpcomm_base_active_t 4096 \n",
" alloc opal_hwloc_topo_data_t 9216 \n",
" alloc ompi_datatype_t 1907712 \n",
" alloc opal_convertor_t 123008 \n",
" alloc ompi_proc_t 802816 \n",
" alloc opal_pointer_array_t 25088 \n",
"... ... \n",
"63 0 0 alloc orte_namelist_t 297216 \n",
" alloc orte_namelist_t <= oshmem_group_t 297216 \n",
" alloc opal_list_t <= oshmem_group_t 16384 \n",
" alloc mca_scoll_mpi_module_t 76800 \n",
" alloc mca_scoll_mpi_module_t <= oshmem_group_t 51200 \n",
" alloc avail_com_t 31360 \n",
" alloc avail_com_t <= oshmem_group_t 15680 \n",
" alloc mca_scoll_basic_module_t 20480 \n",
" alloc mca_scoll_basic_module_t <= oshmem_group_t 12288 \n",
" alloc mca_atomic_mxm_module_t 1024 \n",
" alloc mca_atomic_basic_module_t 1024 \n",
" alloc ompi_proc_t ** <= ompi_group_t 262144 \n",
" alloc ompi_comm_allreduce_context_t 38400 \n",
" alloc opal_buffer_t 4096 \n",
" alloc ompi_proc_t ** <= oshmem_group_t <= ompi_... 262144 \n",
" alloc ompi_group_t <= oshmem_group_t 5184 \n",
" alloc ompi_communicator_t <= oshmem_group_t 69696 \n",
" alloc opal_hash_table_t <= oshmem_group_t 5184 \n",
" alloc attribute_value_t <= oshmem_group_t 28672 \n",
" alloc ompi_comm_cid_context_t <= oshmem_group_t 28800 \n",
" alloc ompi_comm_request_item_t <= oshmem_group_t 67392 \n",
" alloc ompi_comm_allreduce_context_t <= oshmem_g... 19200 \n",
" alloc ompi_coll_libnbc_module_t <= oshmem_group_t 230400 \n",
" alloc avail_coll_t <= oshmem_group_t 12288 \n",
" alloc mca_coll_tuned_module_t <= oshmem_group_t 1048576 \n",
" alloc mca_coll_basic_module_t <= oshmem_group_t 166464 \n",
" alloc mca_coll_base_comm_t <= oshmem_group_t 36992 \n",
" alloc oshmem_group_cache_t 4096 \n",
" Message size received from all nodes 4194304 \n",
" Message size sent to all nodes 43125997568 \n",
"\n",
"[6272 rows x 5 columns]"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"profile.atomic_data()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"The interval_data() function returns the timer data. As with atomic_data(), it is returned as a multi-index Pandas dataframe with Node, Context, Thread, and Timer as the indices."
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th>Calls</th>\n",
" <th>Subcalls</th>\n",
" <th>Exclusive</th>\n",
" <th>Inclusive</th>\n",
" <th>ProfileCalls</th>\n",
" <th>Group</th>\n",
" <th>Timer Name</th>\n",
" <th>Timer Location</th>\n",
" <th>Timer Type</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Node</th>\n",
" <th>Context</th>\n",
" <th>Thread</th>\n",
" <th>Timer</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th>.TAU application</th>\n",
" <td>1</td>\n",
" <td>262834</td>\n",
" <td>54530</td>\n",
" <td>6493783</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>.TAU application</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_init(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>3974524</td>\n",
" <td>3974524</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_init(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_n_pes(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_n_pes(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_my_pe(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_my_pe(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_barrier_all(void) C</th>\n",
" <td>131107</td>\n",
" <td>0</td>\n",
" <td>2194807</td>\n",
" <td>2194807</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_barrier_all(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_int_sum_to_all(int *, const int *, int, int, int, int, int *, long *) C</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>3108</td>\n",
" <td>3108</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_int_sum_to_all(int *, const int *, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>long long shmem_longlong_fadd(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>222176</td>\n",
" <td>222176</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>long long shmem_longlong_fadd(long long *, lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_p(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>38757</td>\n",
" <td>38757</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_p(long long *, long long, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_broadcast64(void *, const void *, size_t, int, int, int, int, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>109</td>\n",
" <td>109</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_broadcast64(void *, const void *, s...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void *shmalloc(size_t) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void *shmalloc(size_t) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_put(long long *, const long long *, size_t, int) C</th>\n",
" <td>640</td>\n",
" <td>0</td>\n",
" <td>4576</td>\n",
" <td>4576</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_put(long long *, const lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shfree(void *) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>915</td>\n",
" <td>915</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shfree(void *) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_sum_to_all(long long *, const long long *, int, int, int, int, long long *, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>22</td>\n",
" <td>22</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_sum_to_all(long long *, co...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_finalize(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>239</td>\n",
" <td>239</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_finalize(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th rowspan=\"14\" valign=\"top\">1</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th>.TAU application</th>\n",
" <td>1</td>\n",
" <td>262834</td>\n",
" <td>55168</td>\n",
" <td>6450822</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>.TAU application</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_init(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>3931819</td>\n",
" <td>3931819</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_init(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_n_pes(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_n_pes(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_my_pe(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_my_pe(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_barrier_all(void) C</th>\n",
" <td>131107</td>\n",
" <td>0</td>\n",
" <td>2134030</td>\n",
" <td>2134030</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_barrier_all(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_int_sum_to_all(int *, const int *, int, int, int, int, int *, long *) C</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>3103</td>\n",
" <td>3103</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_int_sum_to_all(int *, const int *, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>long long shmem_longlong_fadd(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>278368</td>\n",
" <td>278368</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>long long shmem_longlong_fadd(long long *, lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_p(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>42489</td>\n",
" <td>42489</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_p(long long *, long long, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_broadcast64(void *, const void *, size_t, int, int, int, int, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>111</td>\n",
" <td>111</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_broadcast64(void *, const void *, s...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void *shmalloc(size_t) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>17</td>\n",
" <td>17</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void *shmalloc(size_t) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_put(long long *, const long long *, size_t, int) C</th>\n",
" <td>640</td>\n",
" <td>0</td>\n",
" <td>4744</td>\n",
" <td>4744</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_put(long long *, const lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shfree(void *) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>915</td>\n",
" <td>915</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shfree(void *) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_sum_to_all(long long *, const long long *, int, int, int, int, long long *, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_sum_to_all(long long *, co...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_finalize(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>35</td>\n",
" <td>35</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_finalize(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th rowspan=\"2\" valign=\"top\">2</th>\n",
" <th rowspan=\"2\" valign=\"top\">0</th>\n",
" <th rowspan=\"2\" valign=\"top\">0</th>\n",
" <th>.TAU application</th>\n",
" <td>1</td>\n",
" <td>262834</td>\n",
" <td>52874</td>\n",
" <td>6485231</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>.TAU application</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_init(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>3976504</td>\n",
" <td>3976504</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_init(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <th>...</th>\n",
" <th>...</th>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th rowspan=\"2\" valign=\"top\">61</th>\n",
" <th rowspan=\"2\" valign=\"top\">0</th>\n",
" <th rowspan=\"2\" valign=\"top\">0</th>\n",
" <th>void shmem_longlong_sum_to_all(long long *, const long long *, int, int, int, int, long long *, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>19</td>\n",
" <td>19</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_sum_to_all(long long *, co...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_finalize(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>1072</td>\n",
" <td>1072</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_finalize(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th rowspan=\"14\" valign=\"top\">62</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th>.TAU application</th>\n",
" <td>1</td>\n",
" <td>262834</td>\n",
" <td>63013</td>\n",
" <td>6243165</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>.TAU application</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_init(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>3724183</td>\n",
" <td>3724183</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_init(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_n_pes(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>3</td>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_n_pes(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_my_pe(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_my_pe(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_barrier_all(void) C</th>\n",
" <td>131107</td>\n",
" <td>0</td>\n",
" <td>2172075</td>\n",
" <td>2172075</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_barrier_all(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_int_sum_to_all(int *, const int *, int, int, int, int, int *, long *) C</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>2232</td>\n",
" <td>2232</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_int_sum_to_all(int *, const int *, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>long long shmem_longlong_fadd(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>224237</td>\n",
" <td>224237</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>long long shmem_longlong_fadd(long long *, lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_p(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>42345</td>\n",
" <td>42345</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_p(long long *, long long, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_broadcast64(void *, const void *, size_t, int, int, int, int, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>831</td>\n",
" <td>831</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_broadcast64(void *, const void *, s...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void *shmalloc(size_t) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>25</td>\n",
" <td>25</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void *shmalloc(size_t) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_put(long long *, const long long *, size_t, int) C</th>\n",
" <td>640</td>\n",
" <td>0</td>\n",
" <td>12446</td>\n",
" <td>12446</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_put(long long *, const lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shfree(void *) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>906</td>\n",
" <td>906</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shfree(void *) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_sum_to_all(long long *, const long long *, int, int, int, int, long long *, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>20</td>\n",
" <td>20</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_sum_to_all(long long *, co...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_finalize(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>849</td>\n",
" <td>849</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_finalize(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th rowspan=\"14\" valign=\"top\">63</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th rowspan=\"14\" valign=\"top\">0</th>\n",
" <th>.TAU application</th>\n",
" <td>1</td>\n",
" <td>262834</td>\n",
" <td>61511</td>\n",
" <td>6244331</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>.TAU application</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_init(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>3735137</td>\n",
" <td>3735137</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_init(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_n_pes(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_n_pes(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_my_pe(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_my_pe(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_barrier_all(void) C</th>\n",
" <td>131107</td>\n",
" <td>0</td>\n",
" <td>2162614</td>\n",
" <td>2162614</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_barrier_all(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_int_sum_to_all(int *, const int *, int, int, int, int, int *, long *) C</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>1733</td>\n",
" <td>1733</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_int_sum_to_all(int *, const int *, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>long long shmem_longlong_fadd(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>226262</td>\n",
" <td>226262</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>long long shmem_longlong_fadd(long long *, lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_p(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>43455</td>\n",
" <td>43455</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_p(long long *, long long, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_broadcast64(void *, const void *, size_t, int, int, int, int, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>605</td>\n",
" <td>605</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_broadcast64(void *, const void *, s...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void *shmalloc(size_t) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>25</td>\n",
" <td>25</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void *shmalloc(size_t) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_put(long long *, const long long *, size_t, int) C</th>\n",
" <td>640</td>\n",
" <td>0</td>\n",
" <td>11125</td>\n",
" <td>11125</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_put(long long *, const lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shfree(void *) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>906</td>\n",
" <td>906</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shfree(void *) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_sum_to_all(long long *, const long long *, int, int, int, int, long long *, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>26</td>\n",
" <td>26</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_sum_to_all(long long *, co...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_finalize(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>929</td>\n",
" <td>929</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_finalize(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>896 rows × 9 columns</p>\n",
"</div>"
],
"text/plain": [
" Calls \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application 1 \n",
" void shmem_init(void) C 1 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 2 \n",
" void shmem_barrier_all(void) C 131107 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3 \n",
" long long shmem_longlong_fadd(long long *, long... 65536 \n",
" void shmem_longlong_p(long long *, long long, i... 65536 \n",
" void shmem_broadcast64(void *, const void *, si... 1 \n",
" void *shmalloc(size_t) C 2 \n",
" void shmem_longlong_put(long long *, const long... 640 \n",
" void shfree(void *) C 2 \n",
" void shmem_longlong_sum_to_all(long long *, con... 1 \n",
" void shmem_finalize(void) C 1 \n",
"1 0 0 .TAU application 1 \n",
" void shmem_init(void) C 1 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 2 \n",
" void shmem_barrier_all(void) C 131107 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3 \n",
" long long shmem_longlong_fadd(long long *, long... 65536 \n",
" void shmem_longlong_p(long long *, long long, i... 65536 \n",
" void shmem_broadcast64(void *, const void *, si... 1 \n",
" void *shmalloc(size_t) C 2 \n",
" void shmem_longlong_put(long long *, const long... 640 \n",
" void shfree(void *) C 2 \n",
" void shmem_longlong_sum_to_all(long long *, con... 1 \n",
" void shmem_finalize(void) C 1 \n",
"2 0 0 .TAU application 1 \n",
" void shmem_init(void) C 1 \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... 1 \n",
" void shmem_finalize(void) C 1 \n",
"62 0 0 .TAU application 1 \n",
" void shmem_init(void) C 1 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 2 \n",
" void shmem_barrier_all(void) C 131107 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3 \n",
" long long shmem_longlong_fadd(long long *, long... 65536 \n",
" void shmem_longlong_p(long long *, long long, i... 65536 \n",
" void shmem_broadcast64(void *, const void *, si... 1 \n",
" void *shmalloc(size_t) C 2 \n",
" void shmem_longlong_put(long long *, const long... 640 \n",
" void shfree(void *) C 2 \n",
" void shmem_longlong_sum_to_all(long long *, con... 1 \n",
" void shmem_finalize(void) C 1 \n",
"63 0 0 .TAU application 1 \n",
" void shmem_init(void) C 1 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 2 \n",
" void shmem_barrier_all(void) C 131107 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3 \n",
" long long shmem_longlong_fadd(long long *, long... 65536 \n",
" void shmem_longlong_p(long long *, long long, i... 65536 \n",
" void shmem_broadcast64(void *, const void *, si... 1 \n",
" void *shmalloc(size_t) C 2 \n",
" void shmem_longlong_put(long long *, const long... 640 \n",
" void shfree(void *) C 2 \n",
" void shmem_longlong_sum_to_all(long long *, con... 1 \n",
" void shmem_finalize(void) C 1 \n",
"\n",
" Subcalls \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application 262834 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"1 0 0 .TAU application 262834 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"2 0 0 .TAU application 262834 \n",
" void shmem_init(void) C 0 \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"62 0 0 .TAU application 262834 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"63 0 0 .TAU application 262834 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"\n",
" Exclusive \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application 54530 \n",
" void shmem_init(void) C 3974524 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 2194807 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3108 \n",
" long long shmem_longlong_fadd(long long *, long... 222176 \n",
" void shmem_longlong_p(long long *, long long, i... 38757 \n",
" void shmem_broadcast64(void *, const void *, si... 109 \n",
" void *shmalloc(size_t) C 18 \n",
" void shmem_longlong_put(long long *, const long... 4576 \n",
" void shfree(void *) C 915 \n",
" void shmem_longlong_sum_to_all(long long *, con... 22 \n",
" void shmem_finalize(void) C 239 \n",
"1 0 0 .TAU application 55168 \n",
" void shmem_init(void) C 3931819 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 2 \n",
" void shmem_barrier_all(void) C 2134030 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3103 \n",
" long long shmem_longlong_fadd(long long *, long... 278368 \n",
" void shmem_longlong_p(long long *, long long, i... 42489 \n",
" void shmem_broadcast64(void *, const void *, si... 111 \n",
" void *shmalloc(size_t) C 17 \n",
" void shmem_longlong_put(long long *, const long... 4744 \n",
" void shfree(void *) C 915 \n",
" void shmem_longlong_sum_to_all(long long *, con... 19 \n",
" void shmem_finalize(void) C 35 \n",
"2 0 0 .TAU application 52874 \n",
" void shmem_init(void) C 3976504 \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... 19 \n",
" void shmem_finalize(void) C 1072 \n",
"62 0 0 .TAU application 63013 \n",
" void shmem_init(void) C 3724183 \n",
" int shmem_n_pes(void) C 3 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 2172075 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 2232 \n",
" long long shmem_longlong_fadd(long long *, long... 224237 \n",
" void shmem_longlong_p(long long *, long long, i... 42345 \n",
" void shmem_broadcast64(void *, const void *, si... 831 \n",
" void *shmalloc(size_t) C 25 \n",
" void shmem_longlong_put(long long *, const long... 12446 \n",
" void shfree(void *) C 906 \n",
" void shmem_longlong_sum_to_all(long long *, con... 20 \n",
" void shmem_finalize(void) C 849 \n",
"63 0 0 .TAU application 61511 \n",
" void shmem_init(void) C 3735137 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 1 \n",
" void shmem_barrier_all(void) C 2162614 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 1733 \n",
" long long shmem_longlong_fadd(long long *, long... 226262 \n",
" void shmem_longlong_p(long long *, long long, i... 43455 \n",
" void shmem_broadcast64(void *, const void *, si... 605 \n",
" void *shmalloc(size_t) C 25 \n",
" void shmem_longlong_put(long long *, const long... 11125 \n",
" void shfree(void *) C 906 \n",
" void shmem_longlong_sum_to_all(long long *, con... 26 \n",
" void shmem_finalize(void) C 929 \n",
"\n",
" Inclusive \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application 6493783 \n",
" void shmem_init(void) C 3974524 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 2194807 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3108 \n",
" long long shmem_longlong_fadd(long long *, long... 222176 \n",
" void shmem_longlong_p(long long *, long long, i... 38757 \n",
" void shmem_broadcast64(void *, const void *, si... 109 \n",
" void *shmalloc(size_t) C 18 \n",
" void shmem_longlong_put(long long *, const long... 4576 \n",
" void shfree(void *) C 915 \n",
" void shmem_longlong_sum_to_all(long long *, con... 22 \n",
" void shmem_finalize(void) C 239 \n",
"1 0 0 .TAU application 6450822 \n",
" void shmem_init(void) C 3931819 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 2 \n",
" void shmem_barrier_all(void) C 2134030 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 3103 \n",
" long long shmem_longlong_fadd(long long *, long... 278368 \n",
" void shmem_longlong_p(long long *, long long, i... 42489 \n",
" void shmem_broadcast64(void *, const void *, si... 111 \n",
" void *shmalloc(size_t) C 17 \n",
" void shmem_longlong_put(long long *, const long... 4744 \n",
" void shfree(void *) C 915 \n",
" void shmem_longlong_sum_to_all(long long *, con... 19 \n",
" void shmem_finalize(void) C 35 \n",
"2 0 0 .TAU application 6485231 \n",
" void shmem_init(void) C 3976504 \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... 19 \n",
" void shmem_finalize(void) C 1072 \n",
"62 0 0 .TAU application 6243165 \n",
" void shmem_init(void) C 3724183 \n",
" int shmem_n_pes(void) C 3 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 2172075 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 2232 \n",
" long long shmem_longlong_fadd(long long *, long... 224237 \n",
" void shmem_longlong_p(long long *, long long, i... 42345 \n",
" void shmem_broadcast64(void *, const void *, si... 831 \n",
" void *shmalloc(size_t) C 25 \n",
" void shmem_longlong_put(long long *, const long... 12446 \n",
" void shfree(void *) C 906 \n",
" void shmem_longlong_sum_to_all(long long *, con... 20 \n",
" void shmem_finalize(void) C 849 \n",
"63 0 0 .TAU application 6244331 \n",
" void shmem_init(void) C 3735137 \n",
" int shmem_n_pes(void) C 2 \n",
" int shmem_my_pe(void) C 1 \n",
" void shmem_barrier_all(void) C 2162614 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 1733 \n",
" long long shmem_longlong_fadd(long long *, long... 226262 \n",
" void shmem_longlong_p(long long *, long long, i... 43455 \n",
" void shmem_broadcast64(void *, const void *, si... 605 \n",
" void *shmalloc(size_t) C 25 \n",
" void shmem_longlong_put(long long *, const long... 11125 \n",
" void shfree(void *) C 906 \n",
" void shmem_longlong_sum_to_all(long long *, con... 26 \n",
" void shmem_finalize(void) C 929 \n",
"\n",
" ProfileCalls \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application 0 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"1 0 0 .TAU application 0 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"2 0 0 .TAU application 0 \n",
" void shmem_init(void) C 0 \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"62 0 0 .TAU application 0 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"63 0 0 .TAU application 0 \n",
" void shmem_init(void) C 0 \n",
" int shmem_n_pes(void) C 0 \n",
" int shmem_my_pe(void) C 0 \n",
" void shmem_barrier_all(void) C 0 \n",
" void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
" long long shmem_longlong_fadd(long long *, long... 0 \n",
" void shmem_longlong_p(long long *, long long, i... 0 \n",
" void shmem_broadcast64(void *, const void *, si... 0 \n",
" void *shmalloc(size_t) C 0 \n",
" void shmem_longlong_put(long long *, const long... 0 \n",
" void shfree(void *) C 0 \n",
" void shmem_longlong_sum_to_all(long long *, con... 0 \n",
" void shmem_finalize(void) C 0 \n",
"\n",
" Group \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application GROUP=\"TAU_USER\" \n",
" void shmem_init(void) C GROUP=\"TAU_USER\" \n",
" int shmem_n_pes(void) C GROUP=\"TAU_USER\" \n",
" int shmem_my_pe(void) C GROUP=\"TAU_USER\" \n",
" void shmem_barrier_all(void) C GROUP=\"TAU_USER\" \n",
" void shmem_int_sum_to_all(int *, const int *, i... GROUP=\"TAU_USER\" \n",
" long long shmem_longlong_fadd(long long *, long... GROUP=\"TAU_USER\" \n",
" void shmem_longlong_p(long long *, long long, i... GROUP=\"TAU_USER\" \n",
" void shmem_broadcast64(void *, const void *, si... GROUP=\"TAU_USER\" \n",
" void *shmalloc(size_t) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_put(long long *, const long... GROUP=\"TAU_USER\" \n",
" void shfree(void *) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_sum_to_all(long long *, con... GROUP=\"TAU_USER\" \n",
" void shmem_finalize(void) C GROUP=\"TAU_USER\" \n",
"1 0 0 .TAU application GROUP=\"TAU_USER\" \n",
" void shmem_init(void) C GROUP=\"TAU_USER\" \n",
" int shmem_n_pes(void) C GROUP=\"TAU_USER\" \n",
" int shmem_my_pe(void) C GROUP=\"TAU_USER\" \n",
" void shmem_barrier_all(void) C GROUP=\"TAU_USER\" \n",
" void shmem_int_sum_to_all(int *, const int *, i... GROUP=\"TAU_USER\" \n",
" long long shmem_longlong_fadd(long long *, long... GROUP=\"TAU_USER\" \n",
" void shmem_longlong_p(long long *, long long, i... GROUP=\"TAU_USER\" \n",
" void shmem_broadcast64(void *, const void *, si... GROUP=\"TAU_USER\" \n",
" void *shmalloc(size_t) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_put(long long *, const long... GROUP=\"TAU_USER\" \n",
" void shfree(void *) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_sum_to_all(long long *, con... GROUP=\"TAU_USER\" \n",
" void shmem_finalize(void) C GROUP=\"TAU_USER\" \n",
"2 0 0 .TAU application GROUP=\"TAU_USER\" \n",
" void shmem_init(void) C GROUP=\"TAU_USER\" \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... GROUP=\"TAU_USER\" \n",
" void shmem_finalize(void) C GROUP=\"TAU_USER\" \n",
"62 0 0 .TAU application GROUP=\"TAU_USER\" \n",
" void shmem_init(void) C GROUP=\"TAU_USER\" \n",
" int shmem_n_pes(void) C GROUP=\"TAU_USER\" \n",
" int shmem_my_pe(void) C GROUP=\"TAU_USER\" \n",
" void shmem_barrier_all(void) C GROUP=\"TAU_USER\" \n",
" void shmem_int_sum_to_all(int *, const int *, i... GROUP=\"TAU_USER\" \n",
" long long shmem_longlong_fadd(long long *, long... GROUP=\"TAU_USER\" \n",
" void shmem_longlong_p(long long *, long long, i... GROUP=\"TAU_USER\" \n",
" void shmem_broadcast64(void *, const void *, si... GROUP=\"TAU_USER\" \n",
" void *shmalloc(size_t) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_put(long long *, const long... GROUP=\"TAU_USER\" \n",
" void shfree(void *) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_sum_to_all(long long *, con... GROUP=\"TAU_USER\" \n",
" void shmem_finalize(void) C GROUP=\"TAU_USER\" \n",
"63 0 0 .TAU application GROUP=\"TAU_USER\" \n",
" void shmem_init(void) C GROUP=\"TAU_USER\" \n",
" int shmem_n_pes(void) C GROUP=\"TAU_USER\" \n",
" int shmem_my_pe(void) C GROUP=\"TAU_USER\" \n",
" void shmem_barrier_all(void) C GROUP=\"TAU_USER\" \n",
" void shmem_int_sum_to_all(int *, const int *, i... GROUP=\"TAU_USER\" \n",
" long long shmem_longlong_fadd(long long *, long... GROUP=\"TAU_USER\" \n",
" void shmem_longlong_p(long long *, long long, i... GROUP=\"TAU_USER\" \n",
" void shmem_broadcast64(void *, const void *, si... GROUP=\"TAU_USER\" \n",
" void *shmalloc(size_t) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_put(long long *, const long... GROUP=\"TAU_USER\" \n",
" void shfree(void *) C GROUP=\"TAU_USER\" \n",
" void shmem_longlong_sum_to_all(long long *, con... GROUP=\"TAU_USER\" \n",
" void shmem_finalize(void) C GROUP=\"TAU_USER\" \n",
"\n",
" Timer Name \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application .TAU application \n",
" void shmem_init(void) C void shmem_init(void) C \n",
" int shmem_n_pes(void) C int shmem_n_pes(void) C \n",
" int shmem_my_pe(void) C int shmem_my_pe(void) C \n",
" void shmem_barrier_all(void) C void shmem_barrier_all(void) C \n",
" void shmem_int_sum_to_all(int *, const int *, i... void shmem_int_sum_to_all(int *, const int *, ... \n",
" long long shmem_longlong_fadd(long long *, long... long long shmem_longlong_fadd(long long *, lon... \n",
" void shmem_longlong_p(long long *, long long, i... void shmem_longlong_p(long long *, long long, ... \n",
" void shmem_broadcast64(void *, const void *, si... void shmem_broadcast64(void *, const void *, s... \n",
" void *shmalloc(size_t) C void *shmalloc(size_t) C \n",
" void shmem_longlong_put(long long *, const long... void shmem_longlong_put(long long *, const lon... \n",
" void shfree(void *) C void shfree(void *) C \n",
" void shmem_longlong_sum_to_all(long long *, con... void shmem_longlong_sum_to_all(long long *, co... \n",
" void shmem_finalize(void) C void shmem_finalize(void) C \n",
"1 0 0 .TAU application .TAU application \n",
" void shmem_init(void) C void shmem_init(void) C \n",
" int shmem_n_pes(void) C int shmem_n_pes(void) C \n",
" int shmem_my_pe(void) C int shmem_my_pe(void) C \n",
" void shmem_barrier_all(void) C void shmem_barrier_all(void) C \n",
" void shmem_int_sum_to_all(int *, const int *, i... void shmem_int_sum_to_all(int *, const int *, ... \n",
" long long shmem_longlong_fadd(long long *, long... long long shmem_longlong_fadd(long long *, lon... \n",
" void shmem_longlong_p(long long *, long long, i... void shmem_longlong_p(long long *, long long, ... \n",
" void shmem_broadcast64(void *, const void *, si... void shmem_broadcast64(void *, const void *, s... \n",
" void *shmalloc(size_t) C void *shmalloc(size_t) C \n",
" void shmem_longlong_put(long long *, const long... void shmem_longlong_put(long long *, const lon... \n",
" void shfree(void *) C void shfree(void *) C \n",
" void shmem_longlong_sum_to_all(long long *, con... void shmem_longlong_sum_to_all(long long *, co... \n",
" void shmem_finalize(void) C void shmem_finalize(void) C \n",
"2 0 0 .TAU application .TAU application \n",
" void shmem_init(void) C void shmem_init(void) C \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... void shmem_longlong_sum_to_all(long long *, co... \n",
" void shmem_finalize(void) C void shmem_finalize(void) C \n",
"62 0 0 .TAU application .TAU application \n",
" void shmem_init(void) C void shmem_init(void) C \n",
" int shmem_n_pes(void) C int shmem_n_pes(void) C \n",
" int shmem_my_pe(void) C int shmem_my_pe(void) C \n",
" void shmem_barrier_all(void) C void shmem_barrier_all(void) C \n",
" void shmem_int_sum_to_all(int *, const int *, i... void shmem_int_sum_to_all(int *, const int *, ... \n",
" long long shmem_longlong_fadd(long long *, long... long long shmem_longlong_fadd(long long *, lon... \n",
" void shmem_longlong_p(long long *, long long, i... void shmem_longlong_p(long long *, long long, ... \n",
" void shmem_broadcast64(void *, const void *, si... void shmem_broadcast64(void *, const void *, s... \n",
" void *shmalloc(size_t) C void *shmalloc(size_t) C \n",
" void shmem_longlong_put(long long *, const long... void shmem_longlong_put(long long *, const lon... \n",
" void shfree(void *) C void shfree(void *) C \n",
" void shmem_longlong_sum_to_all(long long *, con... void shmem_longlong_sum_to_all(long long *, co... \n",
" void shmem_finalize(void) C void shmem_finalize(void) C \n",
"63 0 0 .TAU application .TAU application \n",
" void shmem_init(void) C void shmem_init(void) C \n",
" int shmem_n_pes(void) C int shmem_n_pes(void) C \n",
" int shmem_my_pe(void) C int shmem_my_pe(void) C \n",
" void shmem_barrier_all(void) C void shmem_barrier_all(void) C \n",
" void shmem_int_sum_to_all(int *, const int *, i... void shmem_int_sum_to_all(int *, const int *, ... \n",
" long long shmem_longlong_fadd(long long *, long... long long shmem_longlong_fadd(long long *, lon... \n",
" void shmem_longlong_p(long long *, long long, i... void shmem_longlong_p(long long *, long long, ... \n",
" void shmem_broadcast64(void *, const void *, si... void shmem_broadcast64(void *, const void *, s... \n",
" void *shmalloc(size_t) C void *shmalloc(size_t) C \n",
" void shmem_longlong_put(long long *, const long... void shmem_longlong_put(long long *, const lon... \n",
" void shfree(void *) C void shfree(void *) C \n",
" void shmem_longlong_sum_to_all(long long *, con... void shmem_longlong_sum_to_all(long long *, co... \n",
" void shmem_finalize(void) C void shmem_finalize(void) C \n",
"\n",
" Timer Location \\\n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"1 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"2 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"62 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"63 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"\n",
" Timer Type \n",
"Node Context Thread Timer \n",
"0 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"1 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"2 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
"... ... \n",
"61 0 0 void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"62 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"63 0 0 .TAU application None \n",
" void shmem_init(void) C None \n",
" int shmem_n_pes(void) C None \n",
" int shmem_my_pe(void) C None \n",
" void shmem_barrier_all(void) C None \n",
" void shmem_int_sum_to_all(int *, const int *, i... None \n",
" long long shmem_longlong_fadd(long long *, long... None \n",
" void shmem_longlong_p(long long *, long long, i... None \n",
" void shmem_broadcast64(void *, const void *, si... None \n",
" void *shmalloc(size_t) C None \n",
" void shmem_longlong_put(long long *, const long... None \n",
" void shfree(void *) C None \n",
" void shmem_longlong_sum_to_all(long long *, con... None \n",
" void shmem_finalize(void) C None \n",
"\n",
"[896 rows x 9 columns]"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"profile.interval_data()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"We can manipulate this DataFrame using ordinary pandas operations. For example, here are the timers for (node, context, thread) = (0, 0, 0), sorted by number of calls in descending order."
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Calls</th>\n",
" <th>Subcalls</th>\n",
" <th>Exclusive</th>\n",
" <th>Inclusive</th>\n",
" <th>ProfileCalls</th>\n",
" <th>Group</th>\n",
" <th>Timer Name</th>\n",
" <th>Timer Location</th>\n",
" <th>Timer Type</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Timer</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>void shmem_barrier_all(void) C</th>\n",
" <td>131107</td>\n",
" <td>0</td>\n",
" <td>2194807</td>\n",
" <td>2194807</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_barrier_all(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>long long shmem_longlong_fadd(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>222176</td>\n",
" <td>222176</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>long long shmem_longlong_fadd(long long *, lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_p(long long *, long long, int) C</th>\n",
" <td>65536</td>\n",
" <td>0</td>\n",
" <td>38757</td>\n",
" <td>38757</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_p(long long *, long long, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_put(long long *, const long long *, size_t, int) C</th>\n",
" <td>640</td>\n",
" <td>0</td>\n",
" <td>4576</td>\n",
" <td>4576</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_put(long long *, const lon...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_int_sum_to_all(int *, const int *, int, int, int, int, int *, long *) C</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" <td>3108</td>\n",
" <td>3108</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_int_sum_to_all(int *, const int *, ...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_n_pes(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_n_pes(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_my_pe(void) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>int shmem_my_pe(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void *shmalloc(size_t) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void *shmalloc(size_t) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shfree(void *) C</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>915</td>\n",
" <td>915</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shfree(void *) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>.TAU application</th>\n",
" <td>1</td>\n",
" <td>262834</td>\n",
" <td>54530</td>\n",
" <td>6493783</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>.TAU application</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_init(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>3974524</td>\n",
" <td>3974524</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_init(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_broadcast64(void *, const void *, size_t, int, int, int, int, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>109</td>\n",
" <td>109</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_broadcast64(void *, const void *, s...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_sum_to_all(long long *, const long long *, int, int, int, int, long long *, long *) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>22</td>\n",
" <td>22</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_longlong_sum_to_all(long long *, co...</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_finalize(void) C</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>239</td>\n",
" <td>239</td>\n",
" <td>0</td>\n",
" <td>GROUP=\"TAU_USER\"</td>\n",
" <td>void shmem_finalize(void) C</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Calls Subcalls \\\n",
"Timer \n",
"void shmem_barrier_all(void) C 131107 0 \n",
"long long shmem_longlong_fadd(long long *, long... 65536 0 \n",
"void shmem_longlong_p(long long *, long long, i... 65536 0 \n",
"void shmem_longlong_put(long long *, const long... 640 0 \n",
"void shmem_int_sum_to_all(int *, const int *, i... 3 0 \n",
"int shmem_n_pes(void) C 2 0 \n",
"int shmem_my_pe(void) C 2 0 \n",
"void *shmalloc(size_t) C 2 0 \n",
"void shfree(void *) C 2 0 \n",
".TAU application 1 262834 \n",
"void shmem_init(void) C 1 0 \n",
"void shmem_broadcast64(void *, const void *, si... 1 0 \n",
"void shmem_longlong_sum_to_all(long long *, con... 1 0 \n",
"void shmem_finalize(void) C 1 0 \n",
"\n",
" Exclusive Inclusive \\\n",
"Timer \n",
"void shmem_barrier_all(void) C 2194807 2194807 \n",
"long long shmem_longlong_fadd(long long *, long... 222176 222176 \n",
"void shmem_longlong_p(long long *, long long, i... 38757 38757 \n",
"void shmem_longlong_put(long long *, const long... 4576 4576 \n",
"void shmem_int_sum_to_all(int *, const int *, i... 3108 3108 \n",
"int shmem_n_pes(void) C 2 2 \n",
"int shmem_my_pe(void) C 0 0 \n",
"void *shmalloc(size_t) C 18 18 \n",
"void shfree(void *) C 915 915 \n",
".TAU application 54530 6493783 \n",
"void shmem_init(void) C 3974524 3974524 \n",
"void shmem_broadcast64(void *, const void *, si... 109 109 \n",
"void shmem_longlong_sum_to_all(long long *, con... 22 22 \n",
"void shmem_finalize(void) C 239 239 \n",
"\n",
" ProfileCalls \\\n",
"Timer \n",
"void shmem_barrier_all(void) C 0 \n",
"long long shmem_longlong_fadd(long long *, long... 0 \n",
"void shmem_longlong_p(long long *, long long, i... 0 \n",
"void shmem_longlong_put(long long *, const long... 0 \n",
"void shmem_int_sum_to_all(int *, const int *, i... 0 \n",
"int shmem_n_pes(void) C 0 \n",
"int shmem_my_pe(void) C 0 \n",
"void *shmalloc(size_t) C 0 \n",
"void shfree(void *) C 0 \n",
".TAU application 0 \n",
"void shmem_init(void) C 0 \n",
"void shmem_broadcast64(void *, const void *, si... 0 \n",
"void shmem_longlong_sum_to_all(long long *, con... 0 \n",
"void shmem_finalize(void) C 0 \n",
"\n",
" Group \\\n",
"Timer \n",
"void shmem_barrier_all(void) C GROUP=\"TAU_USER\" \n",
"long long shmem_longlong_fadd(long long *, long... GROUP=\"TAU_USER\" \n",
"void shmem_longlong_p(long long *, long long, i... GROUP=\"TAU_USER\" \n",
"void shmem_longlong_put(long long *, const long... GROUP=\"TAU_USER\" \n",
"void shmem_int_sum_to_all(int *, const int *, i... GROUP=\"TAU_USER\" \n",
"int shmem_n_pes(void) C GROUP=\"TAU_USER\" \n",
"int shmem_my_pe(void) C GROUP=\"TAU_USER\" \n",
"void *shmalloc(size_t) C GROUP=\"TAU_USER\" \n",
"void shfree(void *) C GROUP=\"TAU_USER\" \n",
".TAU application GROUP=\"TAU_USER\" \n",
"void shmem_init(void) C GROUP=\"TAU_USER\" \n",
"void shmem_broadcast64(void *, const void *, si... GROUP=\"TAU_USER\" \n",
"void shmem_longlong_sum_to_all(long long *, con... GROUP=\"TAU_USER\" \n",
"void shmem_finalize(void) C GROUP=\"TAU_USER\" \n",
"\n",
" Timer Name \\\n",
"Timer \n",
"void shmem_barrier_all(void) C void shmem_barrier_all(void) C \n",
"long long shmem_longlong_fadd(long long *, long... long long shmem_longlong_fadd(long long *, lon... \n",
"void shmem_longlong_p(long long *, long long, i... void shmem_longlong_p(long long *, long long, ... \n",
"void shmem_longlong_put(long long *, const long... void shmem_longlong_put(long long *, const lon... \n",
"void shmem_int_sum_to_all(int *, const int *, i... void shmem_int_sum_to_all(int *, const int *, ... \n",
"int shmem_n_pes(void) C int shmem_n_pes(void) C \n",
"int shmem_my_pe(void) C int shmem_my_pe(void) C \n",
"void *shmalloc(size_t) C void *shmalloc(size_t) C \n",
"void shfree(void *) C void shfree(void *) C \n",
".TAU application .TAU application \n",
"void shmem_init(void) C void shmem_init(void) C \n",
"void shmem_broadcast64(void *, const void *, si... void shmem_broadcast64(void *, const void *, s... \n",
"void shmem_longlong_sum_to_all(long long *, con... void shmem_longlong_sum_to_all(long long *, co... \n",
"void shmem_finalize(void) C void shmem_finalize(void) C \n",
"\n",
" Timer Location Timer Type \n",
"Timer \n",
"void shmem_barrier_all(void) C None None \n",
"long long shmem_longlong_fadd(long long *, long... None None \n",
"void shmem_longlong_p(long long *, long long, i... None None \n",
"void shmem_longlong_put(long long *, const long... None None \n",
"void shmem_int_sum_to_all(int *, const int *, i... None None \n",
"int shmem_n_pes(void) C None None \n",
"int shmem_my_pe(void) C None None \n",
"void *shmalloc(size_t) C None None \n",
"void shfree(void *) C None None \n",
".TAU application None None \n",
"void shmem_init(void) C None None \n",
"void shmem_broadcast64(void *, const void *, si... None None \n",
"void shmem_longlong_sum_to_all(long long *, con... None None \n",
"void shmem_finalize(void) C None None "
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"profile.interval_data().loc[0,0,0].sort_values('Calls', ascending=False)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Find the mean exclusive time for each timer across all (node, context, thread) indices."
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Exclusive</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Timer</th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>.TAU application</th>\n",
" <td>5.818211e+04</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_init(void) C</th>\n",
" <td>3.902098e+06</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_n_pes(void) C</th>\n",
" <td>1.562500e+00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>int shmem_my_pe(void) C</th>\n",
" <td>1.078125e+00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_barrier_all(void) C</th>\n",
" <td>2.160057e+06</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_int_sum_to_all(int *, const int *, int, int, int, int, int *, long *) C</th>\n",
" <td>2.859750e+03</td>\n",
" </tr>\n",
" <tr>\n",
" <th>long long shmem_longlong_fadd(long long *, long long, int) C</th>\n",
" <td>2.407764e+05</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_p(long long *, long long, int) C</th>\n",
" <td>4.205644e+04</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_broadcast64(void *, const void *, size_t, int, int, int, int, long *) C</th>\n",
" <td>2.562969e+02</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void *shmalloc(size_t) C</th>\n",
" <td>2.093750e+01</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_put(long long *, const long long *, size_t, int) C</th>\n",
" <td>1.089719e+04</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shfree(void *) C</th>\n",
" <td>9.131719e+02</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_longlong_sum_to_all(long long *, const long long *, int, int, int, int, long long *, long *) C</th>\n",
" <td>1.981250e+01</td>\n",
" </tr>\n",
" <tr>\n",
" <th>void shmem_finalize(void) C</th>\n",
" <td>2.581562e+02</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Exclusive\n",
"Timer \n",
".TAU application 5.818211e+04\n",
"void shmem_init(void) C 3.902098e+06\n",
"int shmem_n_pes(void) C 1.562500e+00\n",
"int shmem_my_pe(void) C 1.078125e+00\n",
"void shmem_barrier_all(void) C 2.160057e+06\n",
"void shmem_int_sum_to_all(int *, const int *, i... 2.859750e+03\n",
"long long shmem_longlong_fadd(long long *, long... 2.407764e+05\n",
"void shmem_longlong_p(long long *, long long, i... 4.205644e+04\n",
"void shmem_broadcast64(void *, const void *, si... 2.562969e+02\n",
"void *shmalloc(size_t) C 2.093750e+01\n",
"void shmem_longlong_put(long long *, const long... 1.089719e+04\n",
"void shfree(void *) C 9.131719e+02\n",
"void shmem_longlong_sum_to_all(long long *, con... 1.981250e+01\n",
"void shmem_finalize(void) C 2.581562e+02"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"profile.interval_data().groupby('Timer').agg({'Exclusive': 'mean'})"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Log-scale bar plot of the mean exclusive time for each timer, drawn with pandas' Matplotlib-based plotting."
]
},
{
"cell_type": "code",
"execution_count": 18,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"<matplotlib.axes._subplots.AxesSubplot at 0x1140dbbe0>"
]
},
"execution_count": 18,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 432x288 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"profile.interval_data().groupby('Timer').agg({'Exclusive': 'mean'}).plot.bar(log=True)"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.5"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment