Vikas Raunak vyraun

## threading_example.py
import threading
import time


class ThreadingExample(object):
    """ Threading example class

    The run() method will be started and it will run in the background
    until the application exits.
    """

## pytorch_performance_profiling.md

      
              2 files
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                vyraun
                / pytorch_performance_profiling.md
            
            
              Created
              March 20, 2022 15:59
                — forked from mingfeima/pytorch_performance_profiling.md
            
              
                How to do performance profiling on PyTorch
              
          
    (Internal Training Material)
Usually the first step in performance optimization is to do profiling, e.g. to identify performance hotspots of a workload.
This gist covers the basics of performance profiling on PyTorch. You will learn:

How to find the bottleneck operator?
How to trace source file of a particular operator?
How do I identify threading issues? (oversubscription)
How do I tell whether a specific operator is running efficiently?

This tutorial takes one of my recent projects, pssp-transformer, as an example to guide you through the path of PyTorch CPU performance optimization. Focus will be on Part 1 & Part 2.

  
## dataset.py
def load_train_data(path: str, sort: bool) -> List[Example]:
    sentences = list()
    with open(path) as f:
        first = False
        for line in f:
            if not first:
                first = True
                continue
            text_a, text_b, label = line.rstrip().split("\t")
            lab = len(text_a) + len(text_b)

## Makefile
# required by (\ SHELL COMMANDS \)
SHELL:=/bin/bash

VIRT_ENV_FOLDER = ~/.local/share/virtualenvs/xnli
SOURCE_VIRT_ENV = source $(VIRT_ENV_FOLDER)/bin/activate


.PHONY: train
train:
	( \

## Mixture_of_softmaxes.py
# PyTorch code For implementing the mixture of softmaxes layer from
# "Breaking the Softmax Bottleneck: A High-Rank RNN Language Model"
# https://arxiv.org/abs/1711.03953
# Project `out` through the fully connected layer. The slicing below reads the
# result as n_components consecutive groups of nClasses columns (one group of
# class logits per mixture component) with the last n_components columns used
# as the mixture-prior logits.
# NOTE(review): assumes `context` is 2-D (rows x columns) -- confirm in caller.
context = self.fc(out)

# Non-log version
# `dim=1` is passed explicitly: calling F.softmax without `dim` is deprecated
# and emits a warning; for a 2-D input the implicit choice was already dim 1.
priors = F.softmax(context[:, -self.n_components:], dim=1)
mixtures = torch.stack(
    [
        # Weight each component's class distribution by that component's prior.
        priors[:, i].unsqueeze(1)
        * F.softmax(context[:, i * self.nClasses:(i + 1) * self.nClasses], dim=1)
        for i in range(self.n_components)
    ],
    1,
)
# Sum the weighted component distributions, then take the log.
out = torch.log(mixtures.sum(1))

## Mixture_of_softmaxes.py
# PyTorch code For implementing the mixture of softmaxes layer from
# "Breaking the Softmax Bottleneck: A High-Rank RNN Language Model"
# https://arxiv.org/abs/1711.03953
# Project `out` through the fully connected layer. The slicing below reads the
# result as n_components consecutive groups of nClasses columns (one group of
# class logits per mixture component) with the last n_components columns used
# as the mixture-prior logits.
# NOTE(review): assumes `context` is 2-D (rows x columns) -- confirm in caller.
context = self.fc(out)

# Non-log version
# `dim=1` is passed explicitly: calling F.softmax without `dim` is deprecated
# and emits a warning; for a 2-D input the implicit choice was already dim 1.
priors = F.softmax(context[:, -self.n_components:], dim=1)
mixtures = torch.stack(
    [
        # Weight each component's class distribution by that component's prior.
        priors[:, i].unsqueeze(1)
        * F.softmax(context[:, i * self.nClasses:(i + 1) * self.nClasses], dim=1)
        for i in range(self.n_components)
    ],
    1,
)
# Sum the weighted component distributions, then take the log.
out = torch.log(mixtures.sum(1))

## st-gumbel.py
from __future__ import print_function
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.autograd import Variable

def sample_gumbel(shape, eps=1e-20, device="cuda"):
    """Sample Gumbel(0, 1) noise as ``-log(-log(U + eps) + eps)``.

    ``U`` is drawn uniformly from ``[0, 1)`` with ``torch.rand``.

    Args:
        shape: Size passed to ``torch.rand``.
        eps: Small constant added inside both logarithms so that neither
            is evaluated at zero.
        device: Device the uniform sample is moved to before the transform.
            Defaults to ``"cuda"``, which matches the previously hard-coded
            ``.cuda()`` call. Pass ``"cpu"`` on hosts without a GPU, or
            ``None`` to leave the sample where ``torch.rand`` created it.

    Returns:
        The transformed sample, wrapped in ``Variable``.
    """
    U = torch.rand(shape)
    # Sample first and move afterwards, as the original did with `.cuda()`.
    if device is not None:
        U = U.to(device)
    return -Variable(torch.log(-torch.log(U + eps) + eps))

## binary_crossentropy_with_ranking.py

def binary_crossentropy_with_ranking(y_true, y_pred):
    """ Trying to combine ranking loss with numeric precision"""
    # first get the log loss like normal
    logloss = K.mean(K.binary_crossentropy(y_pred, y_true), axis=-1)

    # next, build a rank loss

    # clip the probabilities to keep stability
    y_pred_clipped = K.clip(y_pred, K.epsilon(), 1-K.epsilon())

## weight_init.py
#!/usr/bin/env python
# -*- coding:UTF-8 -*-

import torch
import torch.nn as nn
import torch.nn.init as init


def weight_init(m):
    '''

## audio_tools.py
# Raised unconditionally at module level, so execution stops here; the message
# marks this file as deprecated/frozen and points to the repository holding
# the latest version.
raise ValueError("DEPRECATED/FROZEN - see https://github.com/kastnerkyle/tools for the latest")

# License: BSD 3-clause
# Authors: Kyle Kastner
# Harvest, Cheaptrick, D4C, WORLD routines based on MATLAB code from M. Morise
# http://ml.cs.yamanashi.ac.jp/world/english/
# MGC code based on r9y9 (Ryuichi Yamamoto) MelGeneralizedCepstrums.jl
# Pieces also adapted from SPTK
from __future__ import division
import numpy as np
	import threading
	import time


	class ThreadingExample(object):
	""" Threading example class

	The run() method will be started and it will run in the background
	until the application exits.
	"""
	def load_train_data(path: str, sort: bool) -> List[Example]:
	sentences = list()
	with open(path) as f:
	first = False
	for line in f:
	if not first:
	first = True
	continue
	text_a, text_b, label = line.rstrip().split("\t")
	lab = len(text_a) + len(text_b)
	# required by (\ SHELL COMMANDS \)
	SHELL:=/bin/bash

	VIRT_ENV_FOLDER = ~/.local/share/virtualenvs/xnli
	SOURCE_VIRT_ENV = source $(VIRT_ENV_FOLDER)/bin/activate


	.PHONY: train
	train:
	( \
	# PyTorch code For implementing the mixture of softmaxes layer from
	# "Breaking the Softmax Bottleneck: A High-Rank RNN Language Model"
	# https://arxiv.org/abs/1711.03953
	# Project `out` through the fully connected layer. The slicing below reads
	# the result as n_components consecutive groups of nClasses columns (one
	# group of class logits per mixture component) with the last n_components
	# columns used as the mixture-prior logits.
	# NOTE(review): assumes `context` is 2-D (rows x columns) -- confirm in caller.
	context = self.fc(out)

	# Non-log version
	# `dim=1` is passed explicitly: calling F.softmax without `dim` is deprecated
	# and emits a warning; for a 2-D input the implicit choice was already dim 1.
	priors = F.softmax(context[:, -self.n_components:], dim=1)
	# Weight each component's class distribution by that component's prior.
	mixtures = torch.stack([priors[:, i].unsqueeze(1) * F.softmax(context[:, i * self.nClasses:(i + 1) * self.nClasses], dim=1) for i in range(self.n_components)], 1)
	# Sum the weighted component distributions, then take the log.
	out = torch.log(mixtures.sum(1))
	from __future__ import print_function
	import torch
	import torch.nn as nn
	import torch.nn.functional as F
	from torch.autograd import Variable

	def sample_gumbel(shape, eps=1e-20, device="cuda"):
	    """Sample Gumbel(0, 1) noise as ``-log(-log(U + eps) + eps)``.

	    ``U`` is drawn uniformly from ``[0, 1)`` with ``torch.rand``.

	    Args:
	        shape: Size passed to ``torch.rand``.
	        eps: Small constant added inside both logarithms so that neither
	            is evaluated at zero.
	        device: Device the uniform sample is moved to before the transform.
	            Defaults to ``"cuda"``, which matches the previously hard-coded
	            ``.cuda()`` call. Pass ``"cpu"`` on hosts without a GPU, or
	            ``None`` to leave the sample where ``torch.rand`` created it.

	    Returns:
	        The transformed sample, wrapped in ``Variable``.
	    """
	    U = torch.rand(shape)
	    # Sample first and move afterwards, as the original did with `.cuda()`.
	    if device is not None:
	        U = U.to(device)
	    return -Variable(torch.log(-torch.log(U + eps) + eps))

	def binary_crossentropy_with_ranking(y_true, y_pred):
	""" Trying to combine ranking loss with numeric precision"""
	# first get the log loss like normal
	logloss = K.mean(K.binary_crossentropy(y_pred, y_true), axis=-1)

	# next, build a rank loss

	# clip the probabilities to keep stability
	y_pred_clipped = K.clip(y_pred, K.epsilon(), 1-K.epsilon())
	#!/usr/bin/env python
	# -*- coding:UTF-8 -*-

	import torch
	import torch.nn as nn
	import torch.nn.init as init


	def weight_init(m):
	'''
	# Raises unconditionally; the message marks this file as deprecated/frozen
	# and points to the repository holding the latest version.
	raise ValueError("DEPRECATED/FROZEN - see https://github.com/kastnerkyle/tools for the latest")

	# License: BSD 3-clause
	# Authors: Kyle Kastner
	# Harvest, Cheaptrick, D4C, WORLD routines based on MATLAB code from M. Morise
	# http://ml.cs.yamanashi.ac.jp/world/english/
	# MGC code based on r9y9 (Ryuichi Yamamoto) MelGeneralizedCepstrums.jl
	# Pieces also adapted from SPTK
	from __future__ import division
	import numpy as np