Cheng Li (cli99)
#!/bin/sh
# requirements
# - wget
# prepare directory
mkdir -p ~/.local/bin
mkdir -p ~/.config
if ! [ -x "$(command -v tmux)" ]; then
@cli99
cli99 / profile_inception_v4.py
Last active June 25, 2022 02:37
profile_inception_v4
import timm
from timm.data import resolve_data_config
from timm.data.transforms_factory import create_transform
import torch
from deepspeed.profiling.flops_profiler import get_model_profile
model = timm.create_model('inception_v4', pretrained=True)
model.eval()
config = resolve_data_config({}, model=model)
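The preview stops before the profiler call. A minimal sketch of how it likely continues, assuming the gist feeds the timm data config's input size to DeepSpeed's get_model_profile (the batch size and print options are assumptions):

batch_size = 1
input_shape = (batch_size, *config['input_size'])  # e.g. (1, 3, 299, 299) for inception_v4
flops, macs, params = get_model_profile(
    model=model,
    input_shape=input_shape,
    print_profile=True,  # print the per-module breakdown
    as_string=True,      # return human-readable strings
)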
@cli99
cli99 / bet-base-flops.txt
Created June 24, 2022 22:24
bert-base-flops
-------------------------- DeepSpeed Flops Profiler --------------------------
Profile Summary at step 1:
Notations:
data parallel size (dp_size), model parallel size(mp_size),
number of parameters (params), number of multiply-accumulate operations(MACs),
number of floating-point operations (flops), floating-point operations per second (FLOPS),
fwd latency (forward propagation latency), bwd latency (backward propagation latency),
step (weights update latency), iter latency (sum of fwd, bwd and step latency)
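Only the profile header survives in the preview. A hedged sketch of how a BERT-base profile like this can be produced with the DeepSpeed flops profiler; the model name, batch size, and sequence length are assumptions, not taken from the gist:

import torch
from transformers import AutoConfig, AutoModel
from deepspeed.profiling.flops_profiler import get_model_profile

config = AutoConfig.from_pretrained('bert-base-uncased')
model = AutoModel.from_config(config)  # randomly initialized weights suffice for FLOPs counting
batch_size, seq_len = 1, 128
inputs = {
    'input_ids': torch.zeros(batch_size, seq_len, dtype=torch.long),
    'attention_mask': torch.ones(batch_size, seq_len, dtype=torch.long),
}
flops, macs, params = get_model_profile(model=model, kwargs=inputs, print_profile=True)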
@cli99
cli99 / get_hf_models.py
Created April 12, 2022 08:33
query huggingface models
from transformers import CONFIG_MAPPING
from huggingface_hub import HfApi
api = HfApi()
def _get_all_hf_model_types():
    return list(CONFIG_MAPPING.keys())

def _get_total_downloads_by_model_type(model_type):
    models = api.list_models(filter=model_type)
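The preview ends inside _get_total_downloads_by_model_type. A hedged completion; whether ModelInfo exposes a downloads attribute depends on the huggingface_hub version, so that access is an assumption:

    # Sum per-model download counts, treating a missing attribute as zero (assumed field).
    return sum(getattr(m, 'downloads', 0) or 0 for m in models)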
@cli99
cli99 / test_pt_profiler.py
Last active September 9, 2021 01:07
layer-by-layer profiling using record_function
import torch
import torch.nn as nn
from torch.profiler import profile, record_function, ProfilerActivity
import torchprof
class NeuralNetwork(nn.Module):
    def __init__(self):
        super(NeuralNetwork, self).__init__()
        self.flatten = nn.Flatten()
        self.linear_relu_stack = nn.Sequential(
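The class body is cut off above. A minimal sketch of the layer-by-layer pattern the title describes, using only torch.profiler from the imports; the layer sizes and input shape are assumptions:

model = nn.Sequential(nn.Flatten(), nn.Linear(28 * 28, 512), nn.ReLU(), nn.Linear(512, 10))
x = torch.randn(1, 1, 28, 28)
with profile(activities=[ProfilerActivity.CPU]) as prof:
    out = x
    for name, layer in model.named_children():
        with record_function(f'layer_{name}'):  # label each layer's ops in the trace
            out = layer(out)
print(prof.key_averages().table(sort_by='cpu_time_total'))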
@cli99
cli99 / pr.md
Created May 13, 2021 18:16 — forked from piscisaureus/pr.md
Checkout github pull requests locally

Locate the section for your GitHub remote in the .git/config file. It looks like this:

[remote "origin"]
	fetch = +refs/heads/*:refs/remotes/origin/*
	url = git@github.com:joyent/node.git

Now add the line fetch = +refs/pull/*/head:refs/remotes/origin/pr/* to this section. Change the GitHub URL to match your project's URL. It ends up looking like this:
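
[remote "origin"]
	fetch = +refs/heads/*:refs/remotes/origin/*
	url = git@github.com:joyent/node.git
	fetch = +refs/pull/*/head:refs/remotes/origin/pr/*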

@cli99
cli99 / busy.py
Last active February 20, 2022 06:46
Keep GPU busy
import argparse
import torch
import torch.distributed as dist
parser = argparse.ArgumentParser()
parser.add_argument("--local_rank", type=int)
args = parser.parse_args()
device = args.local_rank
dist.init_process_group('nccl')
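The loop body is cut off. A hedged sketch of what "keep GPU busy" presumably does after initialization: pin each rank to its device and run matmuls endlessly. The matrix size and the infinite loop are assumptions:

torch.cuda.set_device(device)
a = torch.randn(4096, 4096, device=device)
while True:
    b = a @ a  # dense matmul keeps the GPU's compute units saturated
    torch.cuda.synchronize()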
@cli99
cli99 / bash
Created January 25, 2021 22:50 — forked from panchicore/bash
solve perl: warning: Setting locale failed.
perl: warning: Setting locale failed.
perl: warning: Please check that your locale settings:
LANGUAGE = (unset),
LC_ALL = (unset),
LC_CTYPE = "UTF-8",
LANG = "en_US.UTF-8"
are supported and installed on your system.
perl: warning: Falling back to the standard locale ("C").
~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~ ~
@cli99
cli99 / megatron-lm.txt
Created November 2, 2020 21:37
flops counter example output
deepspeed --num_nodes 1 --num_gpus 16 pretrain_gpt2.py \
  --model-parallel-size 1 --num-layers 4 --hidden-size 512 --num-attention-heads 8 \
  --seq-length 512 --max-position-embeddings 4096 --batch-size 1 --train-iters 10 \
  --lr-decay-iters 320000 --data-path data/webtext/webtext_text_document \
  --vocab-file data/gpt2-vocab.json --merge-file data/gpt2-merges.txt --data-impl mmap \
  --split 949,50,1 --distributed-backend nccl --lr 1.5e-4 --lr-decay-style cosine \
  --min-lr 1.0e-5 --weight-decay 1e-2 --clip-grad 1.0 --warmup 0.01 --log-interval 100 \
  --save-interval 10000 --eval-interval 1000 --eval-iters 10 --fp16 --hysteresis 2 \
  --num-workers 0 --deepspeed \
  --deepspeed_config /home/chengli1/projects/Megatron-LM/examples/ds_zero_stage_2_config.json \
  --zero-stage 0 --zero-reduce-bucket-size 50000000 --zero-allgather-bucket-size 5000000000 \
  --zero-contigious-gradients --zero-reduce-scatter --checkpoint-activations \
  --checkpoint-num-layers 1 --partition-activations --synchronize-each-layer \
  --contigious-checkpointing
[2020-10-30 23:43:3
@cli99
cli99 / get_python_cmake_flags.py
Created September 8, 2018 22:12
get_python_cmake_flags.py
## @package get_python_cmake_flags
# Module scripts.get_python_cmake_flags
##############################################################################
# Use this script to find your preferred python installation.
##############################################################################
#
# You can use the following to build with your preferred version of python
# if your installation is not being properly detected by CMake.
#
# mkdir -p build && cd build
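# (assumed continuation of the truncated comment block: pass this script's
# output as flags to the CMake invocation)
# cmake $(python ../scripts/get_python_cmake_flags.py) ..
# make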