Vlad Lialin Guitaricet

## check_wandb_login.py
import netrc
import os

def is_wandb_logged_in():
    netrc_path = os.path.expanduser("~/.netrc")
    if not os.path.exists(netrc_path):
        return False

    auth = netrc.netrc(netrc_path).authenticators("api.wandb.ai")
    return bool(auth)

## better_repr.py
from torch.nn import ModuleList


def _addindent(s_, numSpaces):
    s = s_.split('\n')
    # don't do anything for single-line stuff
    if len(s) == 1:
        return s_
    first = s.pop(0)
    s = [(numSpaces * ' ') + line for line in s]

## named_shape.py
import torch


class NamedShape:
    """A convenience class to make beautifully named shapes."""
    def __init__(self, tensor) -> None:
        self.names = tensor.names
        self.shape = tensor.shape

    def __repr__(self) -> str:

## generate_multigpu.py
# torchrun --nproc_per_node 2 generate_multigpu.py
# tested on torch==1.12.1 and transformers==4.21
import os
import json

import torch
import torch.distributed as dist

import transformers
import datasets

## logger.py
import os
import sys
import logging

logging.basicConfig(
    format="%(asctime)s | %(levelname)s | %(name)s | %(message)s",
    datefmt="%Y-%m-%d %H:%M:%S",
    level=logging.INFO,
    stream=sys.stdout,
)

## learning_subspaces.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                Guitaricet
                / learning_subspaces.ipynb
            
            
              Created
              April 5, 2021 19:33
            
              
                A quick and dirty reimplementation of the training algorithm from Learning Neural Network Subspaces, Wortsman et al., https://arxiv.org/abs/2102.10472
              
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## lite_transformer.py
class LiteTransformerLayer(nn.Module):
    def __init__(self, dim=496, heads=4, kernel_size=4):
        super().__init__()
        assert dim % 2 == 0

        self.attention = Attention(dim // 2, heads=heads)
        self.cnn = LightweightConv(dim // 2, kernel=kernel_size)  # or Dynamic conv

        self.fc = nn.Sequential(
            nn.Linear(dim, dim),

## transformer.py
class TransformerLayer(nn.Module):
    def __init__(self, dim=496, heads=4, ffn_dim=1984):
        super().__init__()
        self.attention = Attention(dim, heads=heads)

        self.fc = nn.Sequential(
            nn.Linear(dim, ffn_dim),
            nn.ReLU(),  # chose your favorite nonlinearity here
            nn.Linear(ffn_dim, dim),
        )

## att.py
# Just dot product self-attention
class SelfAttention(nn.Module):
    def __init__(self, dim=7):
        super().__init__()
        self.K = nn.Linear(dim, dim)
        self.Q = nn.Linear(dim, dim)
        self.V = nn.Linear(dim, dim)
        self.scale = dim ** 0.5

    def forward(self, x):

## ipynb_output_filter.py
#!/usr/bin/env python3

import sys

try:
    runarg_idx = sys.argv.index('--rundir')
    rundir = sys.argv[runarg_idx+1]
    import os
    os.chdir(os.path.expanduser(rundir))
except ValueError:
	import netrc
	import os

	def is_wandb_logged_in():
	netrc_path = os.path.expanduser("~/.netrc")
	if not os.path.exists(netrc_path):
	return False

	auth = netrc.netrc(netrc_path).authenticators("api.wandb.ai")
	return bool(auth)
	from torch.nn import ModuleList


	def _addindent(s_, numSpaces):
	s = s_.split('\n')
	# don't do anything for single-line stuff
	if len(s) == 1:
	return s_
	first = s.pop(0)
	s = [(numSpaces * ' ') + line for line in s]
	import torch


	class NamedShape:
	"""A convenience class to make beautifully named shapes."""
	def __init__(self, tensor) -> None:
	self.names = tensor.names
	self.shape = tensor.shape

	def __repr__(self) -> str:
	# torchrun --nproc_per_node 2 generate_multigpu.py
	# tested on torch==1.12.1 and transformers==4.21
	import os
	import json

	import torch
	import torch.distributed as dist

	import transformers
	import datasets
	import os
	import sys
	import logging

	logging.basicConfig(
	format="%(asctime)s \| %(levelname)s \| %(name)s \| %(message)s",
	datefmt="%Y-%m-%d %H:%M:%S",
	level=logging.INFO,
	stream=sys.stdout,
	)
	class LiteTransformerLayer(nn.Module):
	def __init__(self, dim=496, heads=4, kernel_size=4):
	super().__init__()
	assert dim % 2 == 0

	self.attention = Attention(dim // 2, heads=heads)
	self.cnn = LightweightConv(dim // 2, kernel=kernel_size) # or Dynamic conv

	self.fc = nn.Sequential(
	nn.Linear(dim, dim),
	class TransformerLayer(nn.Module):
	def __init__(self, dim=496, heads=4, ffn_dim=1984):
	super().__init__()
	self.attention = Attention(dim, heads=heads)

	self.fc = nn.Sequential(
	nn.Linear(dim, ffn_dim),
	nn.ReLU(), # chose your favorite nonlinearity here
	nn.Linear(ffn_dim, dim),
	)
	# Just dot product self-attention
	class SelfAttention(nn.Module):
	def __init__(self, dim=7):
	super().__init__()
	self.K = nn.Linear(dim, dim)
	self.Q = nn.Linear(dim, dim)
	self.V = nn.Linear(dim, dim)
	self.scale = dim ** 0.5

	def forward(self, x):
	#!/usr/bin/env python3

	import sys

	try:
	runarg_idx = sys.argv.index('--rundir')
	rundir = sys.argv[runarg_idx+1]
	import os
	os.chdir(os.path.expanduser(rundir))
	except ValueError: