Peter pszemraj

## USAGE.md

      
              2 files
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                pszemraj
                / USAGE.md
            
            
              Last active
              May 19, 2024 18:40
            
              
                how to use unsloth grad checkpointing
              
          
    usage


Credit/source: here

how to use unsloth grad checkpointing
steps

To integrate the provided monkey patch for offloading gradient checkpointing into the Hugging Face transformers library, you need to follow these steps:

  
## datasets_split.py
import os

import numpy as np

from datasets import ClassLabel, Dataset, DatasetDict


def split_dataset(
    dataset: Dataset,
    test_size=0.025,

## enable_tf32.py
import torch
import logging


def check_ampere_gpu():
    """
    Check if the GPU supports NVIDIA Ampere or later and enable TF32 in PyTorch if it does.
    """
    # Check if CUDA is available
    if not torch.cuda.is_available():

## hf_repofolder_watchdog.py
import argparse
import logging
import time
from datetime import datetime
from pathlib import Path
from typing import Optional

from huggingface_hub import upload_folder
from watchdog.events import PatternMatchingEventHandler
from watchdog.observers import Observer

## calculate_code_readability.py
import re
from itertools import chain


def calculate_readability(code_string:str) -> float:
    code = code_string.splitlines()

    # Heuristic 1: Line length
    max_line_length = 80
    long_lines = sum(1 for line in code if len(line) > max_line_length)

## generic_embedder.py
"""
generic & basic sbert-like embedder class for the jina-bert model

Usage:

model = EmbeddingModel("jinaai/jina-embeddings-v2-base-en")
embeddings = model.encode(
        ["How is the weather today?", "What is the current weather like today?"]
    )
print(model.cos_sim(embeddings[0], embeddings[1]))

## download_URLs_in_file.py
import os
import argparse
import requests
from urllib.parse import urlparse
from tqdm import tqdm
from joblib import Parallel, delayed
from tenacity import retry, stop_after_attempt, wait_fixed


@retry(stop=stop_after_attempt(5), wait=wait_fixed(2))

## train_tokenizer.py
import logging
import gzip
from pathlib import Path
import fire
from tqdm import tqdm
from tokenizers import (
    Tokenizer,
    decoders,
    models,
    normalizers,

## nougat_em.sh
#!/bin/bash

# pip install nougat-ocr
# see https://github.com/facebookresearch/nougat for details and license

DEFAULT_BATCHSIZE=4

usage() {
    echo "Usage: $0 <path_to_directory> [--batchsize BATCHSIZE]"
    exit 1

## merge_peft.py
# Example usage:
# python merge_peft.py --base_model=meta-llama/Llama-2-7b-hf --peft_model=./qlora-out --hub_id=alpaca-qlora

from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel
import torch

import argparse

def get_args():
	import os

	import numpy as np

	from datasets import ClassLabel, Dataset, DatasetDict


	def split_dataset(
	dataset: Dataset,
	test_size=0.025,
	import torch
	import logging


	def check_ampere_gpu():
	"""
	Check if the GPU supports NVIDIA Ampere or later and enable TF32 in PyTorch if it does.
	"""
	# Check if CUDA is available
	if not torch.cuda.is_available():
	import argparse
	import logging
	import time
	from datetime import datetime
	from pathlib import Path
	from typing import Optional

	from huggingface_hub import upload_folder
	from watchdog.events import PatternMatchingEventHandler
	from watchdog.observers import Observer
	import re
	from itertools import chain


	def calculate_readability(code_string:str) -> float:
	code = code_string.splitlines()

	# Heuristic 1: Line length
	max_line_length = 80
	long_lines = sum(1 for line in code if len(line) > max_line_length)
	"""
	generic & basic sbert-like embedder class for the jina-bert model

	Usage:

	model = EmbeddingModel("jinaai/jina-embeddings-v2-base-en")
	embeddings = model.encode(
	["How is the weather today?", "What is the current weather like today?"]
	)
	print(model.cos_sim(embeddings[0], embeddings[1]))
	import os
	import argparse
	import requests
	from urllib.parse import urlparse
	from tqdm import tqdm
	from joblib import Parallel, delayed
	from tenacity import retry, stop_after_attempt, wait_fixed


	@retry(stop=stop_after_attempt(5), wait=wait_fixed(2))
	import logging
	import gzip
	from pathlib import Path
	import fire
	from tqdm import tqdm
	from tokenizers import (
	Tokenizer,
	decoders,
	models,
	normalizers,
	#!/bin/bash

	# pip install nougat-ocr
	# see https://github.com/facebookresearch/nougat for details and license

	DEFAULT_BATCHSIZE=4

	usage() {
	echo "Usage: $0 <path_to_directory> [--batchsize BATCHSIZE]"
	exit 1
	# Example usage:
	# python merge_peft.py --base_model=meta-llama/Llama-2-7b-hf --peft_model=./qlora-out --hub_id=alpaca-qlora

	from transformers import AutoModelForCausalLM, AutoTokenizer
	from peft import PeftModel
	import torch

	import argparse

	def get_args():