Vui Seng Chua vuiseng9

## bench_linear.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                vuiseng9
                / bench_linear.md
            
            
              Last active
              July 11, 2024 19:38
            
          
    $ python bench_linear.py --bs 1
BS:    1, Latency:    0.389 ms, IC:  4096, OC: 11008, Samples: 100, Warmup: 10

$ python bench_linear.py --bs 128
BS:  128, Latency:    3.640 ms, IC:  4096, OC: 11008, Samples: 100, Warmup: 10

$ python bench_linear.py --bs 1024
BS: 1024, Latency:   41.244 ms, IC:  4096, OC: 11008, Samples: 100, Warmup: 10

  
## temp.md

      
              1 file
            
          
              0 forks
            
          
              1 comment
            
          
              0 stars
            
          
                vuiseng9
                / temp.md
            
            
              Created
              April 12, 2024 04:28
            
          
    import intel_extension_for_pytorch # required for XPU
import torch
from bigdl.llm.transformers import AutoModelForCausalLM
from transformers import AutoTokenizer, pipeline

# model_id = "facebook/opt-1.3b"
# model_id = "meta-llama/Llama-2-7b"
model_id = "meta-llama/Llama-2-7b-chat-hf"
prompt = "I love the Avengers,"

  
## prompt_creator.md

      
              1 file
            
          
              0 forks
            
          
              1 comment
            
          
              0 stars
            
          
                vuiseng9
                / prompt_creator.md
            
            
              Last active
              March 5, 2024 20:07
            
          
    import warnings
from transformers import AutoTokenizer

class PromptCreator:
    def __init__(self, model_id):
        self.tokenizer = AutoTokenizer.from_pretrained(model_id)
        self.offset = len(self.tokenizer(self.tokenizer.special_tokens_map['bos_token'])['input_ids'])
        self.samples = [
                                {

  
## bigcode.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                vuiseng9
                / bigcode.md
            
            
              Last active
              January 24, 2024 02:52
            
          
    Install

git clone https://github.com/bigcode-project/bigcode-evaluation-harness
pip install -e .
Deterministic Generation

mistralai/Mistral-7B-v0.1 should result in "pass@1": 0.29878 (paper: 30.5%, a 0.7% gap)
accelerate launch $WORKDIR/main.py \

  
## watched_jira.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                vuiseng9
                / watched_jira.md
            
            
              Created
              November 2, 2023 16:16
            
              
                JQL (Jira Query Language) query to filter watched issues
              
          
    From

https://community.atlassian.com/t5/Jira-Core-Server-questions/how-to-find-all-issues-i-am-watching/qaq-p/2332
watcher = currentUser() AND resolution = Unresolved ORDER BY priority DESC, updated DESC


## hf-download.py
import os
from huggingface_hub import snapshot_download

# Identifier of the Hugging Face repository to download
# (the literal "repo_id" is presumably a placeholder -- replace before running).
REPO_ID = "repo_id"
# Root directory under which the downloaded snapshot directory is created.
LOCAL_ROOT = "/hf-model"
# Destination directory: LOCAL_ROOT joined with the last path component of REPO_ID.
LOCAL_DIR = os.path.join(LOCAL_ROOT, os.path.split(REPO_ID)[1])

# Fetch the repository snapshot into LOCAL_DIR.
snapshot_download(
    local_dir_use_symlinks=False,
    local_dir=LOCAL_DIR,
    repo_id=REPO_ID,
)

## build-ov-rt.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                vuiseng9
                / build-ov-rt.md
            
            
              Last active
              October 23, 2023 14:08
            
              
                build-ov-rt.md
              
          
    cheatsheet

# based on the following
https://github.com/openvinotoolkit/openvino/wiki/BuildingForLinux
(new) https://github.com/openvinotoolkit/openvino/blob/master/docs/dev/build_linux.md

# create conda env and activate environment (optional but recommended, use python 3.8/3.9)

git clone https://github.com/openvinotoolkit/openvino
# check out the tag or commit accordingly

  
## hf-text-gen-pipeline.md

      
              1 file
            
          
              0 forks
            
          
              5 comments
            
          
              0 stars
            
          
                vuiseng9
                / hf-text-gen-pipeline.md
            
            
              Last active
              September 11, 2023 05:27
            
          
    Setup

pip install transformers torch
git clone https://huggingface.co/EleutherAI/gpt-j-6b # depends on git-lfs 
Run the following as a Python script

from transformers import AutoTokenizer, pipeline

  
## reshape_ov_ir.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                vuiseng9
                / reshape_ov_ir.md
            
            
              Last active
              February 20, 2023 03:59
            
          
    import os
import logging as log
from openvino.runtime import Core, PartialShape, serialize

log.info = print

def get_input_output_names(ports):
    """Return the ``any_name`` attribute of each port as a list.

    Args:
        ports: Iterable of objects exposing an ``any_name`` attribute.

    Returns:
        A new list of the ``any_name`` values, in iteration order.
    """
    names = []
    for current_port in ports:
        names.append(current_port.any_name)
    return names

  
## inspect_ov_ir_weights.py
# Openvino==2022.1.0
import sys

from openvino.runtime import Core

DELIMITER = ' | '

if len(sys.argv) < 3:
    print("Please provide path to model xml file as a first arg and"
          " path to output text file to dump model constants.")
	import os
	from huggingface_hub import snapshot_download

	REPO_ID = "repo_id"
	LOCAL_ROOT= "/hf-model"
	LOCAL_DIR = os.path.join(LOCAL_ROOT, os.path.basename(REPO_ID))

	snapshot_download(repo_id=REPO_ID, local_dir=LOCAL_DIR, local_dir_use_symlinks=False)
	# Openvino==2022.1.0
	import sys

	from openvino.runtime import Core

	DELIMITER = ' \| '

	if len(sys.argv) < 3:
	print("Please provide path to model xml file as a first arg and"
	" path to output text file to dump model constants.")