Onuralp cx0

## hello_world.py
"""Hello world, with a genetic algorithm.

https://twitter.com/matthen2/status/1769368467067621791
"""

import random
import time
from dataclasses import dataclass
from itertools import chain
from typing import Iterable, List

## airoboros-gpt4-2.0.md

      
              3 files
            
          
              2 forks
            
          
              0 comments
            
          
              10 stars
            
          
                jondurbin
                / airoboros-gpt4-2.0.md
            
            
              Last active
              November 2, 2023 06:30
            
          
    Details on how the airoboros-gpt4-2.0 dataset was created.

Script

https://github.com/jondurbin/airoboros
pip install --upgrade airoboros==2.0.13

  
## llama2-mac-gpu.sh
# Clone llama.cpp
git clone https://github.com/ggerganov/llama.cpp.git
cd llama.cpp

# Build it
make clean
LLAMA_METAL=1 make

# Download model
export MODEL=llama-2-13b-chat.ggmlv3.q4_0.bin

## baka_trace.py
import traceback
import openai
import sys

# list models
models = openai.Model.list()

def baka(error, character="tsundere",):
    exc_type, exc_value, exc_traceback = sys.exc_info()
    traceback_list = traceback.extract_tb(exc_traceback)

## gpt_rec.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              5 stars
            
          
                liorfox
                / gpt_rec.md
            
            
              Created
              January 5, 2023 18:50
            
          
    Recursive games with ChatGPT

Lior Fox, January 2023
TL;DR: I present examples of apparent "symbolic" capabilities of ChatGPT, and discuss some context and possible interpretations
Motivation and scope

ChatGPT probably requires no introduction at this stage. If you haven't had the chance to play with it yet, you should do so (as long as it is free?). Before I dive in, it is perhaps better to clearly state what this post isn't about. I will not discuss:

Social, political, or economic aspects of Large Language Models (LLMs) and their deployment


## LLMs.md

      
              1 file
            
          
              21 forks
            
          
              34 comments
            
          
              342 stars
            
          
                yoavg
                / LLMs.md
            
            
              Last active
              February 17, 2024 18:39
            
          
    Some remarks on Large Language Models

Yoav Goldberg, January 2023

Audience: I assume you heard of chatGPT, maybe played with it a little, and were impressed by it (or tried very hard not to be). And that you also heard that it is "a large language model". And maybe that it "solved natural language understanding". Here is a short personal perspective of my thoughts on this (and similar) models, and where we stand with respect to language understanding.
Intro

Around 2014-2017, right within the rise of neural-network based methods for NLP, I was giving a semi-academic-semi-popsci lecture, revolving around the story that achieving perfect language modeling is equivalent to being as intelligent as a human. Somewhere around the same time I was also asked in an academic panel "what would you do if you were given infinite compute and no need to worry about labour costs" to which I cockily responded "I would train a really huge language model, just to show that it doesn't solve everything!". We

  
## operator_overload_stupidity.py
from typing import TypeVar, Generic, Callable
from dataclasses import dataclass
from argparse import Namespace

T = TypeVar('T')
S = TypeVar('S')

@dataclass
class ListMap(Generic[S, T]):
    f: Callable[[T], S]

## probs-odds-logits.R
library(tidyverse)
library(patchwork)
library(latex2exp)

logit_df <- tibble(x = seq(0, 100, length.out = 101),
                   logits = seq(-4, 4, length.out = 101)) |>
  mutate(odds = exp(logits)) |>
  mutate(probs = plogis(logits))

p1 <- ggplot(logit_df, aes(x = x, y = probs)) +

## CodeGen_GPTJ_Conversion.md

      
              1 file
            
          
              2 forks
            
          
              1 comment
            
          
              56 stars
            
          
                moyix
                / CodeGen_GPTJ_Conversion.md
            
            
              Last active
              January 5, 2024 12:50
            
              
                How to convert the SalesForce CodeGen models to GPT-J
              
          
    Using Linear Algebra to Convert a Large Code Model

Background

The SalesForce CodeGen models are a family of large language models trained on a large amount of natural language data and then fine-tuned on specialized datasets of code. Models of size 350M, 2B, 6B, and 16B parameters are provided in three flavors:

nl, the base model trained on The Pile, a large natural language dataset compiled by EleutherAI
multi, which is fine-tuned from the nl model on a dataset of code in multiple languages, scraped from GitHub, and
mono, which is fine-tuned from the multi model on Python code only.


## kaplan_meier_for_revenue.py
from matplotlib import pyplot
import random
import time

pyplot.style.use("ggplot")
now = time.time()

def generate_user(censor=now):
    # Pick some point in time the user was created
    t_created = t = now - random.random() * 1e7
	"""Hello world, with a genetic algorithm.

	https://twitter.com/matthen2/status/1769368467067621791
	"""

	import random
	import time
	from dataclasses import dataclass
	from itertools import chain
	from typing import Iterable, List
	# Clone llama.cpp
	git clone https://github.com/ggerganov/llama.cpp.git
	cd llama.cpp

	# Build it
	make clean
	LLAMA_METAL=1 make

	# Download model
	export MODEL=llama-2-13b-chat.ggmlv3.q4_0.bin
	import traceback
	import openai
	import sys

	# list models
	models = openai.Model.list()

	def baka(error, character="tsundere",):
	exc_type, exc_value, exc_traceback = sys.exc_info()
	traceback_list = traceback.extract_tb(exc_traceback)
	from typing import TypeVar, Generic, Callable
	from dataclasses import dataclass
	from argparse import Namespace

	T = TypeVar('T')
	S = TypeVar('S')

	@dataclass
	class ListMap(Generic[S, T]):
	f: Callable[[T], S]
	library(tidyverse)
	library(patchwork)
	library(latex2exp)

	logit_df <- tibble(x = seq(0, 100, length.out = 101),
	logits = seq(-4, 4, length.out = 101)) \|>
	mutate(odds = exp(logits)) \|>
	mutate(probs = plogis(logits))

	p1 <- ggplot(logit_df, aes(x = x, y = probs)) +
	from matplotlib import pyplot
	import random
	import time

	pyplot.style.use("ggplot")
	now = time.time()

	def generate_user(censor=now):
	# Pick some point in time the user was created
	t_created = t = now - random.random() * 1e7