Goals: Add links to reasonable, good explanations of how stuff works. No hype and no vendor content if possible. Practical first-hand accounts of models in prod are eagerly sought.
![Screenshot 2023-12-18 at 10 40 27 PM](https://private-user-images.githubusercontent.com/3837836/291468646-4c30ad72-76ee-4939-a5fb-16b570d38cf2.png?jwt=eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJpc3MiOiJnaXRodWIuY29tIiwiYXVkIjoicmF3LmdpdGh1YnVzZXJjb250ZW50LmNvbSIsImtleSI6ImtleTUiLCJleHAiOjE3MTk2MzI4MjksIm5iZiI6MTcxOTYzMjUyOSwicGF0aCI6Ii8zODM3ODM2LzI5MTQ2ODY0Ni00YzMwYWQ3Mi03NmVlLTQ5MzktYTVmYi0xNmI1NzBkMzhjZjIucG5nP1gtQW16LUFsZ29yaXRobT1BV1M0LUhNQUMtU0hBMjU2JlgtQW16LUNyZWRlbnRpYWw9QUtJQVZDT0RZTFNBNTNQUUs0WkElMkYyMDI0MDYyOSUyRnVzLWVhc3QtMSUyRnMzJTJGYXdzNF9yZXF1ZXN0JlgtQW16LURhdGU9MjAyNDA2MjlUMDM0MjA5WiZYLUFtei1FeHBpcmVzPTMwMCZYLUFtei1TaWduYXR1cmU9YjhhNmMwY2UyOTE5YTc4NDIwODQ4Y2Y2NzdlZjY1NmYxN2MxMmY0MjJlN2U0MmI5OWQ0N2Y4MWYxZTlkM2I1ZCZYLUFtei1TaWduZWRIZWFkZXJzPWhvc3QmYWN0b3JfaWQ9MCZrZXlfaWQ9MCZyZXBvX2lkPTAifQ.sX1mRcnd050ytQEmLorDTc0aDpdaJOY8dv2qtkKuCvs)
# | |
# this is adapted from https://github.com/facebookresearch/llama/blob/main/llama/generation.py#L213 | |
# the tokenizer is replaced with ord() to make it easier to see what's actually happening | |
from typing_extensions import TypedDict, Literal | |
from typing import List, Optional | |
Role = Literal["system", "user", "assistant"] | |
class Message(TypedDict): |
I am no longer able to monitor this post, so I have decided to move everything to my personal blog for better monitoring.
Please click here to access the full post
import baker | |
import json | |
import os | |
from cytoolz import merge, join, groupby | |
from cytoolz.compatibility import iteritems | |
from cytoolz.curried import update_in | |
from itertools import starmap | |
from collections import deque | |
from lxml import etree, objectify | |
from scipy.io import savemat |
""" | |
this code is not mine! i shamelessly copied it from http://stackoverflow.com/questions/19790188/expanding-english-language-contractions-in-python | |
all credits go to alko and arturomp @ stack overflow. | |
basically, it's a big find/replace. | |
""" | |
import re | |
cList = { | |
"ain't": "am not", |
As configured in my dotfiles.
start new:
tmux
start new with session name: