aaronjolson / llamaindex_activeloop_vectorize_data_from_github.py
Last active February 20, 2024 13:36
Code for using llama-index to load GitHub data into the Activeloop Deep Lake vector database. Originally from this course: https://learn.activeloop.ai/courses/take/rag/multimedia/51349127-chat-with-your-code-llamaindex-and-activeloop-deep-lake-for-github-repositories. The imports have been modified to work with the latest version of llama-index.
'''
In .env file:
GITHUB_TOKEN="YOUR_GH_CLASSIC_TOKEN"
OPENAI_API_KEY="YOUR_OPENAI_KEY"
ACTIVELOOP_TOKEN="YOUR_ACTIVELOOP_TOKEN"
DATASET_PATH="hub://YOUR_ORG/repository_vector_store"

Requires: llama-index >= 0.10.0, python-dotenv, llama-index-readers-github >= 0.1.5
'''
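The gist loads these variables from the .env file via python-dotenv. As a stdlib-only illustration of what that load amounts to (a hypothetical helper, not part of the gist), the file can be parsed like this:

```python
import os

def load_env_file(path=".env"):
    # Minimal stand-in for python-dotenv's load_dotenv: parse KEY="VALUE"
    # lines and export them, without overwriting variables already set.
    with open(path) as fh:
        for line in fh:
            line = line.strip()
            if not line or line.startswith("#") or "=" not in line:
                continue
            key, _, value = line.partition("=")
            os.environ.setdefault(key.strip(), value.strip().strip('"'))
```

In practice python-dotenv's `load_dotenv()` handles more edge cases (quoting, interpolation), so this is only a sketch of the mechanism.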
jrknox1977 / ollama_dspy.py
Created February 9, 2024 18:06
ollama+DSPy using OpenAI APIs.
# install DSPy: pip install dspy
import dspy

# Ollama is now compatible with OpenAI APIs.
#
# To get this to work you must include `model_type='chat'` in the `dspy.OpenAI` call;
# without it you will get an error.
#
# I have also found that `stop='\n\n'` is required to get the model to stop
# generating text after the answer is complete, at least with mistral.
ollama_mistral = dspy.OpenAI(
    api_base='http://localhost:11434/v1/',  # Ollama's local OpenAI-compatible endpoint
    api_key='ollama',                       # any non-empty string works for Ollama
    model='mistral',
    model_type='chat',
    stop='\n\n',
)
dspy.settings.configure(lm=ollama_mistral)
kglspl / h5fsutil.py
Created January 8, 2024 17:54
Easier interface to h5py datasets
import h5py

# Copyright (c) 2023 kglspl
# MIT License (the same as: https://github.com/kglspl/ppmparser/blob/master/LICENSE)


class H5FS(object):
    """Thin convenience wrapper around an h5py.File and a single dataset."""

    def __init__(self, filename, mode):
        self.filename = filename
        self.f = h5py.File(filename, mode)
        self.dset = None  # bound to a dataset on first use

    def close(self):
        self.f.close()
        self.dset = None
kupietools / Docker Desktop v 4.0.0 thru 4.22.1 direct download links
Last active July 21, 2024 10:07
List of direct download links for Docker Desktop from version 4.0.0 (released 2021-08-31) through 4.22.1 (released 2023-08-24), as archived on archive.org
jneuff / fix-tokenizer.rs
Created October 17, 2023 11:35
Fix a huggingface tokenizer to which tokens have been added after training
/// Fix a huggingface tokenizer to which tokens have been added after training.
///
/// Adding tokens after training via `add_special_tokens` leads to them being added to the
/// `added_tokens` section but not to the `model.vocab` section. This yields warnings like:
/// ```
/// [2023-10-17T07:54:05Z WARN tokenizers::tokenizer::serialization] Warning: Token '<|empty_usable_token_space_1023|>' was expected to have ID '129023' but was given ID 'None'
/// ```
/// The code in this file ensures that all tokens from `added_tokens` are also placed into
/// `model.vocab`. This fixes the warning and does not change the tokenizer's behavior.
claysauruswrecks / requirements.txt
Last active April 7, 2024 16:32
Example using LlamaHub loaders to index GitHub repos into LlamaIndex and query GPTSimpleVectorIndex with GPT-4
# main
llama-index
langchain
mblondel / kernel_kmeans.py
Last active January 4, 2024 11:45
Kernel K-means.
"""Kernel K-means"""
# Author: Mathieu Blondel <mathieu@mblondel.org>
# License: BSD 3 clause
import numpy as np
from sklearn.base import BaseEstimator, ClusterMixin
from sklearn.metrics.pairwise import pairwise_kernels
from sklearn.utils import check_random_state
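The listing truncates the gist at its imports. As a NumPy-only sketch of the core kernel k-means update (a simplified stand-in, not Blondel's scikit-learn-style estimator), each point is reassigned by its implicit feature-space distance to every cluster mean:

```python
import numpy as np

def kernel_kmeans(K, n_clusters, labels_init, n_iter=100):
    # K: (n, n) precomputed kernel matrix (e.g. from pairwise_kernels).
    # Distance of point i to the mean of cluster c in feature space:
    # ||phi(x_i) - mu_c||^2 = K_ii - 2/|c| * sum_{j in c} K_ij
    #                              + 1/|c|^2 * sum_{j,l in c} K_jl
    labels = np.asarray(labels_init).copy()
    n = K.shape[0]
    for _ in range(n_iter):
        dist = np.full((n, n_clusters), np.inf)
        for c in range(n_clusters):
            mask = labels == c
            m = mask.sum()
            if m == 0:
                continue  # empty clusters stay at infinite distance
            dist[:, c] = (np.diag(K)
                          - 2.0 * K[:, mask].sum(axis=1) / m
                          + K[np.ix_(mask, mask)].sum() / m ** 2)
        new_labels = dist.argmin(axis=1)
        if np.array_equal(new_labels, labels):
            break  # assignments stable: converged
        labels = new_labels
    return labels
```

With a linear kernel (`K = X @ X.T`) this reduces to ordinary k-means; the full gist adds sample weighting, random initialization, and the scikit-learn estimator interface.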
MohamedAlaa / tmux-cheatsheet.markdown
Last active July 26, 2024 12:21
tmux shortcuts & cheatsheet
start new:

tmux

start new with session name:

tmux new -s myname