- try installing llama-cpp-python and llama-cpp-python[server] from pip ... WITH the ggml-metal.metal file (i.e. WITH Metal GPU support) in the Python executable directory
- from the previous test, llama-cpp-python[server] FAILS
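A sketch of what that install can look like, assuming the CMAKE_ARGS route llama-cpp-python uses for source builds (the Metal flag name has changed between versions, and the model path below is a placeholder):

# build from source with Metal enabled (flag name varies by llama-cpp-python / llama.cpp version)
CMAKE_ARGS="-DLLAMA_METAL=on" pip install --force-reinstall --no-cache-dir llama-cpp-python
pip install 'llama-cpp-python[server]'
# offload layers to the GPU when serving a model
python3 -m llama_cpp.server --model ./models/model.gguf --n_gpu_layers 1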
# Download the appropriate armv6l build from https://unofficial-builds.nodejs.org/download/release/, for example:
wget https://unofficial-builds.nodejs.org/download/release/v18.9.1/node-v18.9.1-linux-armv6l.tar.gz
tar -xzf node-v18.9.1-linux-armv6l.tar.gz
cd node-v18.9.1-linux-armv6l
sudo cp -R * /usr/local
node -v
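If the copy worked, node and the npm bundled in the same tarball should both resolve from /usr/local:

npm -v
which node npm   # both should point under /usr/local/bin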
export AZ_MAIN_NAME=Kube2
export AZ_RG=RG_$AZ_MAIN_NAME
export AZ_VNET=VNET_$AZ_MAIN_NAME
export AZ_IP=Public_IP_$AZ_MAIN_NAME
export AZ_SUBNET=Subnet_$AZ_MAIN_NAME
export AZ_NSG=NetworkSecurityGroup_$AZ_MAIN_NAME
export AZ_NAME=VM_$AZ_MAIN_NAME
export AZ_NIC=NIC_$AZ_MAIN_NAME
env | grep AZ
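A sketch of how these names could then be fed to the Azure CLI to stand up the VM, assuming everything is created from scratch (the location and image alias are placeholders):

az group create --name $AZ_RG --location westeurope
az network vnet create --resource-group $AZ_RG --name $AZ_VNET --subnet-name $AZ_SUBNET
az network public-ip create --resource-group $AZ_RG --name $AZ_IP
az network nsg create --resource-group $AZ_RG --name $AZ_NSG
az network nic create --resource-group $AZ_RG --name $AZ_NIC --vnet-name $AZ_VNET --subnet $AZ_SUBNET \
  --network-security-group $AZ_NSG --public-ip-address $AZ_IP
az vm create --resource-group $AZ_RG --name $AZ_NAME --nics $AZ_NIC --image Ubuntu2204 --generate-ssh-keys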
sudo systemctl stop [servicename]
sudo systemctl disable [servicename]
#rm /etc/systemd/system/[servicename].service
#rm any symlinks under /etc/systemd/system that might be related to [servicename]
sudo systemctl daemon-reload
sudo systemctl reset-failed
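Before removing unit files by hand, it can help to see what systemd still has on disk; a quick check for a hypothetical unit named myservice:

# does systemd still list the unit?
systemctl list-unit-files | grep myservice
# find the unit file and any leftover symlinks under /etc/systemd/system
sudo find /etc/systemd/system -name 'myservice*'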
from time import sleep
import ssl
import json
import os
from paho.mqtt.client import Client

username = "your VRM email"
password = "your VRM password"
portal_id = "your VRM portal ID"

# Assumption: broker index follows Victron's published scheme (sum of portal id chars % 128)
broker = "mqtt{}.victronenergy.com".format(sum(ord(c) for c in portal_id.lower().strip()) % 128)
client = Client()  # paho-mqtt 1.x constructor; 2.x also needs a CallbackAPIVersion argument
client.username_pw_set(username, password)
client.tls_set(cert_reqs=ssl.CERT_REQUIRED)  # VRM MQTT uses TLS on port 8883
client.connect(broker, 8883)
{
  "name": "My New Config Preset",
  "load_params": {
    "n_ctx": 1500,
    "n_batch": 512,
    "rope_freq_base": 10000,
    "rope_freq_scale": 1,
    "n_gpu_layers": 1,
    "use_mlock": true,
    "main_gpu": 0,
# BTW: we are running in an nvidia/cuda:11.x.x-devel-ubuntu22.04 container
# install some extra Ubuntu packages
apt install -y unzip libopenblas-dev nano git-lfs aria2 jq build-essential python3 python3-pip git
pip install --upgrade pip setuptools wheel
# clone the llama.cpp repo
cd /workspace
git clone https://github.com/ggerganov/llama.cpp.git
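A plausible next step is building with CUDA enabled; this sketch assumes the checkout still supports the Makefile CUDA path from the CUDA 11 era (newer trees build with cmake and a GGML_CUDA option instead):

cd llama.cpp
make -j LLAMA_CUBLAS=1
# sanity check that the binary was produced
./main --help | head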