Jacob Chapman chapmanjacobd

## titles.nd.js
Array.from(document.querySelectorAll('.title')).map(e => e.innerText).join('\n');

## html2sqlite.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              2 stars
            
          
                chapmanjacobd
                / html2sqlite.md
            
            
              Last active
              May 2, 2024 11:48
            
          
    Have you ever wanted to do:
SELECT * FROM www.google.com

With BigQuery you kind of can. But have you ever wanted to do:
SELECT * FROM www.wikipedia.com

With Wikidata Query Service you kind of can (semantic web!, RDF!?, https://www.w3.org/wiki/SparqlImplementations).

  
## HtmlList.py

class HtmlList:
    def __init__(self):
        self.tree = []
        self.xpath = []

    def resolve_parents(self, el) -> list:
        if el.parent is None:
            return self.xpath
        else:

## artsearch.py wip
import argparse, re, webbrowser

from xklb.utils import web


def search_art(term):
    search_url = f"https://artsandculture.google.com/search?q={term.replace(' ', '+')}"
    response = web.requests_session().get(search_url)

    if response.status_code == 200:

## eda sqlite example
$ lb eda temp.db -L inf

## temp.db:playlists
### Shape

(1, 8)

### Sample of rows

|    |   id |   time_modified |   time_deleted | extractor_config   | extractor_key   | path          |   time_created |   hours_update_delay |

## cover_scan.py
def cover_scan(media_duration, scan_percentage):
    """Plan a set of scan start offsets spread across a media duration.

    NOTE(review): this snippet appears to be cut off -- nothing is returned in
    the visible lines, so how ``scans`` and ``scan_duration`` are consumed
    cannot be confirmed from here.

    Args:
        media_duration: Total length of the media (presumably seconds -- TODO
            confirm). It is passed to ``math.log``, so it must be positive.
        scan_percentage: Share of the duration to cover, treated as a
            percentage (it is divided by 100 below).
    """
    # At least two scans; the count grows with log(duration) * (percentage / 10).
    num_scans = max(2, int(math.log(media_duration) * (scan_percentage / 10)))
    # Total scanning budget: scan_percentage percent of the duration, at least 1.
    scan_duration_total = max(1, media_duration * (scan_percentage / 100))
    # Length of each scan: an equal integer share of the budget, at least 1.
    scan_duration = max(1, int(scan_duration_total / num_scans))
    # Distance between consecutive scan start points.
    scan_interval = media_duration / num_scans

    # Integer start offsets, de-duplicated and sorted ascending.
    scans = sorted(set(int(scan * scan_interval) for scan in range(num_scans)))
    # When the last start lies more than two scan lengths before the end, add a
    # final scan that starts one scan length before the end of the media.
    if scans[-1] < media_duration - (scan_duration * 2):
        scans.append(math.floor(media_duration - scan_duration))

## get_file_part.py

def get_file_part(file_path, specifier):
    size = file_path.stat().st_size

    if specifier.isdigit():
        specifier = int(specifier)
        if specifier > 0:
            with file_path.open('rb') as file:
                return file.read(specifier)
        else:

## merge.py
def compare_stats(destination_files, destination_folders, source_files, source_empty_folders):
    """Classify source paths relative to what already exists at the destination.

    NOTE(review): this snippet appears to be cut off -- no return statement is
    visible, so the shape of the result cannot be confirmed from here.

    All four arguments are combined with set operators (``-``, ``&``, ``|``),
    so they are expected to be sets. Elements of ``source_files`` and
    ``destination_files`` must expose a ``.parent`` attribute (presumably
    ``pathlib`` paths -- TODO confirm against the caller).
    """
    # Empty source folders that are not already among the destination folders.
    new_empty_folders = source_empty_folders - destination_folders

    # Parent directories of the files on each side.
    source_dirs = {p.parent for p in source_files}
    destination_dirs = {p.parent for p in destination_files}
    # Directories that contain source files but no destination files.
    new_directories = source_dirs - destination_dirs

    # Paths present only in the source.
    new_files = source_files - destination_files
    # Paths present on both sides.
    replaced_files = source_files & destination_files
    # NOTE(review): replaced_files is already a subset of both operands, so
    # intersecting it with their union yields replaced_files again -- confirm
    # what "trumped" was meant to select.
    trumped_files = replaced_files.intersection(source_files | destination_files)

## ffprobe_class.py
class FFProbe:
    """Run the ``ffprobe`` command on a path and parse its JSON output.

    NOTE(review): this snippet appears to be cut off -- the parsed result ``d``
    is not used in the visible lines, so how it is exposed on the instance
    cannot be confirmed from here.
    """
    def __init__(self, path, *args):
        """Invoke ``ffprobe`` for ``path`` and decode the JSON it prints.

        Args:
            path: Target to probe; passed as the last command-line argument.
            *args: Extra command-line arguments, inserted before ``path``.

        Raises:
            RuntimeError: If ``ffprobe`` exits with a non-zero status; the
                exception carries the captured stdout and stderr bytes.
        """
        # Ask for format, stream and chapter information, serialized as JSON.
        args = ["ffprobe", "-show_format", "-show_streams", "-show_chapters", "-of", "json", *args, path]
        p = subprocess.Popen(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE)

        # communicate() reads both pipes to EOF and waits for the process to exit.
        out, err = p.communicate()
        if p.returncode != 0:
            raise RuntimeError(out, err)
        # stdout is decoded as UTF-8 and parsed as JSON.
        d = json.loads(out.decode("utf-8"))

## btrfs_raid1_metadata_ENOSPC.txt
kern  :info  : [  +0.000006] BTRFS info (device sde: state A): dumping space info:
kern  :info  : [  +0.000006] BTRFS info (device sde: state A): space_info DATA has 142864384 free, is not full
kern  :info  : [  +0.000006] BTRFS info (device sde: state A): space_info total=9971804340224, used=9688658702336, pinned=283002445824, reserved=0, may_use=0, readonly=327680 zone_unusable=0
kern  :info  : [  +0.000009] BTRFS info (device sde: state A): space_info METADATA has 0 free, is full
kern  :info  : [  +0.000005] BTRFS info (device sde: state A): space_info total=15032385536, used=14061862912, pinned=329777152, reserved=640679936, may_use=0, readonly

	class HtmlList:
	def __init__(self):
	self.tree = []
	self.xpath = []

	def resolve_parents(self, el) -> list:
	if el.parent is None:
	return self.xpath
	else:
	import argparse, re, webbrowser

	from xklb.utils import web


	def search_art(term):
	search_url = f"https://artsandculture.google.com/search?q={term.replace(' ', '+')}"
	response = web.requests_session().get(search_url)

	if response.status_code == 200:
	$ lb eda temp.db -L inf

	## temp.db:playlists
	### Shape

	(1, 8)

	### Sample of rows

	\| \| id \| time_modified \| time_deleted \| extractor_config \| extractor_key \| path \| time_created \| hours_update_delay \|
	def cover_scan(media_duration, scan_percentage):
	num_scans = max(2, int(math.log(media_duration) * (scan_percentage / 10)))
	scan_duration_total = max(1, media_duration * (scan_percentage / 100))
	scan_duration = max(1, int(scan_duration_total / num_scans))
	scan_interval = media_duration / num_scans

	scans = sorted(set(int(scan * scan_interval) for scan in range(num_scans)))
	if scans[-1] < media_duration - (scan_duration * 2):
	scans.append(math.floor(media_duration - scan_duration))

	def get_file_part(file_path, specifier):
	size = file_path.stat().st_size

	if specifier.isdigit():
	specifier = int(specifier)
	if specifier > 0:
	with file_path.open('rb') as file:
	return file.read(specifier)
	else:
	def compare_stats(destination_files, destination_folders, source_files, source_empty_folders):
	new_empty_folders = source_empty_folders - destination_folders

	source_dirs = {p.parent for p in source_files}
	destination_dirs = {p.parent for p in destination_files}
	new_directories = source_dirs - destination_dirs

	new_files = source_files - destination_files
	replaced_files = source_files & destination_files
	trumped_files = replaced_files.intersection(source_files \| destination_files)
	class FFProbe:
	def __init__(self, path, *args):
	args = ["ffprobe", "-show_format", "-show_streams", "-show_chapters", "-of", "json", *args, path]
	p = subprocess.Popen(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE)

	out, err = p.communicate()
	if p.returncode != 0:
	raise RuntimeError(out, err)
	d = json.loads(out.decode("utf-8"))
	kern :info : [ +0.000006] BTRFS info (device sde: state A): dumping space info:
	kern :info : [ +0.000006] BTRFS info (device sde: state A): space_info DATA has 142864384 free, is not full
	kern :info : [ +0.000006] BTRFS info (device sde: state A): space_info total=9971804340224, used=9688658702336, pinned=283002445824, reserved=0, may_use=0, readonly=327680 zone_unusable=0
	kern :info : [ +0.000009] BTRFS info (device sde: state A): space_info METADATA has 0 free, is full
	kern :info : [ +0.000005] BTRFS info (device sde: state A): space_info total=15032385536, used=14061862912, pinned=329777152, reserved=640679936, may_use=0, readonly