Ed Summers edsu

## bagit.sh
#!/bin/bash

#
# The simplest way to create a valid BagIt bag?
#
# Usage: bagit.sh <dir_to_bag> <bag_dir>
#
# Note: you'll need to have md5deep installed:
# brew install md5deep
# apt-get install md5deep

## en.wav

      
              2 files
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                edsu
                / en.wav
            
            
              Last active
              March 29, 2024 12:22
            
              
                This seems to cause whisper to segfault on my MacBook Pro 2.4 GHz 8-Core Intel Core i9, Sonoma 14.4.1, Python 3.12.0
              
          
            View raw
        
    
## response.json
{
  "l": "1",
  "p": "https://lh3.googleusercontent.com/-XdUIqdMkCWA/AAAAAAAAAAI/AAAAAAAAAAA/4252rscbv5M/s64-c-mo/photo.jpg",
  "r": [
    {
      "t": "The Internet Archive and the socio-technical construction of historical facts",
      "u": "https://scholar.google.com/scholar_url?url=https://www.tandfonline.com/doi/abs/10.1080/24701475.2018.1455412&hl=en&sa=T&oi=gsr-r&ct=res&cd=0&d=3272375975175528132&ei=YBH7ZeXNA4Cb6rQPmrOdoA8&scisig=AFWwaeb_dRhXurIfWX0NXA2y4G9I",
      "x": "",
      "m": "A Ben-David, A Amram - Internet Histories, 2018",
      "s": "This article analyses the socio-technical epistemic processes behind the construction of historical facts by the Internet Archive Wayback Machine (IAWM). Grounded in theoretical debates in Science and Technology Studies about digital and algorithmic platforms as “black boxes”, this article uses provenance information and other data traces provided by the IAWM to uncover specific epistemic processes embedded at its back-end, through a case study on the archiv

## gist:c683a99d51d4faa26b4e18a466ba1b13

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                edsu
                / gist:c683a99d51d4faa26b4e18a466ba1b13
            
            
              Last active
              March 5, 2024 16:55
            
              
                GIS filenames
              
          
filename
count


data.zip
22397


data_EPSG_4326.zip
22397


preview.jpg
22397


index_map.json
147


Beechey_WGS.tif.xml
1


Beechey_WGS-iso19139.xml
1


Beechey_WGS-fgdc.xml
1


bathy20.txt
1


## wacz-images.py
#!/usr/bin/env python3

#
# usage: wacz-images.py <wacz_file>
#
# This program will extract images from the WARC files contained in a WACZ
# file and write them to the current working directory using the image's URL
# as a file location.
#
# You will need to `pip install warcio` for it to work.

## lcauthority.py
#!/usr/bin/env python3

"""
A small command line tool to get the JSON-LD for a Library of Congress authority
record by first looking up the authority as a string using the label lookup
service and then getting the JSON-LD for the authority and writing it out using
a JSON-LD frame where the SKOS is the default vocabulary.
"""

import sys

## mix.sh
# Concatenate two videos that have different resolutions.
#
# Each input's video stream goes through the same filter chain before
# joining: scale to fit inside 1280x720 without changing the aspect ratio,
# pad to exactly 1280x720 with the picture centered, and set the sample
# aspect ratio to 1. The concat filter then joins the two normalized video
# streams and the first audio stream of each input into one video and one
# audio output.

normalize='scale=1280:720:force_original_aspect_ratio=decrease,pad=1280:720:(ow-iw)/2:(oh-ih)/2,setsar=1'

ffmpeg \
  -i part1.mp4 \
  -i part2.mp4 \
  -filter_complex "[0]${normalize}[v0];[1]${normalize}[v1];[v0][0:a:0][v1][1:a:0]concat=n=2:v=1:a=1[v][a]" \
  -map "[v]" \
  -map "[a]" \
  out.mp4

## guess_doi.py
#!/usr/bin/env python3

import sys
import requests

title = sys.argv[1]
api_url = "https://api.crossref.org/works"

response = requests.get(api_url, params={"query.title": title})

## 2023-12-20.txt
[13] Sufjan Stevens - Javelin [Clash, The Fader, PopMatters, Pitchfork, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Paste, Mojo, Uncut, Piccadilly Records, Rough Trade]
[12] Kelela - Raven [Clash, The Fader, The Forty-Five, PopMatters, Pitchfork, Crack, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Paste, The Quietus]
[12] Wednesday - Rat Saw God [Clash, The Fader, The Forty-Five, PopMatters, Pitchfork, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Paste, Uncut, Rough Trade]
[11] Noname - Sundial [Clash, The Fader, The Forty-Five, The Wire, PopMatters, Pitchfork, Crack, The Line of Best Fit, Rolling Stone, Paste, The Quietus]
[9] Mitski - The Land Is Inhospitable and So Are We [Clash, The Fader, PopMatters, Pitchfork, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Mojo]
[9] Lankum - False Lankum [Clash, Concrete Islands, Crack, The Line of Best Fit, Fast 'n' Bulbous, Louder Than War, Mojo, Uncut, The Quietus]
[8] Amaarae - Fountain Baby [Clash, The Fader, T

## json_shapes.py
#!/usr/bin/env python3

import csv
import json
from collections import OrderedDict
from collections import Counter

def trace(data, shape=None):
    if isinstance(data, dict):
        new_dict = OrderedDict()
	#!/bin/bash

	#
	# The simplest way to create a valid BagIt bag?
	#
	# Usage: bagit.sh <dir_to_bag> <bag_dir>
	#
	# Note: you'll need to have md5deep installed:
	# brew install md5deep
	# apt-get install md5deep
	{
	"l": "1",
	"p": "https://lh3.googleusercontent.com/-XdUIqdMkCWA/AAAAAAAAAAI/AAAAAAAAAAA/4252rscbv5M/s64-c-mo/photo.jpg",
	"r": [
	{
	"t": "The Internet Archive and the socio-technical construction of historical facts",
	"u": "https://scholar.google.com/scholar_url?url=https://www.tandfonline.com/doi/abs/10.1080/24701475.2018.1455412&hl=en&sa=T&oi=gsr-r&ct=res&cd=0&d=3272375975175528132&ei=YBH7ZeXNA4Cb6rQPmrOdoA8&scisig=AFWwaeb_dRhXurIfWX0NXA2y4G9I",
	"x": "",
	"m": "A Ben-David, A Amram - Internet Histories, 2018",
	"s": "This article analyses the socio-technical epistemic processes behind the construction of historical facts by the Internet Archive Wayback Machine (IAWM). Grounded in theoretical debates in Science and Technology Studies about digital and algorithmic platforms as “black boxes”, this article uses provenance information and other data traces provided by the IAWM to uncover specific epistemic processes embedded at its back-end, through a case study on the archiv
filename	count
data.zip	22397
data_EPSG_4326.zip	22397
preview.jpg	22397
index_map.json	147
Beechey_WGS.tif.xml	1
Beechey_WGS-iso19139.xml	1
Beechey_WGS-fgdc.xml	1
bathy20.txt	1
	#!/usr/bin/env python3

	#
	# usage: wacz-images.py <wacz_file>
	#
	# This program will extract images from the WARC files contained in a WACZ
	# file and write them to the current working directory using the image's URL
	# as a file location.
	#
	# You will need to `pip install warcio` for it to work.
	#!/usr/bin/env python3

	"""
	A small command line tool to get the JSON-LD for a Library of Congress authority
	record by first looking up the authority as a string using the label lookup
	service and then getting the JSON-LD for the authority and writing it out using
	a JSON-LD frame where the SKOS is the default vocabulary.
	"""

	import sys
	# Concatenate two videos that have different resolutions.
	#
	# Each input's video stream goes through the same filter chain before
	# joining: scale to fit inside 1280x720 without changing the aspect ratio,
	# pad to exactly 1280x720 with the picture centered, and set the sample
	# aspect ratio to 1. The concat filter then joins the two normalized video
	# streams and the first audio stream of each input into one video and one
	# audio output.

	normalize='scale=1280:720:force_original_aspect_ratio=decrease,pad=1280:720:(ow-iw)/2:(oh-ih)/2,setsar=1'

	ffmpeg \
	  -i part1.mp4 \
	  -i part2.mp4 \
	  -filter_complex "[0]${normalize}[v0];[1]${normalize}[v1];[v0][0:a:0][v1][1:a:0]concat=n=2:v=1:a=1[v][a]" \
	  -map "[v]" \
	  -map "[a]" \
	  out.mp4
	#!/usr/bin/env python3

	import sys
	import requests

	title = sys.argv[1]
	api_url = "https://api.crossref.org/works"

	response = requests.get(api_url, params={"query.title": title})
	[13] Sufjan Stevens - Javelin [Clash, The Fader, PopMatters, Pitchfork, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Paste, Mojo, Uncut, Piccadilly Records, Rough Trade]
	[12] Kelela - Raven [Clash, The Fader, The Forty-Five, PopMatters, Pitchfork, Crack, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Paste, The Quietus]
	[12] Wednesday - Rat Saw God [Clash, The Fader, The Forty-Five, PopMatters, Pitchfork, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Paste, Uncut, Rough Trade]
	[11] Noname - Sundial [Clash, The Fader, The Forty-Five, The Wire, PopMatters, Pitchfork, Crack, The Line of Best Fit, Rolling Stone, Paste, The Quietus]
	[9] Mitski - The Land Is Inhospitable and So Are We [Clash, The Fader, PopMatters, Pitchfork, The Line of Best Fit, Consequence, Rolling Stone, Exclaim, Mojo]
	[9] Lankum - False Lankum [Clash, Concrete Islands, Crack, The Line of Best Fit, Fast 'n' Bulbous, Louder Than War, Mojo, Uncut, The Quietus]
	[8] Amaarae - Fountain Baby [Clash, The Fader, T
	#!/usr/bin/env python3

	import csv
	import json
	from collections import OrderedDict
	from collections import Counter

	def trace(data, shape=None):
	if isinstance(data, dict):
	new_dict = OrderedDict()