Skip to content

Instantly share code, notes, and snippets.

@eggplants
Last active June 19, 2019 17:28
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save eggplants/98ce48fe02c69b425ba1922511b46ee5 to your computer and use it in GitHub Desktop.
Save eggplants/98ce48fe02c69b425ba1922511b46ee5 to your computer and use it in GitHub Desktop.
# Input layout, as read by this parser: jbisc.txt holds one "KEY: value" field
# per line (KEY is upper-case ASCII letters), and a line consisting solely of
# "*" closes the current record.

# Field names that can occur several times within one record. Their values are
# collected into an Array instead of overwriting one another.
duplicate = %w(ISBN NOTE TITLEHEADING AUTHORHEADING)

# Build `data`: an Array with one Hash per record, mapping the field name
# (Symbol) to its value (String, or Array of Strings for repeatable fields).
data = []
record = {}
File.foreach('jbisc.txt').with_index(1) do |row, lineno|
  row.chomp!

  if row == '*'
    # Record terminator. Records without any field (e.g. consecutive "*"
    # lines) are not kept, so later stages never receive an empty record.
    data << record unless record.empty?
    record = {}
    next
  end

  field = row.match(/^([A-Z]+): /)
  unless field
    # Not a "KEY: value" line: blank lines are ignored silently, anything
    # else is reported on stderr instead of aborting the whole run.
    warn "jbisc.txt:#{lineno}: skipping line without a field name: #{row}" unless row.strip.empty?
    next
  end

  name = field[1]
  # Take everything after the leading "KEY: " prefix. String#delete must not be
  # used for this: it removes every occurrence of each listed character from
  # the whole line, which corrupts the value.
  value = field.post_match

  if duplicate.include?(name)
    (record[name.to_sym] ||= []) << value
  else
    record[name.to_sym] = value
  end
end
# Keep the last record even when the file does not end with a "*" line.
data << record unless record.empty?
# Serialization: turn every parsed record in `data` into one pipe-delimited
# line (terminated by "\n") and collect the lines in `out`.
#
# Column order: NBC, ISBN, TR (title|author), PUB (publisher|date), ED, PHYS,
# SERIES, NOTE, TITLEHEADING, AUTHORHEADING, HOLDINGSRECORD, HOLDINGPHYS,
# HOLDINGLOC. Repeatable fields are joined with ">". Missing fields become
# empty columns instead of raising on nil.
out = data.map do |dic|
  # Repeatable fields arrive as an Array (or nil when absent).
  multi = ->(name) { Array(dic[name]).join('>') }

  # TR is split into two columns at the first "/"; whitespace around the
  # separator is dropped. Without a "/" an empty second column is appended.
  title_author = dic[:TR].to_s
  title_author =
    if title_author.include?('/')
      title_author.sub(%r{\s*/\s*}, '|')
    else
      "#{title_author}|"
    end

  # PUB is split into two columns at the first ","; like TR, it is padded with
  # an empty second column when there is no separator, so that every line has
  # the same number of columns.
  pub = dic[:PUB].to_s
  pub =
    if pub.include?(',')
      pub.sub(/\s*,\s*/, '|')
    else
      "#{pub}|"
    end
  # Normalize the date part:
  #   - a trailing bracketed date such as "[2004]" or "[2004.8]" loses its brackets;
  #   - a "c" directly in front of a digit (as in "c2004") is removed, leaving
  #     other "c" characters in the field alone;
  #   - the first "印刷" is removed.
  pub = pub.sub(/\[(\d{4}(?:\.\d{1,2})?)\]\z/, '\1')
           .sub(/c(?=\d)/, '')
           .sub('印刷', '')

  [
    dic[:NBC],
    multi.call(:ISBN),
    title_author,
    pub,
    dic[:ED],
    dic[:PHYS],
    dic[:SERIES],
    multi.call(:NOTE),
    multi.call(:TITLEHEADING),
    multi.call(:AUTHORHEADING),
    dic[:HOLDINGSRECORD],
    dic[:HOLDINGPHYS],
    dic[:HOLDINGLOC]
  ].join('|') << "\n"
end
# Print every serialized line in `out` to stdout after escaping double quotes.
out.each do |line|
  # Double each double quote.
  escaped = line.gsub('"', '""')

  # On lines where a column starts with a quote (`|""` after doubling), rewrite
  # each doubled-quote pair as Japanese corner brackets around the quoted text.
  # NOTE(review): presumably this keeps a leading quote from being read as the
  # start of a quoted field by the importer -- confirm.
  # The replacement must be single-quoted: in a double-quoted literal "\1" is
  # the octal escape U+0001, not a backreference to the captured text.
  escaped = escaped.gsub(/""(.*?)""/, '「\1」') if escaped.include?('|""')

  puts escaped
end
-- Table for bibliographic records, keyed by NBC.
-- NOTE(review): the 15 columns line up, in order, with the pipe-delimited
-- columns printed by the Ruby script above (TR split into TITLE/AUTH, PUB split
-- into PUB/PUBDATE), so this looks like its import target -- confirm.
CREATE TABLE bibdata(
  NBC            TEXT PRIMARY KEY,
  ISBN           TEXT,  -- the script joins repeated values with ">"
  TITLE          TEXT,  -- part of the script's TR field before the first "/"
  AUTH           TEXT,  -- part of the script's TR field after the first "/"
  PUB            TEXT,  -- part of the script's PUB field before the first ","
  PUBDATE        TEXT,  -- part of the script's PUB field after the first ","
  ED             TEXT,
  PHYS           TEXT,
  SERIES         TEXT,
  NOTE           TEXT,  -- the script joins repeated values with ">"
  TITLEHEADING   TEXT,  -- the script joins repeated values with ">"
  AUTHORHEADING  TEXT,  -- the script joins repeated values with ">"
  HOLDINGSRECORD TEXT,
  HOLDINGPHYS    TEXT,
  HOLDINGLOC     TEXT
);
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment