137 lines
5.3 KiB
Python
137 lines
5.3 KiB
Python
try:
|
|
# For Python 3.0 and later
|
|
from urllib.request import urlopen,URLError
|
|
except ImportError:
|
|
# Fall back to Python 2's urllib2
|
|
from urllib2 import urlopen,URLError
|
|
from json import loads,dumps
|
|
from socket import timeout
|
|
|
|
""" Library Book Type Description:
|
|
The book is a dictionary of the form { string : a, ... }
|
|
|
|
Keys:
|
|
required: (ideally)
|
|
title - Book/Article title
|
|
publisher - string containing semi-colon separated list eg. "UW Press; CSC, inc."
|
|
authors - as above. each name is of the form "First Initials. Last" eg. "Calum T. Dalek; Conan T.B. Ladan"
|
|
optional:
|
|
subtitle - string
|
|
edition - integer
|
|
isbn - integer (it's preferred to use the isbn-13 rather than isbn-10)
|
|
lccn - integer: library of congress catalogue number
|
|
publish date - string of date (to make things easier to code/catalogue (won't be stored)
|
|
publish year - int (this kind of thing will have to be confirmed by cataloguer)
|
|
publish month - int
|
|
publish location - like publisher
|
|
|
|
pages - integer - just the number of pages
|
|
pagination - string eg. "xviii, 1327-1850"
|
|
weight - string (purely for interest's sake eg. "3lb." or "3 pounds"
|
|
categories - list of strings?
|
|
"""
|
|
|
|
|
|
# look up data from openlibrary.org using isbn
|
|
def openLibrary_isbn(ISBN):
|
|
isbn = str(ISBN)
|
|
try:
|
|
jsondata = urlopen("http://openlibrary.org/api/books"
|
|
"?format=json&jscmd=data&bibkeys=ISBN:"+isbn,
|
|
timeout=3)
|
|
except URLError as e:
|
|
return {'title':e}
|
|
except timeout:
|
|
return {'title':'Timeout while connecting to OpenLibrary.org'}
|
|
openBook = loads(jsondata.read().decode('utf-8'))
|
|
if "ISBN:"+isbn not in openBook:
|
|
return {'isbn':isbn,'title':'Book not found'}
|
|
openBook = openBook["ISBN:"+isbn]
|
|
# create my custom dict for books with the info we want.
|
|
book = dict({"isbn" : isbn})
|
|
book["title"]=openBook["title"]
|
|
book["authors"]=""
|
|
if "authors" in openBook:
|
|
for v in openBook["authors"]:
|
|
book['authors'] += "; " + v['name']
|
|
book['authors'] = book['authors'][2:]
|
|
book["publisher"]=""
|
|
if "publishers" in openBook:
|
|
for v in openBook["publishers"]:
|
|
book["publisher"] += "; " + v['name']
|
|
book['publisher'] = book['publisher'][2:]
|
|
if "publish_places" in openBook:
|
|
book["publish location"]=""
|
|
for v in openBook["publish_places"]:
|
|
book["publish location"] += "; " + v['name']
|
|
book['publish location'] = book['publish location'][2:]
|
|
|
|
# for lccn, there maybe be multiple values in the query. I'm just taking
|
|
# the first, but the full list may be useful
|
|
if "lccn" in openBook['identifiers']:
|
|
book["lccn"]=int(openBook['identifiers']['lccn'][0])
|
|
if "publish_date" in openBook:
|
|
book['publish date']=openBook['publish_date']
|
|
#code to pull out year and month (hopefully)
|
|
if "number_of_pages" in openBook:
|
|
book["pages"]=openBook["number_of_pages"]
|
|
if "pagination" in openBook:
|
|
book["pagination"]=openBook["pagination"]
|
|
if "weight" in openBook:
|
|
book["weight"]=openBook["weight"]
|
|
if "subtitle" in openBook:
|
|
book["subtitle"]=openBook["subtitle"]
|
|
return book
|
|
|
|
# look up data from openlibrary.org using lccn
|
|
def openLibrary_lccn(LCCN):
|
|
lccn = str(LCCN)
|
|
try:
|
|
jsondata = urlopen("http://openlibrary.org/api/books"
|
|
"?format=json&jscmd=data&bibkeys=lccn:"+lccn,
|
|
timeout=3)
|
|
except URLError:
|
|
return {}
|
|
openBook = loads(jsondata.read().decode('utf-8'))
|
|
if "lccn:"+lccn not in openBook:
|
|
return {'lccn':lccn,'title':'Book not found'}
|
|
openBook = openBook["lccn:"+lccn]
|
|
# create my custom dict for books with the info we want.
|
|
book = {"lccn" : lccn}
|
|
book["title"]=openBook["title"]
|
|
book["authors"]=""
|
|
if "authors" in openBook:
|
|
for v in openBook["authors"]:
|
|
book['authors'] += "; " + v['name']
|
|
book['authors'] = book['authors'][2:]
|
|
book["publisher"]=""
|
|
if "publishers" in openBook:
|
|
for v in openBook["publishers"]:
|
|
book["publisher"] += "; " + v['name']
|
|
book['publisher'] = book['publisher'][2:]
|
|
if "publish_places" in openBook:
|
|
book["publish location"]=""
|
|
for v in openBook["publish_places"]:
|
|
book["publish location"] += "; " + v['name']
|
|
book['publish location'] = book['publish location'][2:]
|
|
|
|
# for isbn, there maybe be multiple values in the query. I'm just taking
|
|
# the first, but the full list may be useful
|
|
# There are also ISBN's that have non-number values :(
|
|
if "isbn_10" in openBook['identifiers']:
|
|
book["isbn"]=openBook['identifiers']['isbn_10'][0]
|
|
if "isbn_13" in openBook['identifiers']:
|
|
book["isbn"]=openBook['identifiers']['isbn_13'][0]
|
|
if "publish_date" in openBook:
|
|
book['publish date']=openBook['publish_date']
|
|
#code to pull out year and month (hopefully)
|
|
if "number_of_pages" in openBook:
|
|
book["pages"]=openBook["number_of_pages"]
|
|
if "pagination" in openBook:
|
|
book["pagination"]=openBook["pagination"]
|
|
if "weight" in openBook:
|
|
book["weight"]=openBook["weight"]
|
|
if "subtitle" in openBook:
|
|
book["subtitle"]=openBook["subtitle"]
|
|
return book
|