2021-08-17 19:23:45 -04:00
|
|
|
#!/usr/bin/env python2
|
2010-03-07 12:28:33 -05:00
|
|
|
"""make-index.py
|
|
|
|
|
|
|
|
Generates a nice index of the directories from a
|
|
|
|
template.
|
|
|
|
|
|
|
|
Original Author: Jeremy Roman <jbroman@csclub.uwaterloo.ca>
|
2021-08-17 19:23:45 -04:00
|
|
|
Modified by: Zachary Seguin <ztseguin@csclub.uwaterloo.ca>
|
2010-03-07 12:28:33 -05:00
|
|
|
|
|
|
|
So if you don't like how I did something,
|
|
|
|
I'm the person you get to complain to.
|
|
|
|
Please be gentle.
|
|
|
|
"""
|
|
|
|
|
|
|
|
import os, sys, time
|
|
|
|
from subprocess import Popen, PIPE
|
|
|
|
from optparse import OptionParser
|
|
|
|
import yaml, mako.exceptions, webhelpers.html.tags
|
|
|
|
from mako.template import Template
|
2021-08-17 19:23:45 -04:00
|
|
|
import humanize
|
|
|
|
import datetime
|
|
|
|
|
|
|
|
def parse_size(s):
    """Convert a size string such as "1.5T", "20G" or "512" into bytes.

    A trailing "T", "G", "M" or "K" scales the leading number by the
    matching decimal power of 1000.  A string with none of those suffixes
    is taken to be a plain number.

    Returns the size as a float.  Raises ValueError when the numeric part
    cannot be parsed by float().

    NOTE(review): the multipliers are decimal (1000-based).  The caller
    feeds this the human-readable output of ``zfs get``, which presumably
    uses 1024-based units -- confirm, or switch the caller to ``zfs get -p``
    to obtain exact byte counts.
    """
    # Largest unit first purely for readability; suffixes are single,
    # distinct characters so the order does not affect the result.
    units = (
        ("T", 1000 ** 4),
        ("G", 1000 ** 3),
        ("M", 1000 ** 2),
        ("K", 1000),
    )

    for suffix, factor in units:
        if s.endswith(suffix):
            return float(s[:-1]) * factor

    # No recognised suffix: the value is already a plain number.  (The
    # previous code referenced an undefined name here and raised NameError.)
    return float(s)
|
2010-03-07 12:28:33 -05:00
|
|
|
|
|
|
|
def reformat_size(size):
    """Return the byte count *size* as a human-readable string.

    The formatting is delegated entirely to humanize.naturalsize().
    """
    readable = humanize.naturalsize(size)
    return readable
|
2010-03-07 12:28:33 -05:00
|
|
|
|
|
|
|
def atomic_write(filename, body):
    """Atomically replace *filename* with *body* followed by a newline.

    The data is first written to a temporary file in the same directory
    (named "<filename>.<pid>.tmp"), flushed and fsync'ed, and then renamed
    over the destination.  The containing directory is fsync'ed afterwards.
    This ensures that partial files are never seen by clients.

    If anything fails before the rename completes, the temporary file is
    removed and the exception is propagated; the directory descriptor is
    always closed.

    filename -- path of the file to replace
    body     -- string to write
    """
    # generate an appropriate temporary filename in the same directory,
    # so that the rename below never crosses a filesystem boundary
    tmp_filename = "%s.%d.tmp" % (filename, os.getpid())

    # open the directory so that we can fsync it; a bare filename has an
    # empty dirname, which means the current directory
    parent = os.path.realpath(os.path.dirname(filename) or os.curdir)
    dir_fd = os.open(parent, os.O_DIRECTORY | os.O_RDONLY)

    try:
        replaced = False
        try:
            # write to the temporary file and force it to disk
            with open(tmp_filename, 'w') as tmp:
                tmp.write(body)
                tmp.write("\n")
                tmp.flush()
                os.fsync(tmp.fileno())

            # atomically replace the actual file
            os.rename(tmp_filename, filename)
            replaced = True
        finally:
            # do not leave a stray temporary file behind on failure
            if not replaced:
                try:
                    os.unlink(tmp_filename)
                except OSError:
                    pass

        # make the rename itself durable
        os.fsync(dir_fd)
    finally:
        os.close(dir_fd)
|
|
|
|
|
|
|
|
def main():
    """Generate the index page for the mirror.

    Settings are resolved with the precedence: command-line flags first,
    then the YAML config file, then built-in fallbacks.  Every symlink found
    directly under the docroot (except "pub") is treated as a project: its
    link target, minus the leading character, is used as a ZFS dataset name
    and ``zfs get used`` is run on it through sudo to obtain its size.
    Entries whose size cannot be obtained are reported on stderr and skipped.
    The collected entries are passed to the Mako template and the rendered
    page is written to the output path, atomically unless nonatomic is set
    or the existing output path is not a regular file.

    Exits with status -1 when the configuration cannot be loaded or a
    required setting (docroot, output, directories, template) is missing or
    invalid.
    """
    # accept command-line arguments
    parser = OptionParser()
    parser.add_option("-c", "--config", dest="config", default="config.yaml",
                      help="configuration file to be used", metavar="FILE")
    parser.add_option("-D", "--docroot", dest="docroot",
                      help="directory to be scanned", metavar="DIR")
    # -F is still accepted so existing invocations keep working, but its
    # value is no longer used: sizes come from zfs rather than du.
    parser.add_option("-F", "--duflags", dest="duflags",
                      help="flags to be passed to du, replaces any in config")
    parser.add_option("-o", "--output", dest="output", metavar="FILE",
                      help="file to which index page will be written. "
                           "Use /dev/stdout to send to standard out.")
    parser.add_option("-t", "--template", dest="template",
                      help="Mako template to render", metavar="FILE")
    parser.add_option("--nonatomic", dest="nonatomic", action="store_true",
                      default=False, help="write the output to the path "
                      "given without creating a temporary file in between. "
                      "This is automatically set if the output appears "
                      "to be a character device, not a file.")
    options, _ = parser.parse_args()

    # load config file
    # NOTE(review): yaml.load with FullLoader is kept as-is; this assumes
    # the config file is operator-controlled.  If it only holds plain data,
    # yaml.safe_load would be the safer choice -- confirm.
    try:
        with open(options.config, 'r') as config_file:
            config = yaml.load(config_file, Loader=yaml.FullLoader)
    except Exception as err:
        sys.stderr.write("%s\n" % err)
        config = None

    if not config or not isinstance(config, dict):
        _exit_with_error(
            "Unable to load configuration '%s'." % options.config)

    # determine important variables based on an appropriate order of
    # precedence (command-line flags first, then the config file,
    # then built-in fallbacks)
    docroot = options.docroot or config.get('docroot')
    output = options.output or config.get('output')
    template = options.template or config.get("template") or "index.mako"

    # sanity checks
    if not docroot:
        _exit_with_error(
            "docroot not specified.",
            "Define it in the config file or pass -D on the command line.")
    elif not output:
        _exit_with_error(
            "output not specified.",
            "Define it in the config file or pass -o on the command line.")
    elif not config.get('directories'):
        _exit_with_error(
            "directories not specified.",
            "Define it in the config file.")
    elif not os.path.isdir(docroot):
        _exit_with_error(
            "docroot '%s' not found or not a directory." % docroot)
    elif not os.path.exists(template) or os.path.isdir(template):
        _exit_with_error(
            "template '%s' not found or is a directory." % template)

    # fallback value for nonatomic is used so that character devices
    # (e.g. /dev/stdout, /dev/null) are written to in the regular way.
    # This is computed only after the checks above, because it needs a
    # real output path.
    nonatomic = options.nonatomic or config.get("nonatomic") or \
        (os.path.exists(output) and not os.path.isfile(output))

    generated = datetime.datetime.now()

    known = config['directories']
    excluded = config.get('exclude') or []

    directories = []
    total_size = 0.0

    for item in os.listdir(docroot):
        if item == "pub":
            continue

        path = os.path.join(docroot, item)

        # Only symlinks are projects; anything else is ignored
        if not os.path.islink(path):
            continue

        # The link target with its first character dropped is used as the
        # dataset name
        dataset = os.readlink(path)[1:]

        # Get the disk space used by that dataset
        size = _zfs_used_bytes(dataset, item)
        if size is None:
            continue

        # Excluded entries are still counted in the total, as before
        total_size += size

        info = {'dir': item, 'size': reformat_size(size)}

        # use info from config.yaml, if found;
        # skip the directory if it is excluded
        if item in excluded:
            continue
        elif item in known:
            info.update(known[item])
        else:
            info.update({'site': '', 'url': ''})

        directories.append(info)

    # Sort the directories
    directories.sort(key=lambda d: d['dir'].lower())

    # render the template to a string
    body = Template(filename=template).render(
        total_size=reformat_size(total_size),
        directories=directories,
        generated=generated,
        config=config,
        h=webhelpers.html.tags)

    # write the rendered output
    if nonatomic:
        with open(output, 'w') as out:
            out.write(body)
            out.write("\n")
    else:
        atomic_write(output, body)


def _exit_with_error(*lines):
    """Write each of *lines* to stderr and exit with status -1."""
    for line in lines:
        sys.stderr.write(line + "\n")
    sys.exit(-1)


def _zfs_used_bytes(dataset, item):
    """Return the space used by *dataset* as a number, or None on failure.

    Failures are reported on stderr, naming the directory entry *item*.
    """
    # An argument list (no shell) keeps unusual characters in the dataset
    # name from being interpreted by a shell.  Text mode makes the output
    # a str on both Python 2 and Python 3.
    command = ["/usr/bin/sudo", "/sbin/zfs", "get", "-H",
               "-o", "value", "used", dataset]
    try:
        zfs = Popen(command, stdout=PIPE, stderr=PIPE,
                    universal_newlines=True)
        out, err = zfs.communicate()
    except OSError as exc:
        sys.stderr.write("%s\n" % exc)
        sys.stderr.write(
            "zfs get terminated unsuccessfully for %s\n" % item)
        return None

    # Anything on stderr, or a non-zero exit status, counts as a failure
    if err.strip() or zfs.returncode != 0:
        sys.stderr.write(err)
        sys.stderr.write(
            "zfs get terminated unsuccessfully for %s\n" % item)
        return None

    try:
        return parse_size(out.strip())
    except ValueError:
        sys.stderr.write(
            "zfs get terminated unsuccessfully for %s\n" % item)
        return None
|
|
|
|
|
|
|
|
|
|
|
|
# Run the generator only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
|