GitList

S3/Utils.py

ec50b5a7	## Amazon S3 manager ## Author: Michal Ludvig <michal@logix.cz> ## http://www.logix.cz/michal ## License: GPL Version 2
8ec1807f	import os
df9fa4b5	import time import re
8ec1807f	import string import random
0b2aefe3	try:
3c682455	from hashlib import md5
0b2aefe3	except ImportError:
3c682455	from md5 import md5
ac9940ec	import errno
df9fa4b5
ed27a45e	from logging import debug, info, warning, error
82d9eafa	import Config
7bae4e19	try: import xml.etree.ElementTree as ET except ImportError: import elementtree.ElementTree as ET
0d91ff3f	def stripTagXmlns(xmlns, tag): """ Returns a function that, given a tag name argument, removes eventual ElementTree xmlns from it. Example: stripTagXmlns("{myXmlNS}tag") -> "tag" """ if not xmlns: return tag return re.sub(xmlns, "", tag) def fixupXPath(xmlns, xpath, max = 0): if not xmlns: return xpath retval = re.subn("//", "//%s" % xmlns, xpath, max)[0] return retval
df9fa4b5	def parseNodes(nodes, xmlns = ""):
e5c6f6c5	## WARNING: Ignores text nodes from mixed xml/text. ## For instance <tag1>some text<tag2>other text</tag2></tag1> ## will be ignore "some text" node
df9fa4b5	retval = [] for node in nodes: retval_item = {} for child in node.getchildren():
0d91ff3f	name = stripTagXmlns(xmlns, child.tag)
e5c6f6c5	if child.getchildren(): retval_item[name] = parseNodes([child], xmlns) else: retval_item[name] = node.findtext(".//%s" % child.tag)
df9fa4b5	retval.append(retval_item) return retval def getNameSpace(element): if not element.tag.startswith("{"): return "" return re.compile("^(\{[^}]+\})").match(element.tag).groups()[0]
67a8d099	def getTreeFromXml(xml):
b6e1cada	tree = ET.fromstring(xml)
67a8d099	tree.xmlns = getNameSpace(tree) return tree def getListFromXml(xml, node): tree = getTreeFromXml(xml) nodes = tree.findall('.//%s%s' % (tree.xmlns, node)) return parseNodes(nodes, tree.xmlns)
b6e1cada
0d91ff3f	def getTextFromXml(xml, xpath):
67a8d099	tree = getTreeFromXml(xml)
dc758146	if tree.tag.endswith(xpath): return tree.text else:
67a8d099	return tree.findtext(fixupXPath(tree.xmlns, xpath)) def getRootTagName(xml): tree = getTreeFromXml(xml) return stripTagXmlns(tree.xmlns, tree.tag)
0d91ff3f
df9fa4b5	def dateS3toPython(date): date = re.compile("\.\d\d\dZ").sub(".000Z", date) return time.strptime(date, "%Y-%m-%dT%H:%M:%S.000Z") def dateS3toUnix(date): ## FIXME: This should be timezone-aware. ## Currently the argument to strptime() is GMT but mktime() ## treats it as "localtime". Anyway... return time.mktime(dateS3toPython(date))
63ba9974	def formatSize(size, human_readable = False, floating_point = False): size = floating_point and float(size) or int(size)
df9fa4b5	if human_readable: coeffs = ['k', 'M', 'G', 'T'] coeff = "" while size > 2048:
b5fe5ac4	size /= 1024
df9fa4b5	coeff = coeffs.pop(0) return (size, coeff) else: return (size, "") def formatDateTime(s3timestamp): return time.strftime("%Y-%m-%d %H:%M", dateS3toPython(s3timestamp))
b5fe5ac4	def convertTupleListToDict(list): retval = {} for tuple in list: retval[tuple[0]] = tuple[1] return retval
8ec1807f	_rnd_chars = string.ascii_letters+string.digits _rnd_chars_len = len(_rnd_chars) def rndstr(len): retval = "" while len > 0: retval += _rnd_chars[random.randint(0, _rnd_chars_len-1)] len -= 1 return retval def mktmpsomething(prefix, randchars, createfunc): old_umask = os.umask(0077) tries = 5 while tries > 0: dirname = prefix + rndstr(randchars) try: createfunc(dirname) break except OSError, e: if e.errno != errno.EEXIST: os.umask(old_umask) raise tries -= 1 os.umask(old_umask) return dirname def mktmpdir(prefix = "/tmp/tmpdir-", randchars = 10): return mktmpsomething(prefix, randchars, os.mkdir) def mktmpfile(prefix = "/tmp/tmpfile-", randchars = 20): createfunc = lambda filename : os.close(os.open(filename, os.O_CREAT \| os.O_EXCL)) return mktmpsomething(prefix, randchars, createfunc)
49731b40	def hash_file_md5(filename):
3c682455	h = md5()
37a8ad44	f = open(filename, "rb")
9a5cde49	while True: # Hash 32kB chunks data = f.read(32*1024) if not data: break h.update(data)
49731b40	f.close() return h.hexdigest()
ed27a45e
bc4c306d	def mkdir_with_parents(dir_name):
ed27a45e	"""
bc4c306d	mkdir_with_parents(dst_dir)
ed27a45e	Create directory 'dir_name' with all parent directories Returns True on success, False otherwise. """ pathmembers = dir_name.split(os.sep) tmp_stack = [] while pathmembers and not os.path.isdir(os.sep.join(pathmembers)): tmp_stack.append(pathmembers.pop()) while tmp_stack: pathmembers.append(tmp_stack.pop()) cur_dir = os.sep.join(pathmembers) try: debug("mkdir(%s)" % cur_dir) os.mkdir(cur_dir)
bc4c306d	except (OSError, IOError), e: warning("%s: can not make directory: %s" % (cur_dir, e.strerror))
ed27a45e	return False except Exception, e:
bc4c306d	warning("%s: %s" % (cur_dir, e))
ed27a45e	return False return True
d90a7929
82d9eafa	def unicodise(string, encoding = None, errors = "replace"):
d90a7929	""" Convert 'string' to Unicode or raise an exception. """
82d9eafa	if not encoding: encoding = Config.Config().encoding debug("Unicodising %r using %s" % (string, encoding))
d90a7929	if type(string) == unicode: return string try:
82d9eafa	return string.decode(encoding, errors)
d90a7929	except UnicodeDecodeError: raise UnicodeDecodeError("Conversion to unicode failed: %r" % string)
82d9eafa	def deunicodise(string, encoding = None, errors = "replace"): """ Convert unicode 'string' to <type str>, by default replacing all invalid characters with '?' or raise an exception. """ if not encoding: encoding = Config.Config().encoding debug("DeUnicodising %r using %s" % (string, encoding)) if type(string) != unicode: return str(string)
d90a7929	try:
82d9eafa	return string.encode(encoding, errors) except UnicodeEncodeError: raise UnicodeEncodeError("Conversion from unicode failed: %r" % string) def unicodise_safe(string, encoding = None): """ Convert 'string' to Unicode according to current encoding and replace all invalid characters with '?' """ return unicodise(deunicodise(string, encoding), encoding).replace(u'\ufffd', '?')
d90a7929