Context Navigation

system_tools.py @ 7170

Last change on this file since 7170 was 7170, checked in by rwilson, 16 years ago
Changed safe_crc() to use suggested method.
File size: 19.1 KB

Rev	Line
[3937]	1	"""Implementation of tools to do with system administration made as platform independent as possible.
	2
	3
	4	"""
	5
	6	import sys
	7	import os
[6415]	8	import string
[6689]	9	import urllib
	10	import urllib2
	11	import getpass
	12	import tarfile
[7035]	13	try:
	14	import hashlib
	15	except ImportError:
	16	import md5 as hashlib
[3937]	17
[6689]	18
def log_to_file(filename, s, verbose=False):
    """Append string s as one line to a log file.

    filename: Path of the log file; opened in append mode.
    s:        Text to log. A newline is appended when writing to the file.
    verbose:  If true, s is also printed to standard output.
    """

    fid = open(filename, 'a')
    try:
        if verbose:
            print(s)
        fid.write(s + '\n')
    finally:
        # Release the handle even if printing or writing fails.
        fid.close()
	27
	28
def get_user_name():
    """Get user name provided by operating system

    The name is read from the environment: USERNAME when sys.platform is
    'win32', LOGNAME on every other platform.  None is returned if the
    relevant variable is not set.
    """

    if sys.platform != 'win32':
        return os.getenv('LOGNAME')

    # Windows branch (USERPROFILE was considered but USERNAME is used).
    return os.getenv('USERNAME')
	41
	42	def get_host_name():
	43	"""Get host name provide by operating system
	44	"""
	45
	46	if sys.platform == 'win32':
	47	host = os.getenv('COMPUTERNAME')
	48	else:
	49	host = os.uname()[1]
	50
	51
	52	return host
[4787]	53
	54	def get_revision_number():
[6904]	55	"""Get the version number of this repository copy.
	56
	57	Try getting data from stored_version_info.py first, otherwise
	58	try using SubWCRev.exe (Windows) or svnversion (linux), otherwise
	59	try reading file .svn/entries for version information, otherwise
	60	throw an exception.
	61
[4787]	62	NOTE: This requires that the command svn is on the system PATH
	63	(simply aliasing svn to the binary will not work)
	64	"""
	65
[6904]	66	def get_revision_from_svn_entries():
	67	'''Get a subversion revision number from the .svn/entires file.'''
	68
[6689]	69	msg = '''
	70	No version info stored and command 'svn' is not recognised on the system PATH.
[4787]	71
[6904]	72	If ANUGA has been installed from a distribution e.g. as obtained from SourceForge,
	73	the version info should be available in the automatically generated file
	74	'stored_version_info.py' in the anuga root directory.
[4787]	75
[6904]	76	If run from a Subversion sandpit, ANUGA will try to obtain the version info by
	77	using the command 'svn info'. In this case, make sure the command line client
	78	'svn' is accessible on the system path. Simply aliasing 'svn' to the binary will
	79	not work.
[4787]	80
[6689]	81	If you are using Windows, you have to install the file svn.exe which can be
	82	obtained from http://www.collab.net/downloads/subversion.
[4787]	83
[6689]	84	Good luck!
	85	'''
[4787]	86
	87	try:
[6904]	88	fd = open(os.path.join('.svn', 'entries'))
[4787]	89	except:
[6904]	90	raise Exception, msg
[6689]	91
[6904]	92	line = fd.readlines()[3]
	93	fd.close()
	94	try:
	95	revision_number = int(line)
	96	except:
	97	msg = ".svn/entries, line 4 was '%s'?" % line.strip()
[6689]	98	raise Exception, msg
[6904]	99
	100	return revision_number
	101
	102	def get_revision_from_svn_client():
	103	'''Get a subversion revision number from an svn client.'''
	104
	105	if sys.platform[0:3] == 'win':
	106	try:
	107	fid = os.popen(r'C:\Program Files\TortoiseSVN\bin\SubWCRev.exe')
	108	except:
	109	return get_revision_from_svn_entries()
	110	else:
	111	version_info = fid.read()
	112	if version_info == '':
	113	return get_revision_from_svn_entries()
	114
	115	# split revision number from data
	116	for line in version_info.split('\n'):
	117	if line.startswith('Updated to revision '):
	118	break
	119
	120	fields = line.split(' ')
	121	msg = 'Keyword "Revision" was not found anywhere in text: %s' % version_info
	122	assert fields[0].startswith('Updated'), msg
	123
	124	try:
	125	revision_number = int(fields[3])
	126	except:
	127	msg = ("Revision number must be an integer. I got '%s' from "
	128	"'SubWCRev.exe'." % fields[3])
	129	raise Exception, msg
	130	else: # assume Linux
	131	try:
	132	fid = os.popen('svnversion -n . 2>/dev/null')
	133	except:
	134	return get_revision_from_svn_entries()
	135	else:
	136	version_info = fid.read()
	137	if version_info == '':
	138	return get_revision_from_svn_entries()
	139
	140	# split revision number from data
	141	if ':' in version_info:
	142	(_, revision_number) = version_info.split(':')
	143	elif version_info.endswith('M'):
	144	revision_number = version_info[:-1]
	145	else:
	146	revision_number = version_info
	147
	148	try:
	149	revision_number = int(revision_number)
	150	except:
	151	msg = ("Revision number must be an integer. I got '%s' from "
	152	"'svn'." % version_info)
	153	raise Exception, msg
	154
	155	return revision_number
	156
	157	# try to get revision information from stored_version_info.py
	158	try:
	159	from anuga.stored_version_info import version_info
	160	except:
	161	return get_revision_from_svn_client()
	162
	163	# split revision number from data
[4787]	164	for line in version_info.split('\n'):
	165	if line.startswith('Revision:'):
	166	break
	167
	168	fields = line.split(':')
[6689]	169	msg = 'Keyword "Revision" was not found anywhere in text: %s' % version_info
[6904]	170	assert fields[0].startswith('Revision'), msg
[4787]	171
	172	try:
	173	revision_number = int(fields[1])
	174	except:
[6904]	175	msg = ("Revision number must be an integer. I got '%s'.\n"
	176	'Check that the command svn is on the system path.'
	177	% fields[1])
[6689]	178	raise Exception, msg
	179
[4787]	180	return revision_number
	181
	182
	183	def store_version_info(destination_path='.', verbose=False):
	184	"""Obtain current version from Subversion and store it.
	185
	186	Title: store_version_info()
	187
	188	Author: Ole Nielsen (Ole.Nielsen@ga.gov.au)
	189
	190	CreationDate: January 2006
	191
	192	Description:
	193	This function obtains current version from Subversion and stores it
	194	is a Python file named 'stored_version_info.py' for use with
	195	get_version_info()
	196
	197	If svn is not available on the system PATH, an Exception is thrown
	198	"""
	199
	200	# Note (Ole): This function should not be unit tested as it will only
	201	# work when running out of the sandpit. End users downloading the
	202	# ANUGA distribution would see a failure.
	203	#
	204	# FIXME: This function should really only be used by developers (
	205	# (e.g. for creating new ANUGA releases), so maybe it should move
	206	# to somewhere else.
	207
	208	import config
	209
	210	try:
	211	fid = os.popen('svn info')
	212	except:
	213	msg = 'Command "svn" is not recognised on the system PATH'
	214	raise Exception(msg)
	215	else:
	216	txt = fid.read()
	217	fid.close()
	218
	219
	220	# Determine absolute filename
	221	if destination_path[-1] != os.sep:
	222	destination_path += os.sep
	223
	224	filename = destination_path + config.version_filename
	225
	226	fid = open(filename, 'w')
	227
	228	docstring = 'Stored version info.\n\n'
	229	docstring += 'This file provides the version for distributions '
	230	docstring += 'that are not accessing Subversion directly.\n'
	231	docstring += 'The file is automatically generated and should not '
	232	docstring += 'be modified manually.\n'
	233	fid.write('"""%s"""\n\n' %docstring)
	234
	235	fid.write('version_info = """\n%s"""' %txt)
	236	fid.close()
	237
	238
	239	if verbose is True:
	240	print 'Version info stored to %s' %filename
[4952]	241
[6689]	242
def safe_crc(string):
    """64 bit safe crc computation.

    Returns the CRC32 of 'string' as a non-negative integer.

    See http://docs.python.org/library/zlib.html#zlib.crc32:

        To generate the same numeric value across all Python versions
        and platforms use crc32(data) & 0xffffffff.
    """

    import zlib

    checksum = zlib.crc32(string)

    # Keep only the low 32 bits so the value is never negative.
    return checksum & 0xffffffff
[5048]	255
	256
def compute_checksum(filename, max_length=2**20):
    """Compute the CRC32 checksum for specified file

    Optional parameter max_length sets the maximum number
    of bytes used to limit time used with large files.
    Default = 2**20 (1MB)

    Only the first max_length bytes of the file contribute to the result,
    which is the value returned by safe_crc() for those bytes.
    """

    fid = open(filename, 'rb')  # Use binary for portability
    try:
        crcval = safe_crc(fid.read(max_length))
    finally:
        # Release the handle even if reading fails.
        fid.close()

    return crcval
[5072]	270
	271	def get_pathname_from_package(package):
	272	"""Get pathname of given package (provided as string)
	273
	274	This is useful for reading files residing in the same directory as
	275	a particular module. Typically, this is required in unit tests depending
	276	on external files.
	277
	278	The given module must start from a directory on the pythonpath
	279	and be importable using the import statement.
	280
	281	Example
	282	path = get_pathname_from_package('anuga.utilities')
	283
	284	"""
	285
	286	exec('import %s as x' %package)
	287
	288	path = x.__path__[0]
	289
	290	return path
	291
	292	# Alternative approach that has been used at times
	293	#try:
	294	# # When unit test is run from current dir
	295	# p1 = read_polygon('mainland_only.csv')
	296	#except:
	297	# # When unit test is run from ANUGA root dir
	298	# from os.path import join, split
	299	# dir, tail = split(__file__)
	300	# path = join(dir, 'mainland_only.csv')
	301	# p1 = read_polygon(path)
	302
[6410]	303
##
# @brief Split a string into 'clean' fields.
# @param str The string to process.
# @param delimiter The delimiter string to split 'str' with.
# @return A list of 'cleaned' field strings.
# @note Any fields that were initially zero length will be removed.
# @note If a field contains '\n' it isn't zero length.
def clean_line(str, delimiter):
    """Split string on given delimiter, remove whitespace from each field.

    The whole string is stripped first.  Fields that are empty straight
    after splitting are dropped; a field holding only whitespace is kept
    and becomes ''.
    """

    fields = []
    for raw_field in str.strip().split(delimiter):
        if raw_field == '':
            continue
        fields.append(raw_field.strip())

    return fields
[5072]	315
[6360]	316
[6415]	317	################################################################################
	318	# The following two functions are used to get around a problem with numpy and
	319	# NetCDF files. Previously, using Numeric, we could take a list of strings and
	320	# convert to a Numeric array resulting in this:
	321	# Numeric.array(['abc', 'xy']) -> [['a', 'b', 'c'],
	322	# ['x', 'y', ' ']]
	323	#
	324	# However, under numpy we get:
	325	# numpy.array(['abc', 'xy']) -> ['abc',
	326	# 'xy']
	327	#
	328	# And writing strings to a NetCDF file is problematic.
	329	#
	330	# The solution is to use these two routines to convert a 1-D list of strings
	331	# to the 2-D list of chars form and back. The 2-D form can be written to a
	332	# NetCDF file as before.
	333	#
	334	# The other option, of inverting a list of tag strings into a dictionary with
	335	# keys being the unique tag strings and the key value a list of indices of where
	336	# the tag string was in the original list was rejected because:
	337	# 1. It's a lot of work
	338	# 2. We'd have to rewrite the I/O code a bit (extra variables instead of one)
	339	# 3. The code below is fast enough in an I/O scenario
	340	################################################################################
	341
	342	##
	343	# @brief Convert 1-D list of strings to 2-D list of chars.
	344	# @param l 1-dimensional list of strings.
	345	# @return A 2-D list of 'characters' (1 char strings).
	346	# @note No checking that we supply a 1-D list.
	347	def string_to_char(l):
	348	'''Convert 1-D list of strings to 2-D list of chars.'''
	349
[6428]	350	if not l:
	351	return []
	352
	353	if l == ['']:
	354	l = [' ']
	355
[6415]	356	maxlen = reduce(max, map(len, l))
	357	ll = [x.ljust(maxlen) for x in l]
	358	result = []
	359	for s in ll:
	360	result.append([x for x in s])
	361	return result
	362
	363
	364	##
	365	# @brief Convert 2-D list of chars to 1-D list of strings.
	366	# @param ll 2-dimensional list of 'characters' (1 char strings).
	367	# @return A 1-dimensional list of strings.
	368	# @note Each string has had right-end spaces removed.
	369	def char_to_string(ll):
	370	'''Convert 2-D list of chars to 1-D list of strings.'''
	371
	372	return map(string.rstrip, [''.join(x) for x in ll])
	373
[6786]	374	################################################################################
[6415]	375
##
# @brief Get list of variable names in a python expression string.
# @param source A string containing a python expression.
# @return A list of variable name strings.
# @note Throws SyntaxError exception if not a valid expression.
def get_vars_in_expression(source):
    '''Get list of variable names in a python expression.

    source: A string containing a python expression.

    Returns a list of the distinct names that are read in the expression
    (this includes names of called functions), in the order they are first
    met in a depth-first walk of the syntax tree.

    Raises SyntaxError if 'source' cannot be parsed.
    '''

    # The 'ast' module replaces the 'compiler' package, which was
    # deprecated in Python 2.6 and does not exist in Python 3.
    import ast

    var_list = []

    ##
    # @brief Internal recursive function.
    # @param node An AST parse node.
    # @note Appends newly found names to 'var_list' of the enclosing scope.
    def get_vars_body(node):
        # Only names that are read count; assignment targets are skipped.
        if isinstance(node, ast.Name) and isinstance(node.ctx, ast.Load):
            if node.id not in var_list:
                var_list.append(node.id)

        for child in ast.iter_child_nodes(node):
            get_vars_body(child)

    get_vars_body(ast.parse(source))

    return var_list
	407
	408
	409	##
	410	# @brief Get a file from the web.
	411	# @param file_url URL of the file to fetch.
	412	# @param file_name Path to file to create in the filesystem.
	413	# @param auth Auth tuple (httpproxy, proxyuser, proxypass).
	414	# @param blocksize Read file in this block size.
[6904]	415	# @return (True, auth) if successful, else (False, auth).
[6689]	416	# @note If 'auth' not supplied, will prompt user.
	417	# @note Will try using environment variable HTTP_PROXY for proxy server.
	418	# @note Will try using environment variable PROXY_USERNAME for proxy username.
	419	# @note Will try using environment variable PROXY_PASSWORD for proxy password.
	420	def get_web_file(file_url, file_name, auth=None, blocksize=1024*1024):
[6786]	421	'''Get a file from the web (HTTP).
[6689]	422
	423	file_url: The URL of the file to get
	424	file_name: Local path to save loaded file in
	425	auth: A tuple (httpproxy, proxyuser, proxypass)
	426	blocksize: Block size of file reads
	427
	428	Will try simple load through urllib first. Drop down to urllib2
	429	if there is a proxy and it requires authentication.
	430
	431	Environment variable HTTP_PROXY can be used to supply proxy information.
	432	PROXY_USERNAME is used to supply the authentication username.
	433	PROXY_PASSWORD supplies the password, if you dare!
	434	'''
	435
	436	# Simple fetch, if fails, check for proxy error
	437	try:
	438	urllib.urlretrieve(file_url, file_name)
[6904]	439	return (True, auth) # no proxy, no auth required
[6689]	440	except IOError, e:
[6786]	441	if e[1] == 407: # proxy error
	442	pass
	443	elif e[1][0] == 113: # no route to host
	444	print 'No route to host for %s' % file_url
[6904]	445	return (False, auth) # return False
[6786]	446	else:
	447	print 'Unknown connection error to %s' % file_url
[6904]	448	return (False, auth)
[6689]	449
	450	# We get here if there was a proxy error, get file through the proxy
	451	# unpack auth info
	452	try:
	453	(httpproxy, proxyuser, proxypass) = auth
	454	except:
	455	(httpproxy, proxyuser, proxypass) = (None, None, None)
	456
	457	# fill in any gaps from the environment
	458	if httpproxy is None:
	459	httpproxy = os.getenv('HTTP_PROXY')
	460	if proxyuser is None:
	461	proxyuser = os.getenv('PROXY_USERNAME')
	462	if proxypass is None:
	463	proxypass = os.getenv('PROXY_PASSWORD')
	464
	465	# Get auth info from user if still not supplied
	466	if httpproxy is None or proxyuser is None or proxypass is None:
[6913]	467	print '-'*72
[6786]	468	print ('You need to supply proxy authentication information.')
[6689]	469	if httpproxy is None:
[6815]	470	httpproxy = raw_input(' proxy server: ')
	471	else:
	472	print ' HTTP proxy was supplied: %s' % httpproxy
[6689]	473	if proxyuser is None:
[6815]	474	proxyuser = raw_input(' proxy username: ')
	475	else:
	476	print 'HTTP proxy username was supplied: %s' % proxyuser
[6689]	477	if proxypass is None:
[6815]	478	proxypass = getpass.getpass(' proxy password: ')
	479	else:
	480	print 'HTTP proxy password was supplied: %s' % ''len(proxyuser)
[6913]	481	print '-'*72
[6689]	482
	483	# the proxy URL cannot start with 'http://', we add that later
	484	httpproxy = httpproxy.lower()
	485	if httpproxy.startswith('http://'):
	486	httpproxy = httpproxy.replace('http://', '', 1)
	487
	488	# open remote file
	489	proxy = urllib2.ProxyHandler({'http': 'http://' + proxyuser
	490	+ ':' + proxypass
	491	+ '@' + httpproxy})
	492	authinfo = urllib2.HTTPBasicAuthHandler()
	493	opener = urllib2.build_opener(proxy, authinfo, urllib2.HTTPHandler)
	494	urllib2.install_opener(opener)
[6825]	495	try:
	496	webget = urllib2.urlopen(file_url)
[6904]	497	except urllib2.HTTPError, e:
	498	print 'Error received from proxy:\n%s' % str(e)
	499	print 'Possibly the user/password is wrong.'
	500	return (False, (httpproxy, proxyuser, proxypass))
[6689]	501
	502	# transfer file to local filesystem
	503	fd = open(file_name, 'wb')
	504	while True:
	505	data = webget.read(blocksize)
	506	if len(data) == 0:
	507	break
	508	fd.write(data)
	509	fd.close
	510	webget.close()
	511
	512	# return successful auth info
[6904]	513	return (True, (httpproxy, proxyuser, proxypass))
[6689]	514
	515
	516	##
	517	# @brief Tar a file (or directory) into a tarfile.
	518	# @param files A list of files (or directories) to tar.
	519	# @param tarfile The created tarfile name.
[7024]	520	# @note 'files' may be a string (single file) or a list of strings.
[6689]	521	# @note We use gzip compression.
	522	def tar_file(files, tarname):
	523	'''Compress a file or directory into a tar file.'''
	524
[7024]	525	if isinstance(files, basestring):
	526	files = [files]
	527
[6689]	528	o = tarfile.open(tarname, 'w:gz')
	529	for file in files:
	530	o.add(file)
	531	o.close()
	532
	533
	534	##
	535	# @brief Untar a file into an optional target directory.
	536	# @param tarname Name of the file to untar.
	537	# @param target_dir Directory to untar into.
	538	def untar_file(tarname, target_dir='.'):
	539	'''Uncompress a tar file.'''
	540
	541	o = tarfile.open(tarname, 'r:gz')
	542	members = o.getmembers()
	543	for member in members:
	544	o.extract(member, target_dir)
	545	o.close()
	546
	547
	548	##
[6904]	549	# @brief Return a hex digest (MD5) of a given file.
[6689]	550	# @param filename Path to the file of interest.
	551	# @param blocksize Size of data blocks to read.
	552	# @return A hex digest string (16 bytes).
[7148]	553	# @note Uses MD5 digest if hashlib not available.
[6689]	554	def get_file_hexdigest(filename, blocksize=1024102410):
	555	'''Get a hex digest of a file.'''
[7035]	556
	557	if hashlib.__name__ == 'hashlib':
	558	m = hashlib.md5() # new - 'hashlib' module
	559	else:
	560	m = hashlib.new() # old - 'md5' module - remove once py2.4 gone
[6689]	561	fd = open(filename, 'r')
	562
	563	while True:
	564	data = fd.read(blocksize)
	565	if len(data) == 0:
	566	break
	567	m.update(data)
	568
	569	fd.close()
	570	return m.hexdigest()
	571
	572
	573	##
	574	# @brief Create a file containing a hexdigest string of a data file.
	575	# @param data_file Path to the file to get the hexdigest from.
	576	# @param digest_file Path to hexdigest file to create.
	577	# @note Uses MD5 digest.
	578	def make_digest_file(data_file, digest_file):
	579	'''Create a file containing the hex digest string of a data file.'''
	580
	581	hexdigest = get_file_hexdigest(data_file)
	582	fd = open(digest_file, 'w')
	583	fd.write(hexdigest)
	584	fd.close()
	585
	586
	587	##
	588	# @brief Function to return the length of a file.
	589	# @param in_file Path to file to get length of.
	590	# @return Number of lines in file.
	591	# @note Doesn't count '\n' characters.
	592	# @note Zero byte file, returns 0.
	593	# @note No \n in file at all, but >0 chars, returns 1.
	594	def file_length(in_file):
	595	'''Function to return the length of a file.'''
	596
	597	fid = open(in_file)
	598	data = fid.readlines()
	599	fid.close()
	600	return len(data)
	601
	602

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: branches/numpy/anuga/utilities/system_tools.py @ 7170

Download in other formats: