#!/usr/bin/env python # corestats.py (COREy STATS) # Copyright (c) 2006-2007, Corey Goldberg (corey@goldb.org) # # statistical calculation class # for processing numeric sequences # # license: GNU LGPL # # This library is free software; you can redistribute it and/or # modify it under the terms of the GNU Lesser General Public # License as published by the Free Software Foundation; either # version 2.1 of the License, or (at your option) any later version. import sys class Stats: def __init__(self, sequence): # sequence of numbers we will process # convert all items to floats for numerical processing self.sequence = [float(item) for item in sequence] self.use_fastselect = False # switch the algorithm used for percentiles def print_sequence(self): # print the sequence (newline delimited) for item in self.sequence: print item def sum(self): if len(self.sequence) < 1: return None else: return sum(self.sequence) def count(self): return len(self.sequence) def min(self): if len(self.sequence) < 1: return None else: return min(self.sequence) def max(self): if len(self.sequence) < 1: return None else: return max(self.sequence) def avg(self): if len(self.sequence) < 1: return None else: return sum(self.sequence) / len(self.sequence) def median(self): if len(self.sequence) < 1: return None else: seq.sort() return self.sequence[len(self.sequence) // 2] def stdev(self): if len(self.sequence) < 1: return None else: avg = self.avg() sdsq = sum([(i - avg) ** 2 for i in self.sequence]) stdev = (sdsq / (len(self.sequence) - 1 or 1)) ** .5 return stdev def percentile(self, percentile): if self.use_fastselect: # get fastselect here: http://aspn.activestate.com/ASPN/Cookbook/Python/Recipe/466330 import fastselect if len(self.sequence) < 1: value = None elif (percentile >= 100): sys.stderr.write('ERROR: percentile must be < 100. you supplied: %s\n'% percentile) value = None else: element_idx = int(len(self.sequence) * (percentile / 100.0)) if self.use_fastselect: # fastselect algorithm. see fastselect for performance details value = fastselect.select(element_idx, self.sequence) else: self.sequence.sort() value = self.sequence[element_idx] return value