From 1b63c73eb70f71d6a4e3ac8cb76ef599ba7fda7d Mon Sep 17 00:00:00 2001 From: Alexander Minges Date: Tue, 25 Aug 2015 14:19:57 +0200 Subject: [PATCH 1/6] More documentation; Removed dead codepath. --- libkinetics/__init__.py | 75 ++++++++++++++++++++++++++++++++--------- 1 file changed, 59 insertions(+), 16 deletions(-) diff --git a/libkinetics/__init__.py b/libkinetics/__init__.py index 5e2ed72..4ae3078 100644 --- a/libkinetics/__init__.py +++ b/libkinetics/__init__.py @@ -115,22 +115,43 @@ class Experiment(): """ Represents the actual experiment. - Consists of several Measurement objects. + Representation of a kinetics experiment. It consists of multiple + objects of type Measurement. - Args: - data_files: list containing csv-formatted data files - xlim: tuple of float values defining the lower and upper bound for - linear fitting of v0 - do_hill: boolean to define whether to fit Hill-type kinetics in - addition to Michaelis-Menten kinetics. Defaults to False - fit_to_replicates: boolean to define wheter to fit to individual - replicates instead of the avarage slope. Defaults to False - logger: logging.Logger instance. If not given, a new logger is created + Attributes: + logger: logging.Logger instance that is used for logging to console + and log file. + measurements: list of individual measurements of the experiment. + Usually defined by different substrate concentrations. + fit_to_replicates: whether to fit to individual replicates instead to + the average of each measurement. + raw_kinetic_data: dictionary storing x, y and std_err of each + measurement for fitting kinetic curves. + xlim: lower and upper bounds for calculating the v0 linear fit. """ def __init__(self, data_files, xlim, do_hill=False, fit_to_replicates=False, logger=None): + """ + Inits Experiment class with experimental parameters + This is the only class you should have to use directly in your program. + Instances of Measurement and Replicate objects are created + automatically using the provided data files. + + Args: + data_files: list containing csv-formatted data files + xlim: tuple of float values defining the lower and upper bound for + linear fitting of v0 + do_hill: boolean to define whether to fit Hill-type kinetics in + addition to Michaelis-Menten kinetics. Defaults to False + fit_to_replicates: boolean to define wheter to fit to individual + replicates instead of the avarage slope. Defaults to False + logger: logging.Logger instance. If not given, a new logger is + created + """ + + # check if a logger was handed over; if not, create a new instance if logger: self.logger = logger else: @@ -189,17 +210,39 @@ class Experiment(): else: self.hill = None - def plot_data(self, outpath): - # iterate over all measurements - for m in self.measurements: - # plot each measurement - m.plot(outpath) - def mm_kinetics_function(self, x, vmax, Km): + """ + Michaelis-Menten function. + + Classical Michaelis-Menten enzyme kinetics function. + + Args: + x: concentration at velocity v + vmax: maximum velocity + Km: Michaelis constant + + Returns: + v: velocity at given concentration x + """ v = (vmax*x)/(Km+x) return v def hill_kinetics_function(self, x, vmax, Kprime, h): + """ + Hill function. + + Hill function for enzyme kinetics with cooperativity. + + Args: + x: concentration at velocity v + vmax: maximum velocity + Kprime: kinetics constant related to Michaelis constant + h: hill slope; if 1 function is identical to Michaelis-Menten + function. + + Returns: + v: velocity at given concentration x + """ v = (vmax*(x**h))/(Kprime+(x**h)) return v From df189d08f0a494abe0865e49d896cb966d4d0736 Mon Sep 17 00:00:00 2001 From: Alexander Minges Date: Wed, 26 Aug 2015 16:45:40 +0200 Subject: [PATCH 2/6] Improve docs; Use custom Exceptions --- libkinetics/__init__.py | 141 +++++++++++++++++++++++++++++----------- 1 file changed, 104 insertions(+), 37 deletions(-) diff --git a/libkinetics/__init__.py b/libkinetics/__init__.py index 4ae3078..9605d0b 100644 --- a/libkinetics/__init__.py +++ b/libkinetics/__init__.py @@ -7,7 +7,24 @@ import logging import warnings +class Error(Exception): + + """ + Main Error class derived from Exception. + """ + pass + + +class FitError(Error): + + """ + Exception raised if fitting fails. + """ + pass + + class Replicate(): + """ Represents a single replicate within a measurement """ @@ -66,6 +83,7 @@ class Replicate(): class Measurement(): + """ Represents a single measurement within an experiment. """ @@ -112,6 +130,7 @@ class Measurement(): class Experiment(): + """ Represents the actual experiment. @@ -121,13 +140,17 @@ class Experiment(): Attributes: logger: logging.Logger instance that is used for logging to console and log file. - measurements: list of individual measurements of the experiment. + measurements: array_like + list of individual measurements of the experiment. Usually defined by different substrate concentrations. - fit_to_replicates: whether to fit to individual replicates instead to - the average of each measurement. - raw_kinetic_data: dictionary storing x, y and std_err of each - measurement for fitting kinetic curves. - xlim: lower and upper bounds for calculating the v0 linear fit. + fit_to_replicates: boolean + whether to fit to individual replicates instead to the average of + each measurement. + raw_kinetic_data: dictionary + storing x, y and std_err of each measurement for fitting kinetic + curves. + xlim: array_like + lower and upper bounds for calculating the v0 linear fit. """ def __init__(self, data_files, xlim, do_hill=False, @@ -217,12 +240,16 @@ class Experiment(): Classical Michaelis-Menten enzyme kinetics function. Args: - x: concentration at velocity v - vmax: maximum velocity - Km: Michaelis constant + x: float + concentration at velocity v + vmax: float + maximum velocity + Km: float + Michaelis constant Returns: - v: velocity at given concentration x + v: float + velocity at given concentration x """ v = (vmax*x)/(Km+x) return v @@ -234,23 +261,50 @@ class Experiment(): Hill function for enzyme kinetics with cooperativity. Args: - x: concentration at velocity v - vmax: maximum velocity - Kprime: kinetics constant related to Michaelis constant - h: hill slope; if 1 function is identical to Michaelis-Menten - function. + x: float + concentration at velocity v. + vmax: float + maximum velocity. + Kprime: float + kinetics constant related to Michaelis constant. + h: float + hill slope; if h=1, Hill function is identical to + Michaelis-Menten function. Returns: - v: velocity at given concentration x + v: float + velocity at given concentration x """ v = (vmax*(x**h))/(Kprime+(x**h)) return v def do_mm_kinetics(self): + """ + Calculates Michaelis-Menten kinetics. + + Returns: + On success, returns a dictionary containing the kinetic parameters + and their errors: + + {'vmax': float, + 'Km': float, + 'vmax_err': float, + 'Km_err': float, + 'x': array_like} + + Raises: + FitError if fitting fails. + """ try: popt, pconv = optimize.curve_fit(self.mm_kinetics_function, self.raw_kinetic_data['x'], self.raw_kinetic_data['y']) + except ValueError: + msg = ('Calculation of Michaelis-Menten kinetics failed! Your ' + 'input data (either x or y) contain empty (NaN) values!') + if self.logger: + self.logger.error('{}'.format(msg)) + raise FitError(msg) perr = np.sqrt(np.diag(pconv)) vmax = popt[0] @@ -261,23 +315,41 @@ class Experiment(): self.logger.info(' v_max: {} ± {}'.format(vmax, perr[0])) self.logger.info(' Km: {} ± {}'.format(Km, perr[1])) - return {'vmax': float(vmax), - 'Km': float(Km), - 'perr': perr, + return {'vmax': np.float(vmax), + 'Km': np.float(Km), + 'vmax_err': np.float(perr[0]), + 'Km_err': np.float(perr[1]), 'x': x} - except: - msg = 'Calculation of Michaelis-Menten kinetics failed!' - if self.logger: - self.logger.error('{}'.format(msg)) - else: - print(msg) - return None def do_hill_kinetics(self): + """ + Calculates Hill kinetics. + + Returns: + On success, returns a dictionary containing the kinetic parameters + their errors: + + {'vmax': float, + 'Kprime': float, + 'vmax_err': float, + 'Km_prime': float, + 'h_err': float, + 'h': float, + 'x': array_like} + + Raises: + FitError if fitting fails. + """ try: popt, pconv = optimize.curve_fit(self.hill_kinetics_function, self.raw_kinetic_data['x'], self.raw_kinetic_data['y']) + except ValueError: + msg = ('Calculation of Hill kinetics failed! Your input data ' + '(either x or y) contain empty (NaN) values!') + if self.logger: + self.logger.error('{}'.format(msg)) + raise FitError(msg) perr = np.sqrt(np.diag(pconv)) vmax = popt[0] @@ -291,15 +363,10 @@ class Experiment(): self.logger.info(' K_prime: {} ± {}'.format(Kprime, perr[1])) self.logger.info(' h: {} ± {}'.format(h, perr[2])) - return {'vmax': float(vmax), - 'Kprime': float(Kprime), - 'perr': perr, - 'h': h, + return {'vmax': np.float(vmax), + 'Kprime': np.float(Kprime), + 'vmax_err': np.float(perr[0]), + 'Kprime_err': np.float(perr[1]), + 'h_err': np.float(perr[2]), + 'h': np.float(h), 'x': x} - except: - msg = 'Calculation of Hill kinetics failed!' - if self.logger: - self.logger.error('{}'.format(msg)) - else: - print(msg) - return None From d5e66fd4fe7e513af6dd4acc6995bc6e2f4e18a9 Mon Sep 17 00:00:00 2001 From: Alexander Minges Date: Thu, 27 Aug 2015 15:31:08 +0200 Subject: [PATCH 3/6] Add std to results.csv --- analyze-cli.py | 49 +++++++++++++++++++++++++++++++------------------ 1 file changed, 31 insertions(+), 18 deletions(-) diff --git a/analyze-cli.py b/analyze-cli.py index 9dcc6cf..138b4b7 100755 --- a/analyze-cli.py +++ b/analyze-cli.py @@ -45,9 +45,9 @@ class ExperimentHelper(): y = slope * x + intercept return y - def plot_data(self, exp, outpath): + def plot_data(self, outpath): # iterate over all measurements - for m in exp.measurements: + for m in self.exp.measurements: # plot each measurement fig, ax = plt.subplots() ax.set_xlabel('Time') @@ -73,7 +73,8 @@ class ExperimentHelper(): bbox_inches='tight') plt.close(fig) - def plot_kinetics(self, exp, outpath): + def plot_kinetics(self, outpath): + exp = self.exp fig, ax = plt.subplots() ax.set_xlabel('c [mM]') ax.set_ylabel('dA/dt [Au/s]') @@ -100,37 +101,49 @@ class ExperimentHelper(): plt.savefig('{}/kinetics.png'.format(outpath), bbox_inches='tight') plt.close(fig) - def write_data(self, exp, outpath): + def write_data(self, outpath): + + exp = self.exp with open('{}/results.csv'.format(outpath), 'w', newline='\n') as csvfile: writer = csv.writer(csvfile, dialect='excel-tab') - writer.writerow(['# LINEAR FITS']) + writer.writerow(['LINEAR FITS']) writer.writerow([]) - writer.writerow(['# concentration', + writer.writerow(['concentration', 'avg. slope', 'slope std_err', - 'replicates (slope, intercept and r value)']) + 'replicates (slope, intercept and r_squared)']) for m in exp.measurements: row = [m.concentration, m.avg_slope, m.avg_slope_err] for r in m.replicates: row.append(r.fitresult['slope']) row.append(r.fitresult['intercept']) - row.append(r.fitresult['r_value']) + row.append(r.fitresult['r_squared']) writer.writerow(row) writer.writerow([]) if exp.mm: - writer.writerow(['# MICHAELIS-MENTEN KINETICS']) - writer.writerow(['# vmax', 'Km']) - writer.writerow([exp.mm['vmax'], exp.mm['Km']]) + self.logger.debug(' Writing Michaelis-Menten results.') + writer.writerow(['MICHAELIS-MENTEN KINETICS']) + writer.writerow(['', 'value', 'std']) + writer.writerow(['vmax', exp.mm['vmax'], + exp.mm['vmax_err']]) + writer.writerow(['Kprime', exp.mm['Km'], + exp.mm['Km_err']]) if exp.hill: - writer.writerow(['# HILL KINETICS']) - writer.writerow(['# vmax', 'Kprime', 'h']) - writer.writerow([exp.hill['vmax'], exp.hill['Kprime'], - exp.hill['h']]) + self.logger.debug(' Writing Hill results.') + writer.writerow([]) + writer.writerow(['HILL KINETICS']) + writer.writerow(['', 'value', 'std']) + writer.writerow(['vmax', exp.hill['vmax'], + exp.hill['vmax_err']]) + writer.writerow(['Kprime', exp.hill['Kprime'], + exp.hill['Kprime_err']]) + writer.writerow(['h', exp.hill['h'], + exp.hill['h_err']]) def parse_arguments(): @@ -259,11 +272,11 @@ def main(): fit_to_replicates=fit_to_replicates) ehlp = ExperimentHelper(exp, logger) logger.info('Plotting linear fits') - ehlp.plot_data(exp, str(output_path)) + ehlp.plot_data(str(output_path)) logger.info('Plotting kinetic fit(s)') - ehlp.plot_kinetics(exp, str(output_path)) + ehlp.plot_kinetics(str(output_path)) logger.info('Writing results to results.csv') - ehlp.write_data(exp, str(output_path)) + ehlp.write_data(str(output_path)) logger.info('Finished!') else: msg = '{} is not a directory!'.format(input_path) From 754c62ffd1ed705d7656ceba1238a2b9defc1d21 Mon Sep 17 00:00:00 2001 From: Alexander Minges Date: Thu, 27 Aug 2015 15:31:35 +0200 Subject: [PATCH 4/6] More robust error handling; check third-party imports --- libkinetics/__init__.py | 97 ++++++++++++++++++++++++++--------------- 1 file changed, 62 insertions(+), 35 deletions(-) diff --git a/libkinetics/__init__.py b/libkinetics/__init__.py index 9605d0b..e553fce 100644 --- a/libkinetics/__init__.py +++ b/libkinetics/__init__.py @@ -1,10 +1,19 @@ #!/usr/bin/python # -*- coding: utf-8 -*- -from scipy import stats, optimize -import numpy as np import logging import warnings +import operator + +try: + import numpy as np +except ImportError: + print('----- NumPy must be installed! -----') + +try: + from scipy import stats, optimize +except ImportError: + print('----- SciPy must be installed! -----') class Error(Exception): @@ -128,6 +137,9 @@ class Measurement(): return results + def get_concentration(self): + return self.concentration + class Experiment(): @@ -142,7 +154,8 @@ class Experiment(): and log file. measurements: array_like list of individual measurements of the experiment. - Usually defined by different substrate concentrations. + Individual measurements are sorted by their substrate + concentration. fit_to_replicates: boolean whether to fit to individual replicates instead to the average of each measurement. @@ -192,12 +205,22 @@ class Experiment(): # parse data files and generate measurements for csvfile in data_files: - tmp = np.genfromtxt(str(csvfile), comments='#') - with open(str(csvfile)) as datafile: - head = [next(datafile) for x in range(2)] + try: + tmp = np.genfromtxt(str(csvfile), comments='#') + with open(str(csvfile)) as datafile: + head = [next(datafile) for x in range(2)] + except OSError: + msg = "Failed reading file {}".format(str(csvfile)) + self.logger.error(msg) + raise + # extract concentration and unit from header # TODO: move unit to parameter - # TODO: More error-proof header detection + # check header for correct number of items + if len(head) < 2 or len(head) > 2: + msg = 'Parsing header of data files failed! Wrong format?' + self.logger.error(msg) + raise Error(msg) conc = head[0].strip('#').strip() unit = head[1].strip('#').strip() # split x and y data apart @@ -209,6 +232,10 @@ class Experiment(): measurement = Measurement((x, y), conc, unit, self) self.measurements.append(measurement) + # sort measurements by concentration + self.measurements = sorted(self.measurements, + key=operator.attrgetter('concentration')) + # iterate over all measurements for m in self.measurements: if self.fit_to_replicates: @@ -306,20 +333,20 @@ class Experiment(): self.logger.error('{}'.format(msg)) raise FitError(msg) - perr = np.sqrt(np.diag(pconv)) - vmax = popt[0] - Km = popt[1] - x = np.arange(0, max(self.raw_kinetic_data['x']), 0.0001) + perr = np.sqrt(np.diag(pconv)) + vmax = popt[0] + Km = popt[1] + x = np.arange(0, max(self.raw_kinetic_data['x']), 0.0001) - self.logger.info('Michaelis-Menten Kinetics:') - self.logger.info(' v_max: {} ± {}'.format(vmax, perr[0])) - self.logger.info(' Km: {} ± {}'.format(Km, perr[1])) + self.logger.info('Michaelis-Menten Kinetics:') + self.logger.info(' v_max: {} ± {}'.format(vmax, perr[0])) + self.logger.info(' Km: {} ± {}'.format(Km, perr[1])) - return {'vmax': np.float(vmax), - 'Km': np.float(Km), - 'vmax_err': np.float(perr[0]), - 'Km_err': np.float(perr[1]), - 'x': x} + return {'vmax': np.float(vmax), + 'Km': np.float(Km), + 'vmax_err': np.float(perr[0]), + 'Km_err': np.float(perr[1]), + 'x': x} def do_hill_kinetics(self): """ @@ -351,22 +378,22 @@ class Experiment(): self.logger.error('{}'.format(msg)) raise FitError(msg) - perr = np.sqrt(np.diag(pconv)) - vmax = popt[0] - Kprime = popt[1] - h = popt[2] + perr = np.sqrt(np.diag(pconv)) + vmax = popt[0] + Kprime = popt[1] + h = popt[2] - x = np.arange(0, max(self.raw_kinetic_data['x']), 0.0001) + x = np.arange(0, max(self.raw_kinetic_data['x']), 0.0001) - self.logger.info('Hill Kinetics:') - self.logger.info(' v_max: {} ± {}'.format(vmax, perr[0])) - self.logger.info(' K_prime: {} ± {}'.format(Kprime, perr[1])) - self.logger.info(' h: {} ± {}'.format(h, perr[2])) + self.logger.info('Hill Kinetics:') + self.logger.info(' v_max: {} ± {}'.format(vmax, perr[0])) + self.logger.info(' K_prime: {} ± {}'.format(Kprime, perr[1])) + self.logger.info(' h: {} ± {}'.format(h, perr[2])) - return {'vmax': np.float(vmax), - 'Kprime': np.float(Kprime), - 'vmax_err': np.float(perr[0]), - 'Kprime_err': np.float(perr[1]), - 'h_err': np.float(perr[2]), - 'h': np.float(h), - 'x': x} + return {'vmax': np.float(vmax), + 'Kprime': np.float(Kprime), + 'vmax_err': np.float(perr[0]), + 'Kprime_err': np.float(perr[1]), + 'h_err': np.float(perr[2]), + 'h': np.float(h), + 'x': x} From 4808d72f8ef628a46b254a2ab736b82915331f6c Mon Sep 17 00:00:00 2001 From: Alexander Minges Date: Thu, 27 Aug 2015 18:20:48 +0200 Subject: [PATCH 5/6] Improve documentation --- analyze-cli.py | 21 ++++++++++++++++++--- 1 file changed, 18 insertions(+), 3 deletions(-) diff --git a/analyze-cli.py b/analyze-cli.py index 138b4b7..4f6785b 100755 --- a/analyze-cli.py +++ b/analyze-cli.py @@ -36,6 +36,11 @@ except ImportError: class ExperimentHelper(): + """ + Helper class for dealing with results of libkinetics. + + Provides plotting and data output functionality for libkinetics.Experiment. + """ def __init__(self, experiment, logger): self.exp = experiment @@ -181,9 +186,14 @@ def parse_arguments(): def initialize_logger(): """ - Initialization of logging subsystem. Two logging handlers are brought up: - 'fh' which logs to a log file and 'ch' which logs to standard output. - :return logger: returns a logger instance + Initialization of logging subsystem. + + Two logging handlers are brought up: 'fh' which logs to a log file and + 'ch' which logs to standard output. If colorlog is installed, logging + to console will be colored. + + Returns: + logger: logging.Logger instance """ if COLORED_LOG: fmt = '%(log_color)s%(levelname)-8s%(reset)s %(message)s' @@ -227,6 +237,11 @@ def initialize_logger(): def main(): + """ + Main method of pyKinetics. + + Will be executed when analyze-cli.py is started from the command line. + """ # parse command line arguments args = parse_arguments() # initialize logger From 14ff2bd79e1c088bcf3a88c6baff1e1a6ab8b5d0 Mon Sep 17 00:00:00 2001 From: Alexander Minges Date: Thu, 27 Aug 2015 18:21:04 +0200 Subject: [PATCH 6/6] Improve documentation --- libkinetics/__init__.py | 54 +++++++++++++++++++++++++++++++++-------- 1 file changed, 44 insertions(+), 10 deletions(-) diff --git a/libkinetics/__init__.py b/libkinetics/__init__.py index e553fce..06e84dc 100644 --- a/libkinetics/__init__.py +++ b/libkinetics/__init__.py @@ -17,7 +17,6 @@ except ImportError: class Error(Exception): - """ Main Error class derived from Exception. """ @@ -25,7 +24,6 @@ class Error(Exception): class FitError(Error): - """ Exception raised if fitting fails. """ @@ -33,9 +31,21 @@ class FitError(Error): class Replicate(): - """ - Represents a single replicate within a measurement + Represents a single replicate within a measurement. + + Linear regression for v0 is executed at this level. + + Attributes: + logger: logging.Logger instance inherited by the owning Measurement. + num: float + identification number of replicate within the experiment + x, y: float + time and signal to be analysed. + owner: object + measurement this measurement belongs to + xlim: + fitresult: """ def __init__(self, num, xy, owner): @@ -92,9 +102,28 @@ class Replicate(): class Measurement(): - """ Represents a single measurement within an experiment. + + Each measurement consists of one ore more replicates and is associated + with a specific substrate concentration. + + Attributes: + logger: logging.Logger instance inherited by the owning Experiment. + concentration: float + substrate concentration associated with the measurement. + concentration_unit: string + unit of the concentration; only used for labeling plots/tables. + x, y: float + time and signal to be analysed. + replicates: array_like + list of individual replicates of the measurement. + owner: object + experiment this measurement belongs to + xlim: array_like + lower and upper bounds for calculating the v0 linear fit. + avg_slope, avg_slope_err: float + average slope (v0) of the measurement and its standard deviation """ def __init__(self, xy, conc, conc_unit, owner): @@ -131,18 +160,23 @@ class Measurement(): self.logger.info('-----') def get_results(self): + """ + Collect results of the individual replicates. + + Collects results of each replicate and append to results list. + + Returns: + results: array_like + list of results from each replicate of the measurement. + """ results = [] for r in self.replicates: results.append(r.fitresult) return results - def get_concentration(self): - return self.concentration - class Experiment(): - """ Represents the actual experiment. @@ -373,7 +407,7 @@ class Experiment(): self.raw_kinetic_data['y']) except ValueError: msg = ('Calculation of Hill kinetics failed! Your input data ' - '(either x or y) contain empty (NaN) values!') + '(either x or y) contains empty (NaN) values!') if self.logger: self.logger.error('{}'.format(msg)) raise FitError(msg)