From f6142f7456ac6099f374347a8ee477e5ace5dea2 Mon Sep 17 00:00:00 2001
From: Cameron Davidson-Pilon <cam.davidson.pilon@gmail.com>
Date: Wed, 13 Feb 2019 21:59:01 -0500
Subject: [PATCH] V0.18.6 (#635)

* v0.18.6

* some perf improvements to median survival function calculations

* lint

* change log

* bump version

* lint
---
 CHANGELOG.md                                  |  20 +-
 docs/Changelog.rst                            | 857 ++++++++++++++++++
 docs/References.rst                           |  15 +
 docs/Survival Regression.rst                  |   2 +-
 docs/Survival analysis with lifelines.rst     |  28 +-
 docs/conf.py                                  |  21 +-
 docs/index.rst                                |   3 +
 docs/lifelines.datasets.rst                   |  18 +-
 docs/lifelines.fitters.rst                    |  33 +-
 docs/lifelines.plotting.rst                   |   8 +
 docs/lifelines.rst                            |  54 +-
 docs/lifelines.utils.rst                      |  35 +-
 docs/modules.rst                              |   7 -
 lifelines/datasets/__init__.py                | 534 ++++++-----
 lifelines/fitters/__init__.py                 |  88 +-
 lifelines/fitters/aalen_johansen_fitter.py    |  18 +-
 .../breslow_fleming_harrington_fitter.py      |   7 +-
 lifelines/fitters/cox_time_varying_fitter.py  |   7 +-
 lifelines/fitters/coxph_fitter.py             |  79 +-
 lifelines/fitters/exponential_fitter.py       |  10 +-
 lifelines/fitters/kaplan_meier_fitter.py      |   2 +-
 lifelines/fitters/log_logistic_fitter.py      |  12 +-
 lifelines/fitters/log_normal_fitter.py        |  13 +-
 lifelines/fitters/nelson_aalen_fitter.py      |  15 +-
 .../fitters/piecewise_exponential_fitter.py   |   8 +-
 lifelines/fitters/weibull_fitter.py           |   8 +-
 lifelines/plotting.py                         |  66 +-
 lifelines/statistics.py                       |  14 +-
 lifelines/utils/__init__.py                   |  97 +-
 lifelines/utils/concordance.py                |  10 +-
 lifelines/version.py                          |   2 +-
 perf_tests/cp_perf_test.py                    |   4 +-
 tests/test_estimation.py                      |  10 +-
 tests/test_statistics.py                      |  33 +
 34 files changed, 1580 insertions(+), 558 deletions(-)
 create mode 100644 docs/Changelog.rst
 create mode 100644 docs/References.rst
 create mode 100644 docs/lifelines.plotting.rst
 delete mode 100644 docs/modules.rst

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 74d224d20..99227fd07 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,23 +1,27 @@
-### Changelogs
+### Changelog
 
-### 0.18.5
+#### 0.18.6
+ - some improvements to the output of `check_assumptions`. `show_plots` is turned to `False` by default now. It only shows `rank` and `km` p-values now.
+ - some performance improvements to `qth_survival_time`.
+
+#### 0.18.5
  - added new plotting methods to parametric univariate models: `plot_survival_function`, `plot_hazard` and `plot_cumulative_hazard`. The last one is an alias for `plot`.
  - added new properties to parametric univarite models: `confidence_interval_survival_function_`, `confidence_interval_hazard_`, `confidence_interval_cumulative_hazard_`. The last one is an alias for `confidence_interval_`.
  - Fixed some overflow issues with `AalenJohansenFitter`'s variance calculations when using large datasets.
  - Fixed an edgecase in `AalenJohansenFitter` that causing some datasets with to be jittered too often.
  - Add a new kwarg to  `AalenJohansenFitter`, `calculate_variance` that can be used to turn off variance calculations since this can take a long time for large datasets. Thanks @pzivich!
 
-### 0.18.4
+#### 0.18.4
  - fixed confidence intervals in cumulative hazards for parametric univarite models. They were previously 
    serverly depressed. 
  - adding left-truncation support to parametric univarite models with the `entry` kwarg in `.fit`
 
-### 0.18.3 
+#### 0.18.3 
  - Some performance improvements to parametric univariate models.
  - Suppressing some irrelevant NumPy and autograd warnings, so lifeline warnings are more noticeable. 
  - Improved some warning and error messages. 
 
-### 0.18.2
+#### 0.18.2
  - New univariate fitter `PiecewiseExponentialFitter` for creating a stepwise hazard model. See docs online.
  - Ability to create novel parametric univariate models using the new `ParametericUnivariateFitter` super class. See docs online for how to do this. 
  - Unfortunately, parametric univariate fitters are not serializable with `pickle`. The library `dill` is still useable. 
@@ -25,13 +29,13 @@
  - `LogNormalFitter` no longer models `log_sigma`.
 
 
-### 0.18.1
+#### 0.18.1
  - bug fixes in `LogNormalFitter` variance estimates
  - improve convergence of `LogNormalFitter`. We now model the log of sigma internally, but still expose sigma externally. 
  - use the `autograd` lib to help with gradients.
  - New `LogLogisticFitter` univariate fitter available. 
 
-### 0.18.0
+#### 0.18.0
  - `LogNormalFitter` is a new univariate fitter you can use.
  - `WeibullFitter` now correctly returns the confidence intervals (previously returned only NaNs)
  - `WeibullFitter.print_summary()` displays p-values associated with its parameters not equal to 1.0 - previously this was (implicitly) comparing against 0, which is trivially always true (the parameters must be greater than 0)
@@ -45,7 +49,7 @@
  - new warning message when Cox models detects possible non-unique solutions to maximum likelihood. 
  - Generally: clean up lifelines exception handling. Ex: catch `LinAlgError: Matrix is singular.` and report back to the user advice. 
 
-### 0.17.5
+#### 0.17.5
  - more bugs in `plot_covariate_groups` fixed when using non-numeric strata.
 
 #### 0.17.4
diff --git a/docs/Changelog.rst b/docs/Changelog.rst
new file mode 100644
index 000000000..8532377ae
--- /dev/null
+++ b/docs/Changelog.rst
@@ -0,0 +1,857 @@
+Changelog
+~~~~~~~~~
+
+0.18.6
+^^^^^^
+
+-  some improvements to the output of ``check_assumptions``.
+   ``show_plots`` is turned to ``False`` by default now. It only shows
+   ``rank`` and ``km`` p-values now.
+-  some performance improvements to ``qth_survival_time``.
+
+.. _section-1:
+
+0.18.5
+^^^^^^
+
+-  added new plotting methods to parametric univariate models:
+   ``plot_survival_function``, ``plot_hazard`` and
+   ``plot_cumulative_hazard``. The last one is an alias for ``plot``.
+-  added new properties to parametric univariate models:
+   ``confidence_interval_survival_function_``,
+   ``confidence_interval_hazard_``,
+   ``confidence_interval_cumulative_hazard_``. The last one is an alias
+   for ``confidence_interval_``.
+-  Fixed some overflow issues with ``AalenJohansenFitter``\ ’s variance
+   calculations when using large datasets.
+-  Fixed an edge case in ``AalenJohansenFitter`` that was causing some
+   datasets to be jittered too often.
+-  Add a new kwarg to ``AalenJohansenFitter``, ``calculate_variance``
+   that can be used to turn off variance calculations since this can
+   take a long time for large datasets. Thanks @pzivich!
+
+.. _section-2:
+
+0.18.4
+^^^^^^
+
+-  fixed confidence intervals in cumulative hazards for parametric
+   univariate models. They were previously severely depressed.
+-  adding left-truncation support to parametric univariate models with
+   the ``entry`` kwarg in ``.fit``
+
+.. _section-3:
+
+0.18.3
+^^^^^^
+
+-  Some performance improvements to parametric univariate models.
+-  Suppressing some irrelevant NumPy and autograd warnings, so lifeline
+   warnings are more noticeable.
+-  Improved some warning and error messages.
+
+.. _section-4:
+
+0.18.2
+^^^^^^
+
+-  New univariate fitter ``PiecewiseExponentialFitter`` for creating a
+   stepwise hazard model. See docs online.
+-  Ability to create novel parametric univariate models using the new
+   ``ParametericUnivariateFitter`` super class. See docs online for how
+   to do this.
+-  Unfortunately, parametric univariate fitters are not serializable
+   with ``pickle``. The library ``dill`` is still useable.
+-  Complete overhaul of all internals for parametric univariate fitters.
+   Moved them all (most) to use ``autograd``.
+-  ``LogNormalFitter`` no longer models ``log_sigma``.
+
+.. _section-5:
+
+0.18.1
+^^^^^^
+
+-  bug fixes in ``LogNormalFitter`` variance estimates
+-  improve convergence of ``LogNormalFitter``. We now model the log of
+   sigma internally, but still expose sigma externally.
+-  use the ``autograd`` lib to help with gradients.
+-  New ``LogLogisticFitter`` univariate fitter available.
+
+.. _section-6:
+
+0.18.0
+^^^^^^
+
+-  ``LogNormalFitter`` is a new univariate fitter you can use.
+-  ``WeibullFitter`` now correctly returns the confidence intervals
+   (previously returned only NaNs)
+-  ``WeibullFitter.print_summary()`` displays p-values associated with
+   its parameters not equal to 1.0 - previously this was (implicitly)
+   comparing against 0, which is trivially always true (the parameters
+   must be greater than 0)
+-  ``ExponentialFitter.print_summary()`` displays p-values associated
+   with its parameters not equal to 1.0 - previously this was
+   (implicitly) comparing against 0, which is trivially always true (the
+   parameters must be greater than 0)
+-  ``ExponentialFitter.plot`` now displays the cumulative hazard,
+   instead of the survival function. This is to make it easier to
+   compare to ``WeibullFitter`` and ``LogNormalFitter``
+-  Univariate fitters’ ``cumulative_hazard_at_times``,
+   ``hazard_at_times``, ``survival_function_at_times`` return pandas
+   Series now (used to be numpy arrays)
+-  remove ``alpha`` keyword from all statistical functions. This was
+   never being used.
+-  Gone are asterisks and dots in ``print_summary`` functions that
+   represent significance thresholds.
+-  In models’ ``summary`` (including ``print_summary``), the ``log(p)``
+   term has changed to ``-log2(p)``. This is known as the s-value. See
+   https://lesslikely.com/statistics/s-values/
+-  introduce new statistical tests between univariate datasets:
+   ``survival_difference_at_fixed_point_in_time_test``,…
+-  new warning message when Cox models detects possible non-unique
+   solutions to maximum likelihood.
+-  Generally: clean up lifelines exception handling. Ex: catch
+   ``LinAlgError: Matrix is singular.`` and report back to the user
+   advice.
+
+.. _section-7:
+
+0.17.5
+^^^^^^
+
+-  more bugs in ``plot_covariate_groups`` fixed when using non-numeric
+   strata.
+
+.. _section-8:
+
+0.17.4
+^^^^^^
+
+-  Fix bug in ``plot_covariate_groups`` that wasn’t allowing for strata
+   to be used.
+-  change name of ``multicenter_aids_cohort_study`` to
+   ``load_multicenter_aids_cohort_study``
+-  ``groups`` is now called ``values`` in
+   ``CoxPHFitter.plot_covariate_groups``
+
+.. _section-9:
+
+0.17.3
+^^^^^^
+
+-  Fix in ``compute_residuals`` when using ``schoenfeld`` and the
+   minimum duration has only censored subjects.
+
+.. _section-10:
+
+0.17.2
+^^^^^^
+
+-  Another round of serious performance improvements for the Cox models.
+   Up to 2x faster for CoxPHFitter and CoxTimeVaryingFitter. This was
+   mostly the result of using NumPy’s ``einsum`` to simplify a previous
+   ``for`` loop. The downside is the code is more esoteric now. I’ve
+   added comments as necessary though 🤞
+
+.. _section-11:
+
+0.17.1
+^^^^^^
+
+-  adding bottleneck as a dependency. This library is highly-recommended
+   by Pandas, and in lifelines we see some nice performance improvements
+   with it too. (~15% for ``CoxPHFitter``)
+-  There was a small bug in ``CoxPHFitter`` when using ``batch_mode``
+   that was causing coefficients to deviate from their MLE value. This
+   bug eluded tests, which means that its discrepancy was less than
+   0.0001 difference. It’s fixed now, and even more accurate tests are
+   added.
+-  Faster ``CoxPHFitter._compute_likelihood_ratio_test()``
+-  Fixes a Pandas performance warning in ``CoxTimeVaryingFitter``.
+-  Performances improvements to ``CoxTimeVaryingFitter``.
+
+.. _section-12:
+
+0.17.0
+^^^^^^
+
+-  corrected behaviour in ``CoxPHFitter`` where ``score_`` was not being
+   refreshed on every new ``fit``.
+-  Reimplementation of ``AalenAdditiveFitter``. There were significant
+   changes to it:
+
+   -  implementation is at least 10x faster, and possibly up to 100x
+      faster for some datasets.
+   -  memory consumption is way down
+   -  removed the time-varying component from ``AalenAdditiveFitter``.
+      This will return in a future release.
+   -  new ``print_summary``
+   -  ``weights_col`` is added
+   -  ``nn_cumulative_hazard`` is removed (may add back)
+
+-  some plotting improvements to ``plotting.plot_lifetimes``
+
+.. _section-13:
+
+0.16.3
+^^^^^^
+
+-  More ``CoxPHFitter`` performance improvements. Up to a 40% reduction
+   vs 0.16.2 for some datasets.
+
+.. _section-14:
+
+0.16.2
+^^^^^^
+
+-  Fixed ``CoxTimeVaryingFitter`` to allow more than one variable to be
+   stratified
+-  Significant performance improvements for ``CoxPHFitter`` when the dataset
+   has lots of duplicate times. See
+   https://github.com/CamDavidsonPilon/lifelines/issues/591
+
+.. _section-15:
+
+0.16.1
+^^^^^^
+
+-  Fixed py2 division error in ``concordance`` method.
+
+.. _section-16:
+
+0.16.0
+^^^^^^
+
+-  Drop Python 3.4 support.
+-  introduction of residual calculations in
+   ``CoxPHFitter.compute_residuals``. Residuals include “schoenfeld”,
+   “score”, “delta_beta”, “deviance”, “martingale”, and
+   “scaled_schoenfeld”.
+-  removes ``estimation`` namespace for fitters. Should be using
+   ``from lifelines import xFitter`` now. Thanks @usmanatron
+-  removes ``predict_log_hazard_relative_to_mean`` from Cox model.
+   Thanks @usmanatron
+-  ``StatisticalResult`` has been generalized to allow for multiple
+   results (ex: from pairwise comparisons). This means a slightly
+   changed API that is mostly backwards compatible. See doc string for
+   how to use it.
+-  ``statistics.pairwise_logrank_test`` now returns a
+   ``StatisticalResult`` object instead of a nasty NxN DataFrame 💗
+-  Display log(p-values) as well as p-values in ``print_summary``. Also,
+   p-values below thresholds will be truncated. The original p-values are
+   still recoverable using ``.summary``.
+-  Floats in ``print_summary`` are now displayed to 2 decimal points. This
+   can be changed using the ``decimal`` kwarg.
+-  removed ``standardized`` from ``Cox`` model plotting. It was
+   confusing.
+-  visual improvements to Cox models ``.plot``
+-  ``print_summary`` methods accepts kwargs to also be displayed.
+-  ``CoxPHFitter`` has a new human-readable method,
+   ``check_assumptions``, to check the assumptions of your Cox
+   proportional hazard model.
+-  A new helper util to “expand” static datasets into long-form:
+   ``lifelines.utils.to_episodic_format``.
+-  ``CoxTimeVaryingFitter`` now accepts ``strata``.
+
+.. _section-17:
+
+0.15.4
+^^^^^^
+
+-  bug fix for the Cox model likelihood ratio test when using
+   non-trivial weights.
+
+.. _section-18:
+
+0.15.3
+^^^^^^
+
+-  Only allow matplotlib less than 3.0.
+
+.. _section-19:
+
+0.15.2
+^^^^^^
+
+-  API changes to ``plotting.plot_lifetimes``
+-  ``cluster_col`` and ``strata`` can be used together in
+   ``CoxPHFitter``
+-  removed ``entry`` from ``ExponentialFitter`` and ``WeibullFitter`` as
+   it was doing nothing.
+
+.. _section-20:
+
+0.15.1
+^^^^^^
+
+-  Bug fixes for v0.15.0
+-  Raise NotImplementedError if the ``robust`` flag is used in
+   ``CoxTimeVaryingFitter`` - that’s not ready yet.
+
+.. _section-21:
+
+0.15.0
+^^^^^^
+
+-  adding ``robust`` params to ``CoxPHFitter``\ ’s ``fit``. This enables
+   at least i) using non-integer weights in the model (these could be
+   sampling weights like IPTW), and ii) mis-specified models (ex:
+   non-proportional hazards). Under the hood it’s a sandwich estimator.
+   This does not handle ties, so if there are high number of ties,
+   results may significantly differ from other software.
+-  ``standard_errors_`` is now a property on fitted ``CoxPHFitter``
+   which describes the standard errors of the coefficients.
+-  ``variance_matrix_`` is now a property on fitted ``CoxPHFitter``
+   which describes the variance matrix of the coefficients.
+-  new criteria for convergence of ``CoxPHFitter`` and
+   ``CoxTimeVaryingFitter`` called the Newton-decrement. Tests show it
+   is as accurate (w.r.t. previous coefficients) and typically shaves
+   off a single step, resulting in generally faster convergence. See
+   https://www.cs.cmu.edu/~pradeepr/convexopt/Lecture_Slides/Newton_methods.pdf.
+   Details about the Newton-decrement are added to the ``show_progress``
+   statements.
+-  Minimum support for scipy is 1.0
+-  Convergence errors in models that use Newton-Raphson methods now
+   throw a ``ConvergenceError``, instead of a ``ValueError`` (the former
+   is a subclass of the latter, however).
+-  ``AalenAdditiveModel`` raises ``ConvergenceWarning`` instead of
+   printing a warning.
+-  ``KaplanMeierFitter`` now has a cumulative plot option. Example
+   ``kmf.plot(invert_y_axis=True)``
+-  a ``weights_col`` option has been added to ``CoxTimeVaryingFitter``
+   that allows for time-varying weights.
+-  ``WeibullFitter`` has a new ``show_progress`` param and additional
+   information if the convergence fails.
+-  ``CoxPHFitter``, ``ExponentialFitter``, ``WeibullFitter`` and
+   ``CoxTimeVaryingFitter`` method ``print_summary`` is updated with new
+   fields.
+-  ``WeibullFitter`` has renamed the incorrect ``_jacobian`` to
+   ``_hessian_``.
+-  ``variance_matrix_`` is now a property on fitted ``WeibullFitter``
+   which describes the variance matrix of the parameters.
+-  The default ``WeibullFitter().timeline`` has changed from integers
+   between the min and max duration to *n* floats between the max and
+   min durations, where *n* is the number of observations.
+-  Performance improvements for ``CoxPHFitter`` (~20% faster)
+-  Performance improvements for ``CoxTimeVaryingFitter`` (~100% faster)
+-  In Python3, Univariate models are now serialisable with ``pickle``.
+   Thanks @dwilson1988 for the contribution. For Python2, ``dill`` is
+   still the preferred method.
+-  ``baseline_cumulative_hazard_`` (and derivatives of that) on
+   ``CoxPHFitter`` now correctly incorporate the ``weights_col``.
+-  Fixed a bug in ``KaplanMeierFitter`` when late entry times lined up
+   with death events. Thanks @pzivich
+-  Adding ``cluster_col`` argument to ``CoxPHFitter`` so users can
+   specify groups of subjects/rows that may be correlated.
+-  Shifting the “significance codes” for p-values down an order of
+   magnitude. (Example, p-values between 0.1 and 0.05 are not noted at
+   all and p-values between 0.05 and 0.1 are noted with ``.``, etc.).
+   This deviates with how they are presented in other software. There is
+   an argument to be made to remove p-values from lifelines altogether
+   (*become the changes you want to see in the world* lol), but I worry
+   that people could compute the p-values by hand incorrectly, a worse
+   outcome I think. So, this is my stance. P-values between 0.1 and 0.05
+   offer *very* little information, so they are removed. There is a
+   growing movement in statistics to shift “significant” findings to
+   p-values less than 0.01 anyways.
+-  New fitter for cumulative incidence of multiple risks
+   ``AalenJohansenFitter``. Thanks @pzivich! See “Methodologic Issues
+   When Estimating Risks in Pharmacoepidemiology” for a nice overview of
+   the model.
+
+.. _section-22:
+
+0.14.6
+^^^^^^
+
+-  fix for n > 2 groups in ``multivariate_logrank_test`` (again).
+-  fix bug for when ``event_observed`` column was not boolean.
+
+.. _section-23:
+
+0.14.5
+^^^^^^
+
+-  fix for n > 2 groups in ``multivariate_logrank_test``
+-  fix weights in KaplanMeierFitter when using a pandas Series.
+
+.. _section-24:
+
+0.14.4
+^^^^^^
+
+-  Adds ``baseline_cumulative_hazard_`` and ``baseline_survival_`` to
+   ``CoxTimeVaryingFitter``. Because of this, new prediction methods are
+   available.
+-  fixed a bug in ``add_covariate_to_timeline`` when using
+   ``cumulative_sum`` with multiple columns.
+-  Added ``Likelihood ratio test`` to ``CoxPHFitter.print_summary`` and
+   ``CoxTimeVaryingFitter.print_summary``
+-  New checks in ``CoxTimeVaryingFitter`` that check for immediate
+   deaths and redundant rows.
+-  New ``delay`` parameter in ``add_covariate_to_timeline``
+-  removed ``two_sided_z_test`` from ``statistics``
+
+.. _section-25:
+
+0.14.3
+^^^^^^
+
+-  fixes a bug when subtracting or dividing two ``UnivariateFitters``
+   with labels.
+-  fixes an import error with using ``CoxTimeVaryingFitter`` predict
+   methods.
+-  adds a ``column`` argument to ``CoxTimeVaryingFitter`` and
+   ``CoxPHFitter`` ``plot`` method to plot only a subset of columns.
+
+.. _section-26:
+
+0.14.2
+^^^^^^
+
+-  some quality of life improvements for working with
+   ``CoxTimeVaryingFitter`` including new ``predict_`` methods.
+
+.. _section-27:
+
+0.14.1
+^^^^^^
+
+-  fixed bug with using weights and strata in ``CoxPHFitter``
+-  fixed bug in using non-integer weights in ``KaplanMeierFitter``
+-  Performance optimizations in ``CoxPHFitter`` for up to 40% faster
+   completion of ``fit``.
+
+   -  even smarter ``step_size`` calculations for iterative
+      optimizations.
+   -  simple code optimizations & cleanup in specific hot spots.
+
+-  Performance optimizations in ``AalenAdditiveFitter`` for up to 50%
+   faster completion of ``fit`` for large dataframes, and up to 10%
+   faster for small dataframes.
+
+.. _section-28:
+
+0.14.0
+^^^^^^
+
+-  adding ``plot_covariate_groups`` to ``CoxPHFitter`` to visualize what
+   happens to survival as we vary a covariate, all else being equal.
+-  ``utils`` functions like ``qth_survival_times`` and
+   ``median_survival_times`` now return the transpose of the DataFrame
+   compared to previous version of lifelines. The reason for this is
+   that we often treat survival curves as columns in DataFrames, and
+   functions of the survival curve as index (ex:
+   KaplanMeierFitter.survival_function\_ returns a survival curve *at*
+   time *t*).
+-  ``KaplanMeierFitter.fit`` and ``NelsonAalenFitter.fit`` accept a
+   ``weights`` vector that can be used for pre-aggregated datasets. See
+   this
+   `issue <https://github.com/CamDavidsonPilon/lifelines/issues/396>`__.
+-  Convergence errors now return a custom ``ConvergenceWarning`` instead
+   of a ``RuntimeWarning``
+-  New checks for complete separation in the dataset for regressions.
+
+.. _section-29:
+
+0.13.0
+^^^^^^
+
+-  removes ``is_significant`` and ``test_result`` from
+   ``StatisticalResult``. Users can instead choose their significance
+   level by comparing to ``p_value``. The string representation of this
+   class has changed as well.
+-  ``CoxPHFitter`` and ``AalenAdditiveFitter`` now have a ``score_``
+   property that is the concordance-index of the dataset to the fitted
+   model.
+-  ``CoxPHFitter`` and ``AalenAdditiveFitter`` no longer have the
+   ``data`` property. It was an *almost* duplicate of the training data,
+   but was causing the model to be very large when serialized.
+-  Implements a new fitter ``CoxTimeVaryingFitter`` available under the
+   ``lifelines`` namespace. This model implements the Cox model for
+   time-varying covariates.
+-  Utils for creating time varying datasets available in ``utils``.
+-  less noisy check for complete separation.
+-  removed ``datasets`` namespace from the main ``lifelines`` namespace
+-  ``CoxPHFitter`` has a slightly more intelligent (barely…) way to pick
+   a step size, so convergence should generally be faster.
+-  ``CoxPHFitter.fit`` now accepts a ``weight_col`` kwarg so one can
+   pass in weights per observation. This is very useful if you have many
+   subjects, and the space of covariates is not large. Thus you can
+   group the same subjects together and give that observation a weight
+   equal to the count. Altogether, this means a much faster regression.
+
+.. _section-30:
+
+0.12.0
+^^^^^^
+
+-  removes ``include_likelihood`` from ``CoxPHFitter.fit`` - it was not
+   slowing things down much (empirically), and often I wanted it for
+   debugging (I suppose others do too). It’s also another exit
+   condition, so we may exit from the NR iterations faster.
+-  added ``step_size`` param to ``CoxPHFitter.fit`` - the default is
+   good, but for extremely large or small datasets this may want to be
+   set manually.
+-  added a warning to ``CoxPHFitter`` to check for complete separation:
+   https://stats.idre.ucla.edu/other/mult-pkg/faq/general/faqwhat-is-complete-or-quasi-complete-separation-in-logisticprobit-regression-and-how-do-we-deal-with-them/
+-  Additional functionality to ``utils.survival_table_from_events`` to
+   bin the index to make the resulting table more readable.
+
+.. _section-31:
+
+0.11.3
+^^^^^^
+
+-  No longer support matplotlib 1.X
+-  Adding ``times`` argument to ``CoxPHFitter``\ ’s
+   ``predict_survival_function`` and ``predict_cumulative_hazard`` to
+   predict the estimates at, instead of using the default times of
+   observation or censorship.
+-  More accurate prediction methods for parametric univariate models.
+
+.. _section-32:
+
+0.11.2
+^^^^^^
+
+-  Changing license to vanilla MIT.
+-  Speed up ``NelsonAalenFitter.fit`` considerably.
+
+.. _section-33:
+
+0.11.1
+^^^^^^
+
+-  Python3 fix for ``CoxPHFitter.plot``.
+
+.. _section-34:
+
+0.11.0
+^^^^^^
+
+-  fixes regression in ``KaplanMeierFitter.plot`` when using Seaborn and
+   lifelines.
+-  introduce a new ``.plot`` function to a fitted ``CoxPHFitter``
+   instance. This plots the hazard coefficients and their confidence
+   intervals.
+-  in all plot methods, the ``ix`` kwarg has been deprecated in favour
+   of a new ``loc`` kwarg. This is to align with Pandas deprecating
+   ``ix``
+
+.. _section-35:
+
+0.10.1
+^^^^^^
+
+-  fix in internal normalization for ``CoxPHFitter`` predict methods.
+
+.. _section-36:
+
+0.10.0
+^^^^^^
+
+-  corrected bug that was returning the wrong baseline survival and
+   hazard values in ``CoxPHFitter`` when ``normalize=True``.
+-  removed ``normalize`` kwarg in ``CoxPHFitter``. This was causing lots
+   of confusion for users, and added code complexity. It’s really nice
+   to be able to remove it.
+-  correcting column name in ``CoxPHFitter.baseline_survival_``
+-  ``CoxPHFitter.baseline_cumulative_hazard_`` is always centered, to
+   mimic R’s ``basehaz`` API.
+-  new ``predict_log_partial_hazards`` to ``CoxPHFitter``
+
+.. _section-37:
+
+0.9.4
+^^^^^
+
+-  adding ``plot_loglogs`` to ``KaplanMeierFitter``
+-  added a (correct) check to see if some columns in a dataset will
+   cause convergence problems.
+-  removing ``flat`` argument in ``plot`` methods. It was causing
+   confusion. To replicate it, one can set ``ci_force_lines=True`` and
+   ``show_censors=True``.
+-  adding ``strata`` keyword argument to ``CoxPHFitter`` on
+   initialization (ex: ``CoxPHFitter(strata=['v1', 'v2'])``). Why?
+   Fitters initialized with ``strata`` can now be passed into
+   ``k_fold_cross_validation``, plus it makes unit testing ``strata``
+   fitters easier.
+-  If using ``strata`` in ``CoxPHFitter``, access to strata specific
+   baseline hazards and survival functions are available (previously it
+   was a blended value). Prediction also uses the specific baseline
+   hazards/survivals.
+-  performance improvements in ``CoxPHFitter`` - should see at least a
+   10% speed improvement in ``fit``.
+
+.. _section-38:
+
+0.9.2
+^^^^^
+
+-  deprecates Pandas versions before 0.18.
+-  throw an error if no admissible pairs in the c-index calculation.
+   Previously a NaN was returned.
+
+.. _section-39:
+
+0.9.1
+^^^^^
+
+-  add two summary functions to Weibull and Exponential fitter, solves
+   #224
+
+.. _section-40:
+
+0.9.0
+^^^^^
+
+-  new prediction function in ``CoxPHFitter``,
+   ``predict_log_hazard_relative_to_mean``, that mimics what R’s
+   ``predict.coxph`` does.
+-  removing the ``predict`` method in CoxPHFitter and
+   AalenAdditiveFitter. This is because the choice of ``predict_median``
+   as a default was causing too much confusion, and no other natural
+   choice as a default was available. All other ``predict_`` methods
+   remain.
+-  Default predict method in ``k_fold_cross_validation`` is now
+   ``predict_expectation``
+
+.. _section-41:
+
+0.8.1
+^^^^^
+
+-  supports matplotlib 1.5.
+-  introduction of a param ``nn_cumulative_hazards`` in
+   AalenAdditiveModel’s ``__init__`` (default True). This parameter will
+   truncate all negative cumulative hazards in prediction methods to
+   0.
+-  bug fixes including:
+
+   -  fixed issue where the while loop in ``_newton_rhaphson`` would
+      break too early causing a variable not to be set properly.
+   -  scaling of smooth hazards in NelsonAalenFitter was off by a factor
+      of 0.5.
+
+.. _section-42:
+
+0.8.0
+^^^^^
+
+-  reorganized lifelines directories:
+
+   -  moved test files out of main directory.
+   -  moved ``utils.py`` into its own directory.
+   -  moved all estimators to the ``fitters`` directory.
+
+-  added a ``at_risk`` column to the output of
+   ``group_survival_table_from_events`` and
+   ``survival_table_from_events``
+-  added sample size and power calculations for statistical tests. See
+   ``lifelines.statistics.sample_size_necessary_under_cph`` and
+   ``lifelines.statistics.power_under_cph``.
+-  fixed a bug when using KaplanMeierFitter for left-censored data.
+
+.. _section-43:
+
+0.7.1
+^^^^^
+
+-  addition of a l2 ``penalizer`` to ``CoxPHFitter``.
+-  dropped Fortran implementation in favour of an efficient Python version. Lifelines
+   is pure python once again!
+-  addition of ``strata`` keyword argument to ``CoxPHFitter`` to allow
+   for stratification of a single or set of categorical variables in
+   your dataset.
+-  ``datetimes_to_durations`` now accepts a list as ``na_values``, so
+   multiple values can be checked.
+-  fixed a bug in ``datetimes_to_durations`` where ``fill_date`` was not
+   properly being applied.
+-  Changed warning in ``datetimes_to_durations`` to be correct.
+-  refactor each fitter into its own submodule. For now, the tests are
+   still in the same file. This will also *not* break the API.
+
+.. _section-44:
+
+0.7.0
+^^^^^
+
+-  allow for multiple fitters to be passed into
+   ``k_fold_cross_validation``.
+-  statistical tests in ``lifelines.statistics`` now return a
+   ``StatisticalResult`` object with properties like ``p_value``,
+   ``test_results``, and ``summary``.
+-  fixed a bug in how log-rank statistical tests are performed. The
+   covariance matrix was not being correctly calculated. This resulted
+   in slightly different p-values.
+-  ``WeibullFitter``, ``ExponentialFitter``, ``KaplanMeierFitter`` and
+   ``BreslowFlemingHarringtonFitter`` all have a
+   ``conditional_time_to_event_`` property that measures the median
+   duration remaining until the death event, given survival up until
+   time t.
+
+.. _section-45:
+
+0.6.1
+^^^^^
+
+-  addition of ``median_`` property to ``WeibullFitter`` and
+   ``ExponentialFitter``.
+-  ``WeibullFitter`` and ``ExponentialFitter`` will use integer
+   timelines instead of float provided by ``linspace``. This is so if
+   your work is to sum up the survival function (for expected values or
+   something similar), it’s more difficult to make a mistake.
+
+.. _section-46:
+
+0.6.0
+^^^^^
+
+-  Inclusion of the univariate fitters ``WeibullFitter`` and
+   ``ExponentialFitter``.
+-  Removing ``BayesianFitter`` from lifelines.
+-  Added new penalization scheme to AalenAdditiveFitter. You can now add
+   a smoothing penalizer that will try to keep subsequent values of a
+   hazard curve close together. The penalizing coefficient is
+   ``smoothing_penalizer``.
+-  Changed ``penalizer`` keyword arg to ``coef_penalizer`` in
+   AalenAdditiveFitter.
+-  new ``ridge_regression`` function in ``utils.py`` to perform linear
+   regression with l2 penalizer terms.
+-  Matplotlib is no longer a mandatory dependency.
+-  ``.predict(time)`` method on univariate fitters can now accept a
+   scalar (and returns a scalar) and an iterable (and returns a numpy
+   array)
+-  In ``KaplanMeierFitter``, ``epsilon`` has been renamed to
+   ``precision``.
+
+.. _section-47:
+
+0.5.1
+^^^^^
+
+-  New API for ``CoxPHFitter`` and ``AalenAdditiveFitter``: the default
+   arguments for ``event_col`` and ``duration_col``. ``duration_col`` is
+   now mandatory, and ``event_col`` now accepts a column, or by default,
+   ``None``, which assumes all events are observed (non-censored).
+-  Fix statistical tests.
+-  Allow negative durations in Fitters.
+-  New API in ``survival_table_from_events``: ``min_observations`` is
+   replaced by ``birth_times`` (default ``None``).
+-  New API in ``CoxPHFitter`` for summary: ``summary`` will return a
+   dataframe with statistics, ``print_summary()`` will print the
+   dataframe (plus some other statistics) in a pretty manner.
+-  Adding “At Risk” counts option to univariate fitter ``plot`` methods,
+   ``.plot(at_risk_counts=True)``, and the function
+   ``lifelines.plotting.add_at_risk_counts``.
+-  Fix bug Epanechnikov kernel.
+
+.. _section-48:
+
+0.5.0
+^^^^^
+
+-  move testing to py.test
+-  refactor tests into smaller files
+-  make
+   ``test_pairwise_logrank_test_with_identical_data_returns_inconclusive``
+   a better test
+-  add test for summary()
+-  Alternate metrics can be used for ``k_fold_cross_validation``.
+
+.. _section-49:
+
+0.4.4
+^^^^^
+
+-  Lots of improvements to numerical stability (but some things
+   still need work)
+-  Additions to ``summary`` in CoxPHFitter.
+-  Make all prediction methods output a DataFrame
+-  Fixes bug in 1-d input not returning in CoxPHFitter
+-  Lots of new tests.
+
+.. _section-50:
+
+0.4.3
+^^^^^
+
+-  refactoring of ``qth_survival_times``: it can now accept an iterable
+   (or a scalar still) of probabilities in the q argument, and will
+   return a DataFrame with these as columns. If len(q)==1 and a single
+   survival function is given, will return a scalar, not a DataFrame.
+   Also some good speed improvements.
+-  KaplanMeierFitter and NelsonAalenFitter now have a ``_label``
+   property that is passed in during the fit.
+-  KaplanMeierFitter/NelsonAalenFitter’s initial ``alpha`` value is
+   overwritten if a new ``alpha`` value is passed in during the ``fit``.
+-  New method for KaplanMeierFitter: ``conditional_time_to``. This
+   returns a DataFrame of the estimate: med(S(t \| T>s)) - s, human
+   readable: the estimated time left of living, given an individual is
+   aged s.
+-  Adds option ``include_likelihood`` to CoxPHFitter fit method to save
+   the final log-likelihood value.
+
+.. _section-51:
+
+0.4.2
+^^^^^
+
+-  Massive speed improvements to CoxPHFitter.
+-  Additional prediction method: ``predict_percentile`` is available on
+   CoxPHFitter and AalenAdditiveFitter. Given a percentile, p, this
+   function returns the value t such that *S(t \| x) = p*. It is a
+   generalization of ``predict_median``.
+-  Additional kwargs in ``k_fold_cross_validation`` that will accept
+   different prediction methods (default is ``predict_median``).
+-  Bug fix in CoxPHFitter ``predict_expectation`` function.
+-  Correct spelling mistake in Newton-Raphson algorithm.
+-  ``datasets`` now contains functions for generating the respective
+   datasets, ex: ``generate_waltons_dataset``.
+-  Bumping up the number of samples in statistical tests to prevent them
+   from failing so often (this is a stop-gap)
+-  pep8 everything
+
+.. _section-52:
+
+0.4.1.1
+^^^^^^^
+
+-  Ability to specify default printing in statistical tests with the
+   ``suppress_print`` keyword argument (default False).
+-  For the multivariate log rank test, the inverse step has been
+   replaced with the generalized inverse. This seems to be what other
+   packages use.
+-  Adding more robust cross validation scheme based on issue #67.
+-  fixing ``regression_dataset`` in ``datasets``.
+
+.. _section-53:
+
+0.4.1
+^^^^^
+
+-  ``CoxFitter`` is now known as ``CoxPHFitter``
+-  refactoring some tests that used redundant data from
+   ``lifelines.datasets``.
+-  Adding cross validation: in ``utils`` is a new
+   ``k_fold_cross_validation`` for model selection in regression
+   problems.
+-  Change CoxPHFitter’s fit method’s ``display_output`` to ``False``.
+-  fixing bug in CoxPHFitter’s ``_compute_baseline_hazard`` that errored
+   when sending Series objects to ``survival_table_from_events``.
+-  CoxPHFitter’s ``fit`` now looks to columns with too low variance, and
+   halts NR algorithm if a NaN is found.
+-  Adding a Changelog.
+-  more sanitizing for the statistical tests =)
+
+.. _section-54:
+
+0.4.0
+^^^^^
+
+-  ``CoxFitter`` implements Cox Proportional Hazards model in lifelines.
+-  lifelines moves to wheels distributions.
+-  tests in the ``statistics`` module now print the summary (and still
+   return the regular values)
+-  new ``BaseFitter`` class is inherited by all fitters.
diff --git a/docs/References.rst b/docs/References.rst
new file mode 100644
index 000000000..b142d392e
--- /dev/null
+++ b/docs/References.rst
@@ -0,0 +1,15 @@
+*lifelines* reference
+======================
+
+.. toctree::
+
+    lifelines.fitters
+    lifelines.utils
+    lifelines.plotting
+    lifelines.datasets
+
+
+.. automodule:: lifelines
+    :members:
+    :undoc-members:
+    :show-inheritance:
diff --git a/docs/Survival Regression.rst b/docs/Survival Regression.rst
index 6095cdd21..90ac7e169 100644
--- a/docs/Survival Regression.rst	
+++ b/docs/Survival Regression.rst	
@@ -782,7 +782,7 @@ A fitted model's concordance-index is present in the ``print_summary()``, but al
 
     # method three
     from lifelines.utils import concordance_index
-    print(concordance_index(rossi['week'], -cph.predict_partial_hazard(rossi).values, rossi['arrest']))
+    concordance_index(rossi['week'], -cph.predict_partial_hazard(rossi), rossi['arrest'])
 
 
 However, there are other, arguably better, methods to measure the fit of a model. Included in ``print_summary`` is the log-likelihood, which can be used in an `AIC calculation <https://en.wikipedia.org/wiki/Akaike_information_criterion>`_, and the `log-likelihood ratio statistic <https://en.wikipedia.org/wiki/Likelihood-ratio_test>`_. Generally, I personally loved this article by Frank Harrell, `"Statistically Efficient Ways to Quantify Added Predictive Value of New Measurements" <http://www.fharrell.com/post/addvalue/>`_.
diff --git a/docs/Survival analysis with lifelines.rst b/docs/Survival analysis with lifelines.rst
index c3224f9b2..50434424c 100644
--- a/docs/Survival analysis with lifelines.rst	
+++ b/docs/Survival analysis with lifelines.rst	
@@ -90,33 +90,7 @@ this data was record at, do not have observed death events)
 We next use the ``KaplanMeierFitter`` method ``fit`` to fit the model to
 the data. (This is similar to, and inspired by,
 `scikit-learn's <http://scikit-learn.org/stable/>`__
-fit/predict API)
-
-.. code::
-
-  KaplanMeierFitter.fit(durations, event_observed=None,
-                        timeline=None, entry=None, label='KM_estimate',
-                        alpha=None, left_censoring=False, ci_labels=None)
-
-  Parameters:
-    duration: an array, or pd.Series, of length n -- duration subject was observed for
-    timeline: return the best estimate at the values in timelines (postively increasing)
-    event_observed: an array, or pd.Series, of length n -- True if the the death was observed, False if the event
-       was lost (right-censored). Defaults all True if event_observed==None
-    entry: an array, or pd.Series, of length n -- relative time when a subject entered the study. This is
-       useful for left-truncated (not left-censored) observations. If None, all members of the population
-       were born at time 0.
-    label: a string to name the column of the estimate.
-    alpha: the alpha value in the confidence intervals. Overrides the initializing
-       alpha for this call to fit only.
-    left_censoring: True if durations and event_observed refer to left censoring events. Default False
-    ci_labels: add custom column names to the generated confidence intervals
-          as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: <label>_lower_<alpha>
-
-
-  Returns:
-    a modified self, with new properties like 'survival_function_'.
-
+fit/predict API).
 
 Below we fit our data with the ``KaplanMeierFitter``:
 
diff --git a/docs/conf.py b/docs/conf.py
index 6ec8143f5..3b23192f3 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -12,12 +12,14 @@
 #
 # All configuration values have a default; values that are commented out
 # serve to show the default.
-
+from datetime import date
+import sys
+import os
 
 # If extensions (or modules to document with autodoc) are in another directory,
 # add these directories to sys.path here. If the directory is relative to the
 # documentation root, use os.path.abspath to make it absolute, like shown here.
-# sys.path.insert(0, os.path.abspath('.'))
+sys.path.insert(0, os.path.abspath("."))
 
 # -- General configuration ------------------------------------------------
 
@@ -52,7 +54,8 @@
 
 # General information about the project.
 project = "lifelines"
-copyright = "2014, Cam Davidson-Pilon"
+copyright = "2014-{},  Cam Davidson-Pilon".format(date.today().year)
+
 
 # The version info for the project you're documenting, acts as replacement for
 # |version| and |release|, also used in various other places throughout the
@@ -60,7 +63,7 @@
 #
 # The short X.Y version.
 
-version = "0.18.5"
+version = "0.18.6"
 # The full version, including dev info
 release = version
 
@@ -68,6 +71,16 @@
 # for a list of supported languages.
 # language = None
 
+autoclass_content = "both"  # include both class docstring and __init__
+autodoc_default_flags = [
+    # Make sure that any autodoc declarations show the right members
+    "members",
+    "inherited-members",
+    "show-inheritance",
+]
+autosummary_generate = True  # Make _autosummary files and include them
+
+
 # There are two options for replacing |today|: either, you set today to some
 # non-false value, then it is used:
 # today = ''
diff --git a/docs/index.rst b/docs/index.rst
index 56a43d685..767619643 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -36,6 +36,9 @@ Contents:
   jupyter_notebooks/Piecewise Exponential Models and Creating Custom Models.ipynb
   jupyter_notebooks/Modelling time-lagged conversion rates.ipynb
   Examples
+  References
+  Changelog
+
 
 
 Installation
diff --git a/docs/lifelines.datasets.rst b/docs/lifelines.datasets.rst
index 896dbe8b3..17f8186d9 100644
--- a/docs/lifelines.datasets.rst
+++ b/docs/lifelines.datasets.rst
@@ -1,20 +1,6 @@
-lifelines.datasets package
-==========================
+lifelines.datasets
+==================
 
-Submodules
-----------
-
-lifelines.datasets.dfcv\_dataset module
----------------------------------------
-
-.. automodule:: lifelines.datasets.dfcv_dataset
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-
-Module contents
----------------
 
 .. automodule:: lifelines.datasets
     :members:
diff --git a/docs/lifelines.fitters.rst b/docs/lifelines.fitters.rst
index e96cbf21d..7ab176b2f 100644
--- a/docs/lifelines.fitters.rst
+++ b/docs/lifelines.fitters.rst
@@ -1,8 +1,6 @@
-lifelines.fitters package
-=========================
+lifelines.fitters
+=================
 
-Submodules
-----------
 
 lifelines.fitters.aalen\_additive\_fitter module
 ------------------------------------------------
@@ -60,6 +58,22 @@ lifelines.fitters.kaplan\_meier\_fitter module
     :undoc-members:
     :show-inheritance:
 
+lifelines.fitters.log\_logistic\_fitter module
+----------------------------------------------
+
+.. automodule:: lifelines.fitters.log_logistic_fitter
+    :members:
+    :undoc-members:
+    :show-inheritance:
+
+lifelines.fitters.log\_normal\_fitter module
+--------------------------------------------
+
+.. automodule:: lifelines.fitters.log_normal_fitter
+    :members:
+    :undoc-members:
+    :show-inheritance:
+
 lifelines.fitters.nelson\_aalen\_fitter module
 ----------------------------------------------
 
@@ -68,6 +82,14 @@ lifelines.fitters.nelson\_aalen\_fitter module
     :undoc-members:
     :show-inheritance:
 
+lifelines.fitters.piecewise\_exponential\_fitter module
+-------------------------------------------------------
+
+.. automodule:: lifelines.fitters.piecewise_exponential_fitter
+    :members:
+    :undoc-members:
+    :show-inheritance:
+
 lifelines.fitters.weibull\_fitter module
 ----------------------------------------
 
@@ -77,9 +99,6 @@ lifelines.fitters.weibull\_fitter module
     :show-inheritance:
 
 
-Module contents
----------------
-
 .. automodule:: lifelines.fitters
     :members:
     :undoc-members:
diff --git a/docs/lifelines.plotting.rst b/docs/lifelines.plotting.rst
new file mode 100644
index 000000000..7b24f3b7b
--- /dev/null
+++ b/docs/lifelines.plotting.rst
@@ -0,0 +1,8 @@
+lifelines.plotting
+==================
+
+
+.. automodule:: lifelines.plotting
+    :members:
+    :undoc-members:
+    :show-inheritance:
diff --git a/docs/lifelines.rst b/docs/lifelines.rst
index 642b6e9ec..534b2c430 100644
--- a/docs/lifelines.rst
+++ b/docs/lifelines.rst
@@ -1,61 +1,13 @@
-lifelines package
+lifelines modules
 =================
 
-Subpackages
------------
-
 .. toctree::
 
-    lifelines.datasets
     lifelines.fitters
     lifelines.utils
+    lifelines.plotting
+    lifelines.datasets
 
-Submodules
-----------
-
-lifelines.compat module
------------------------
-
-.. automodule:: lifelines.compat
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-lifelines.generate\_datasets module
------------------------------------
-
-.. automodule:: lifelines.generate_datasets
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-lifelines.plotting module
--------------------------
-
-.. automodule:: lifelines.plotting
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-lifelines.statistics module
----------------------------
-
-.. automodule:: lifelines.statistics
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-lifelines.version module
-------------------------
-
-.. automodule:: lifelines.version
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-
-Module contents
----------------
 
 .. automodule:: lifelines
     :members:
diff --git a/docs/lifelines.utils.rst b/docs/lifelines.utils.rst
index e74b9d2d7..ecd9bb6ff 100644
--- a/docs/lifelines.utils.rst
+++ b/docs/lifelines.utils.rst
@@ -1,36 +1,5 @@
-lifelines.utils package
-=======================
-
-Submodules
-----------
-
-lifelines.utils.btree module
-----------------------------
-
-.. automodule:: lifelines.utils.btree
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-lifelines.utils.concordance module
-----------------------------------
-
-.. automodule:: lifelines.utils.concordance
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-lifelines.utils.lowess module
------------------------------
-
-.. automodule:: lifelines.utils.lowess
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-
-Module contents
----------------
+lifelines.utils
+===============
 
 .. automodule:: lifelines.utils
     :members:
diff --git a/docs/modules.rst b/docs/modules.rst
deleted file mode 100644
index dfcfad955..000000000
--- a/docs/modules.rst
+++ /dev/null
@@ -1,7 +0,0 @@
-lifelines
-=========
-
-.. toctree::
-   :maxdepth: 4
-
-   lifelines
diff --git a/lifelines/datasets/__init__.py b/lifelines/datasets/__init__.py
index b37e47234..ed5d7ebef 100644
--- a/lifelines/datasets/__init__.py
+++ b/lifelines/datasets/__init__.py
@@ -3,7 +3,7 @@
 from pkg_resources import resource_filename
 
 
-def load_dataset(filename, **kwargs):
+def _load_dataset(filename, **kwargs):
     """
     Load a dataset from lifelines.datasets
 
@@ -24,371 +24,415 @@ def load_dataset(filename, **kwargs):
 def load_recur(**kwargs):
     """
     From ftp://ftp.wiley.com/public/sci_tech_med/survival/, first published in
-    "Applied Survival Analysis: Regression Modeling of Time to Event Data, Second Edition"
+    "Applied Survival Analysis: Regression Modeling of Time to Event Data, Second Edition"::
 
-    ID          Subject Identification        1 - 400
-    AGE         Age                           years
-    TREAT       Treatment Assignment          0 = New
-                                              1 = Old
-    TIME0       Day of Previous Episode       Days
-    TIME1       Day of New Episode            Days
-                  or censoring
-    CENSOR      Indicator for Soreness        1 = Episode Occurred
-                  Episode or Censoring            at TIME1
-                                              0 = Censored
-    EVENT       Soreness Episode Number       0 to at most 4
+        ID          Subject Identification        1 - 400
+        AGE         Age                           years
+        TREAT       Treatment Assignment          0 = New
+                                                  1 = Old
+        TIME0       Day of Previous Episode       Days
+        TIME1       Day of New Episode            Days
+                      or censoring
+        CENSOR      Indicator for Soreness        1 = Episode Occurred
+                      Episode or Censoring            at TIME1
+                                                  0 = Censored
+        EVENT       Soreness Episode Number       0 to at most 4
 
-    Size: (1296, 7)
-    Example:
-        ID,AGE,TREAT,TIME0,TIME1,CENSOR,EVENT
-        1,43,0,9,56,1,3
-        1,43,0,56,88,1,4
-        1,43,0,0,6,1,1
-        1,43,0,6,9,1,2
+        Size: (1296, 7)
+        Example:
+            ID,AGE,TREAT,TIME0,TIME1,CENSOR,EVENT
+            1,43,0,9,56,1,3
+            1,43,0,56,88,1,4
+            1,43,0,0,6,1,1
+            1,43,0,6,9,1,2
 
     """
-    return load_dataset("recur.csv", **kwargs)
+    return _load_dataset("recur.csv", **kwargs)
 
 
 def load_multicenter_aids_cohort_study(**kwargs):
     """
-    Originally in [1]
+    Originally in [1]::
 
-    Siz: (78, 4)
+        Size: (78, 4)
 
-    AIDSY: date of AIDS diagnosis
-    W: years from AIDS diagnosis to study entry
-    T: years from AIDS diagnosis to minimum of death or censoring 
-    D: indicator of death during follow up
+        AIDSY: date of AIDS diagnosis
+        W: years from AIDS diagnosis to study entry
+        T: years from AIDS diagnosis to minimum of death or censoring 
+        D: indicator of death during follow up
 
 
-    i   AIDSY       W      T        D
-    1   1990.425    4.575   7.575   0
-    2   1991.250    3.750   6.750   0
-    3   1992.014    2.986   5.986   0
-    4   1992.030    2.970   5.970   0
-    5   1992.072    2.928   5.928   0
-    6   1992.220    2.780   4.688   1
+        i   AIDSY       W      T        D
+        1   1990.425    4.575   7.575   0
+        2   1991.250    3.750   6.750   0
+        3   1992.014    2.986   5.986   0
+        4   1992.030    2.970   5.970   0
+        5   1992.072    2.928   5.928   0
+        6   1992.220    2.780   4.688   1
 
+    References
+    ----------
     [1] Cole SR, Hudgens MG. Survival analysis in infectious disease research: describing events in time. AIDS. 2010;24(16):2423-31.
     """
-    return load_dataset("multicenter_aids_cohort.tsv", sep="\t", index_col=0, **kwargs)
+    return _load_dataset("multicenter_aids_cohort.tsv", sep="\t", index_col=0, **kwargs)
 
 
 def load_holly_molly_polly(**kwargs):
     """
     From https://stat.ethz.ch/education/semesters/ss2011/seminar/contents/presentation_10.pdf
-    Used as a toy example for CoxPH in recurrent SA.
+    Used as a toy example for CoxPH in recurrent SA.::
 
-      ID  Status  Stratum  Start(days)  Stop(days)  tx    T
-    0  M       1        1            0         100   1  100
-    1  M       1        2          100         105   1    5
-    2  H       1        1            0          30   0   30
-    3  H       1        2           30          50   0   20
-    4  P       1        1            0          20   0   20
+          ID  Status  Stratum  Start(days)  Stop(days)  tx    T
+        0  M       1        1            0         100   1  100
+        1  M       1        2          100         105   1    5
+        2  H       1        1            0          30   0   30
+        3  H       1        2           30          50   0   20
+        4  P       1        1            0          20   0   20
 
     """
-    return load_dataset("holly_molly_polly.tsv", sep="\s", **kwargs)
+    return _load_dataset("holly_molly_polly.tsv", sep="\s", **kwargs)
 
 
 def load_leukemia(**kwargs):
     """
-    Leukemia dataset. From http://web1.sph.emory.edu/dkleinb/allDatasets/surv2datasets/anderson.dat
-    Size: (42,5)
-    Example:
-            t  status  sex  logWBC  Rx
-        0  35       0    1    1.45   0
-        1  34       0    1    1.47   0
-        2  32       0    1    2.20   0
-        3  32       0    1    2.53   0
-        4  25       0    1    1.78   0
+    Leukemia dataset.::
+
+        Size: (42,5)
+        Example:
+                t  status  sex  logWBC  Rx
+            0  35       0    1    1.45   0
+            1  34       0    1    1.47   0
+            2  32       0    1    2.20   0
+            3  32       0    1    2.53   0
+            4  25       0    1    1.78   0
+
+    References
+    ----------
+    From http://web1.sph.emory.edu/dkleinb/allDatasets/surv2datasets/anderson.dat
     """
-    return load_dataset("anderson.csv", sep=" ", **kwargs)
+    return _load_dataset("anderson.csv", sep=" ", **kwargs)
 
 
 def load_canadian_senators(**kwargs):
     """
-    A history of Canadian senators in office.
+    A history of Canadian senators in office.::
+
+        Size: (933,10)
+        Example:
+            Name                                        Abbott, John Joseph Caldwell
+            Political Affiliation at Appointment                Liberal-Conservative
+            Province / Territory                                              Quebec
+            Appointed on the advice of                     Macdonald, John Alexander
+            Term (yyyy.mm.dd)                       1887.05.12 - 1893.10.30  (Death)
+            start_date                                           1887-05-12 00:00:00
+            end_date                                             1893-10-30 00:00:00
+            reason                                                             Death
+            diff_days                                                           2363
+            observed                                                            True
 
-    Size: (933,10)
-    Example:
-        Name                                        Abbott, John Joseph Caldwell
-        Political Affiliation at Appointment                Liberal-Conservative
-        Province / Territory                                              Quebec
-        Appointed on the advice of                     Macdonald, John Alexander
-        Term (yyyy.mm.dd)                       1887.05.12 - 1893.10.30  (Death)
-        start_date                                           1887-05-12 00:00:00
-        end_date                                             1893-10-30 00:00:00
-        reason                                                             Death
-        diff_days                                                           2363
-        observed                                                            True
     """
-    return load_dataset("canadian_senators.csv", **kwargs)
+    return _load_dataset("canadian_senators.csv", **kwargs)
 
 
 def load_dd(**kwargs):
     """
-    Classification of political regimes as democracy and dictatorship. Classification of democracies as parliamentary, semi-presidential (mixed) and presidential. Classification of dictatorships as military, civilian and royal. Coverage: 202 countries, from 1946 or year of independence to 2008.
-
+    Classification of political regimes as democracy and dictatorship. 
+    Classification of democracies as parliamentary, semi-presidential (mixed) and presidential. 
+    Classification of dictatorships as military, civilian and royal. 
+    Coverage: 202 countries, from 1946 or year of independence to 2008.::
+
+        Size: (1808, 12)
+        Example:
+            ctryname                                                   Afghanistan
+            cowcode2                                                           700
+            politycode                                                         700
+            un_region_name                                           Southern Asia
+            un_continent_name                                                 Asia
+            ehead                                              Mohammad Zahir Shah
+            leaderspellreg       Mohammad Zahir Shah.Afghanistan.1946.1952.Mona...
+            democracy                                                Non-democracy
+            regime                                                        Monarchy
+            start_year                                                        1946
+            duration                                                             7
+            observed                                                             1
+
+    References
+    ----------
     Cheibub, José Antonio, Jennifer Gandhi, and James Raymond Vreeland. 2010. “Democracy and Dictatorship Revisited.” Public Choice, vol. 143, no. 2-1, pp. 67-101.
 
-    Size: (1808, 12)
-    Example:
-        ctryname                                                   Afghanistan
-        cowcode2                                                           700
-        politycode                                                         700
-        un_region_name                                           Southern Asia
-        un_continent_name                                                 Asia
-        ehead                                              Mohammad Zahir Shah
-        leaderspellreg       Mohammad Zahir Shah.Afghanistan.1946.1952.Mona...
-        democracy                                                Non-democracy
-        regime                                                        Monarchy
-        start_year                                                        1946
-        duration                                                             7
-        observed                                                             1
     """
-    return load_dataset("dd.csv", **kwargs)
+    return _load_dataset("dd.csv", **kwargs)
 
 
 def load_kidney_transplant(**kwargs):
     """
-    Size: (863,6)
-    Example:
-        time             5
-        death            0
-        age             51
-        black_male       0
-        white_male       1
-        black_female     0
+    ::
+
+        Size: (863,6)
+        Example:
+            time             5
+            death            0
+            age             51
+            black_male       0
+            white_male       1
+            black_female     0
 
     """
-    return load_dataset("kidney_transplant.csv", **kwargs)
+    return _load_dataset("kidney_transplant.csv", **kwargs)
 
 
 def load_larynx(**kwargs):
     """
-    Size: (89,6)
-    Example:
-            time  age  death  Stage II  Stage III  Stage IV
-        0    0.6   77      1         0          0         0
-        1    1.3   53      1         0          0         0
-        2    2.4   45      1         0          0         0
-        3    2.5   57      0         0          0         0
-        4    3.2   58      1         0          0         0
+    ::
+
+        Size: (89,6)
+        Example:
+                time  age  death  Stage II  Stage III  Stage IV
+            0    0.6   77      1         0          0         0
+            1    1.3   53      1         0          0         0
+            2    2.4   45      1         0          0         0
+            3    2.5   57      0         0          0         0
+            4    3.2   58      1         0          0         0
 
     """
-    return load_dataset("larynx.csv", **kwargs)
+    return _load_dataset("larynx.csv", **kwargs)
 
 
 def load_lung(**kwargs):
     """
-    Size: (288,10)
-    Example:
-        inst            3
-        time          306
-        status          2
-        age            74
-        sex             1
-        ph.ecog         1
-        ph.karno       90
-        pat.karno     100
-        meal.cal     1175
-        wt.loss       NaN
+    Survival in patients with advanced lung cancer from the North Central Cancer Treatment Group. Performance scores rate how well the patient can perform usual daily activities.::
+
+        Size: (288,10)
+        Example:
+           inst  time  status  age  sex  ph.ecog  ph.karno  pat.karno  meal.cal  wt.loss
+        0   3.0   306       2   74    1      1.0      90.0      100.0    1175.0      NaN
+        1   3.0   455       2   68    1      0.0      90.0       90.0    1225.0     15.0
+        2   3.0  1010       1   56    1      0.0      90.0       90.0       NaN     15.0
+        3   5.0   210       2   57    1      1.0      90.0       60.0    1150.0     11.0
+        4   1.0   883       2   60    1      0.0     100.0       90.0       NaN      0.0
+
+    References
+    -----------
+    Loprinzi CL. Laurie JA. Wieand HS. Krook JE. Novotny PJ. Kugler JW. Bartel J. Law M. Bateman M. Klatt NE. et al. Prospective evaluation of prognostic variables from patient-completed questionnaires. North Central Cancer Treatment Group. Journal of Clinical Oncology. 12(3):601-7, 1994.
 
     """
-    return load_dataset("lung.csv", **kwargs)
+    return _load_dataset("lung.csv", **kwargs)
 
 
 def load_panel_test(**kwargs):
     """
-    Size: (28,5)
-    Example:
-           id  t  E  var1  var2
-        0   1  1  0   0.0     1
-        1   1  2  0   0.0     1
-        2   1  3  0   4.0     3
-        3   1  4  1   8.0     4
-        4   2  1  0   1.2     1
+    ::
+
+        Size: (28,5)
+        Example:
+               id  t  E  var1  var2
+            0   1  1  0   0.0     1
+            1   1  2  0   0.0     1
+            2   1  3  0   4.0     3
+            3   1  4  1   8.0     4
+            4   2  1  0   1.2     1
 
     """
-    return load_dataset("panel_test.csv", **kwargs)
+    return _load_dataset("panel_test.csv", **kwargs)
 
 
 def load_psychiatric_patients(**kwargs):
     """
-    Size: (26,4)
-    Example:
-           Age   T  C  sex
-        0   51   1  1    2
-        1   58   1  1    2
-        2   55   2  1    2
-        3   28  22  1    2
-        4   21  30  0    1
+    ::
+
+        Size: (26,4)
+        Example:
+               Age   T  C  sex
+            0   51   1  1    2
+            1   58   1  1    2
+            2   55   2  1    2
+            3   28  22  1    2
+            4   21  30  0    1
 
     """
-    return load_dataset("psychiatric_patients.csv", **kwargs)
+    return _load_dataset("psychiatric_patients.csv", **kwargs)
 
 
 def load_static_test(**kwargs):
     """
-    Size: (7,5)
-    Example:
-           id  t  E  var1  var2
-        0   1  4  1    -1    -1
-        1   2  3  1    -2    -2
-        2   3  3  0    -3    -3
-        3   4  4  1    -4    -4
-        4   5  2  1    -5    -5
-        5   6  0  1    -6    -6
-        6   7  2  1    -7    -7
+    ::
+
+        Size: (7,5)
+        Example:
+               id  t  E  var1  var2
+            0   1  4  1    -1    -1
+            1   2  3  1    -2    -2
+            2   3  3  0    -3    -3
+            3   4  4  1    -4    -4
+            4   5  2  1    -5    -5
+            5   6  0  1    -6    -6
+            6   7  2  1    -7    -7
     """
-    return load_dataset("static_test.csv", **kwargs)
+    return _load_dataset("static_test.csv", **kwargs)
 
 
 def load_lcd(**kwargs):
     """
-    Size: (104,3)
-    Example:
-           C  T         group
-        0  0  1  alluvial_fan
-        1  0  1  alluvial_fan
-        2  0  1  alluvial_fan
-        3  0  1  alluvial_fan
-        4  1  1  alluvial_fan
+    ::
+
+        Size: (104,3)
+        Example:
+               C  T         group
+            0  0  1  alluvial_fan
+            1  0  1  alluvial_fan
+            2  0  1  alluvial_fan
+            3  0  1  alluvial_fan
+            4  1  1  alluvial_fan
     """
-    return load_dataset("CuZn-LeftCensoredDataset.csv", **kwargs)
+    return _load_dataset("CuZn-LeftCensoredDataset.csv", **kwargs)
 
 
 def load_waltons(**kwargs):
     """
-    Genotypes and number of days survived in Drosophila. Since we work with flies, we don't need to worry about left-censoring. We know the birth date of all flies. We do have issues with accidentally killing some or if some escape. These would be right-censored as we do not actually observe their death due to "natural" causes.
+    Genotypes and number of days survived in Drosophila. Since we work with flies, we don't need to worry about left-censoring. We know the birth date of all flies. We do have issues with accidentally killing some or if some escape. These would be right-censored as we do not actually observe their death due to "natural" causes. ::
+
+        Size: (163,3)
+        Example:
+                T  E    group
+            0   6  1  miR-137
+            1  13  1  miR-137
+            2  13  1  miR-137
+            3  13  1  miR-137
+            4  19  1  miR-137
 
-    Size: (163,3)
-    Example:
-            T  E    group
-        0   6  1  miR-137
-        1  13  1  miR-137
-        2  13  1  miR-137
-        3  13  1  miR-137
-        4  19  1  miR-137
     """
-    return load_dataset("waltons_dataset.csv", **kwargs)
+    return _load_dataset("waltons_dataset.csv", **kwargs)
 
 
 def load_rossi(**kwargs):
     """
-    This data set is originally from Rossi et al. (1980), and is used as an example in Allison (1995). The data pertain to 432 convicts who were released from Maryland state prisons in the 1970s and who were followed up for one year after release. Half the released convicts were assigned at random to an experimental treatment in which they were given financial aid; half did not receive aid.
+    This data set is originally from Rossi et al. (1980), and is used as an example in Allison (1995). The data pertain to 432 convicts who were released from Maryland state prisons in the 1970s and who were followed up for one year after release. Half the released convicts were assigned at random to an experimental treatment in which they were given financial aid; half did not receive aid. ::
+
 
+        Size: (432,9)
+        Example:
+            week      20
+            arrest     1
+            fin        0
+            age       27
+            race       1
+            wexp       0
+            mar        0
+            paro       1
+            prio       3
+
+    References
+    ----------
     Rossi, P.H., R.A. Berk, and K.J. Lenihan (1980). Money, Work, and Crime:     Some Experimental Results. New York: Academic Press.     John Fox, Marilia Sa Carvalho (2012). The RcmdrPlugin.survival Package: Extending the R Commander Interface to Survival Analysis. Journal of Statistical Software, 49(7), 1-32.
 
-    Size: (432,9)
-    Example:
-        week      20
-        arrest     1
-        fin        0
-        age       27
-        race       1
-        wexp       0
-        mar        0
-        paro       1
-        prio       3
     """
-    return load_dataset("rossi.csv", **kwargs)
+    return _load_dataset("rossi.csv", **kwargs)
 
 
 def load_regression_dataset(**kwargs):
     """
     Artificial regression dataset. Useful since there are no ties in this dataset.
-    Slightly edit in v0.15.0 to achieve this, however.
+    Slightly edited in v0.15.0 to achieve this, however. ::
+
+        Size: (200,5)
+        Example:
+                   var1      var2      var3          T  E
+            0  0.595170  1.143472  1.571079  14.785479  1
+            1  0.209325  0.184677  0.356980   7.336734  1
+            2  0.693919  0.071893  0.557960   5.271527  1
+            3  0.443804  1.364646  0.374221  11.684168  1
+            4  1.613324  0.125566  1.921325   7.637764  1
 
-    Size: (200,5)
-    Example:
-               var1      var2      var3          T  E
-        0  0.595170  1.143472  1.571079  14.785479  1
-        1  0.209325  0.184677  0.356980   7.336734  1
-        2  0.693919  0.071893  0.557960   5.271527  1
-        3  0.443804  1.364646  0.374221  11.684168  1
-        4  1.613324  0.125566  1.921325   7.637764  1
     """
-    return load_dataset("regression.csv", **kwargs)
+    return _load_dataset("regression.csv", **kwargs)
 
 
 def load_g3(**kwargs):
     """
+    ::
+
+        Size: (17,7)
+        Example:
+            no.               1
+            age              41
+            sex          Female
+            histology    Grade3
+            group           RIT
+            event          True
+            time             53
 
-    Size: (17,7)
-    Example:
-        no.               1
-        age              41
-        sex          Female
-        histology    Grade3
-        group           RIT
-        event          True
-        time             53
     """
-    return load_dataset("g3.csv", **kwargs)
+    return _load_dataset("g3.csv", **kwargs)
 
 
 def load_stanford_heart_transplants(**kwargs):
     """
     This is a classic dataset for survival regression with time
     varying covariates. The original dataset is from [1], and
-    this dataset is from R's survival library.
-
+    this dataset is from R's survival library. ::
+
+        Size: (172, 8)
+        Example:
+               start  stop  event        age      year  surgery  transplant  id
+            0    0.0  50.0      1 -17.155373  0.123203        0           0   1
+            1    0.0   6.0      1   3.835729  0.254620        0           0   2
+            2    0.0   1.0      0   6.297057  0.265572        0           0   3
+            3    1.0  16.0      1   6.297057  0.265572        0           1   3
+            4    0.0  36.0      0  -7.737166  0.490075        0           0   4
+
+    References
+    ----------
     [1] J Crowley and M Hu. Covariance analysis of heart transplant survival data. J American
         Statistical Assoc, 72:27–36, 1977.
 
-
-    Size: (172, 8)
-    Example:
-           start  stop  event        age      year  surgery  transplant  id
-        0    0.0  50.0      1 -17.155373  0.123203        0           0   1
-        1    0.0   6.0      1   3.835729  0.254620        0           0   2
-        2    0.0   1.0      0   6.297057  0.265572        0           0   3
-        3    1.0  16.0      1   6.297057  0.265572        0           1   3
-        4    0.0  36.0      0  -7.737166  0.490075        0           0   4
-
     """
-    return load_dataset("stanford_heart.csv", **kwargs)
+    return _load_dataset("stanford_heart.csv", **kwargs)
 
 
 def load_gbsg2(**kwargs):
     """
-    A data frame containing the observations from the GBSG2 study of 686 women.
-
+    A data frame containing the observations from the GBSG2 study of 686 women. ::
+
+        Size: (686,10)
+        Example:
+            horTh           yes
+            age             56
+            menostat        Post
+            tsize           12
+            tgrade          II
+            pnodes          7
+            progrec         61
+            estrec          77
+            time            2018
+            cens            1
+
+    References
+    ----------
     W. Sauerbrei and P. Royston (1999). Building multivariable prognostic and diagnostic models: transformation of the predictors by using fractional polynomials. Journal of the Royal Statistics Society Series A, Volume 162(1), 71–94
 
     M. Schumacher, G. Basert, H. Bojar, K. Huebner, M. Olschewski, W. Sauerbrei, C. Schmoor, C. Beyerle, R.L.A. Neumann and H.F. Rauschecker for the German Breast Cancer Study Group (1994), Randomized 2 × 2 trial evaluating hormonal treatment and the duration of chemotherapy in node- positive breast cancer patients. Journal of Clinical Oncology, 12, 2086–2093
-
-    Size: (686,10)
-    Example:
-        horTh           yes
-        age             56
-        menostat        Post
-        tsize           12
-        tgrade          II
-        pnodes          7
-        progrec         61
-        estrec          77
-        time            2018
-        cens            1
     """
-    return load_dataset("gbsg2.csv", **kwargs)
+    return _load_dataset("gbsg2.csv", **kwargs)
 
 
 def load_dfcv():
     """
-    A toy example of a time dependent dataset. From http://www.math.ucsd.edu/~rxu/math284/slect7.pdf
+    A toy example of a time dependent dataset. ::
+
+
+        Size: (14, 6)
+        Example:
 
+            start  group  z  stop  id  event
+        0       0    1.0  0   3.0   1   True
+        1       0    1.0  0   5.0   2  False
+        2       0    1.0  1   5.0   3   True
+        3       0    1.0  0   6.0   4   True
 
-    Size: (14, 6)
-    Example:
 
-        start  group  z  stop  id  event
-    0       0    1.0  0   3.0   1   True
-    1       0    1.0  0   5.0   2  False
-    2       0    1.0  1   5.0   3   True
-    3       0    1.0  0   6.0   4   True
+    References
+    -----------
+    From http://www.math.ucsd.edu/~rxu/math284/slect7.pdf
     """
     from lifelines.datasets.dfcv_dataset import dfcv
 
@@ -397,18 +441,20 @@ def load_dfcv():
 
 def load_lymphoma(**kwargs):
     """
-    From https://www.statsdirect.com/help/content/survival_analysis/logrank.htm
-
+    ::
 
-    Size: (80, 3)
+        Size: (80, 3)
+        Example:
 
-    Example:
+           Stage_group  Time  Censor
+        0            1     6       1
+        1            1    19       1
+        2            1    32       1
+        3            1    42       1
+        4            1    42       1
 
-       Stage_group  Time  Censor
-    0            1     6       1
-    1            1    19       1
-    2            1    32       1
-    3            1    42       1
-    4            1    42       1
+    References
+    ----------
+    From https://www.statsdirect.com/help/content/survival_analysis/logrank.htm
     """
-    return load_dataset("lymphoma.csv", **kwargs)
+    return _load_dataset("lymphoma.csv", **kwargs)
diff --git a/lifelines/fitters/__init__.py b/lifelines/fitters/__init__.py
index 07214cba7..e7c22ce25 100644
--- a/lifelines/fitters/__init__.py
+++ b/lifelines/fitters/__init__.py
@@ -40,6 +40,9 @@
 from lifelines.compat import PY2, PY3
 
 
+__all__ = []
+
+
 def _must_call_fit_first(func):
     @wraps(func)
     def error_wrapper(*args, **kwargs):
@@ -165,7 +168,7 @@ def predict(self, times):
     @_must_call_fit_first
     def conditional_time_to_event_(self):
         """
-        Return a DataFrame, with index equal to survival_function_, that estimates the median
+        Return a DataFrame, with index equal to ``survival_function_``, that estimates the median
         duration remaining until the death event, given survival up until time t. For example, if an
         individual exists until age 1, their expected life remaining *given they lived to time 1*
         might be 9 years.
@@ -173,7 +176,7 @@ def conditional_time_to_event_(self):
         Returns
         -------
         conditional_time_to_: DataFrame 
-            with index equal to survival_function_
+            with index equal to ``survival_function_``
 
         """
         return self._conditional_time_to_event_()
@@ -445,13 +448,17 @@ def _compute_z_values(self):
     @property
     @_must_call_fit_first
     def summary(self):
-        """Summary statistics describing the fit.
-        Set alpha property in the object before calling.
+        """
+        Summary statistics describing the fit.
 
         Returns
         -------
         df : pd.DataFrame
             Contains columns coef, exp(coef), se(coef), z, p, lower, upper
+
+        See Also
+        --------
+        ``print_summary``
         """
         lower_upper_bounds = self._compute_confidence_bounds_of_parameters()
         df = pd.DataFrame(index=self._fitted_parameter_names)
@@ -518,8 +525,7 @@ def fit(
         durations: an array, or pd.Series
           length n, duration subject was observed for
         event_observed: numpy array or pd.Series, optional
-          length n, True if the the death was observed, False if the event
-           was lost (right-censored). Defaults all True if event_observed==None
+          length n, True if the death was observed, False if the event was lost (right-censored). Defaults to all True if event_observed is None
         timeline: list, optional
             return the estimate at the values in timeline (postively increasing)
         label: string, optional
@@ -528,13 +534,12 @@ def fit(
             the alpha value in the confidence intervals. Overrides the initializing
            alpha for this call to fit only.
         ci_labels: list, optional
-            add custom column names to the generated confidence intervals
-              as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: <label>_lower_<alpha>
+            add custom column names to the generated confidence intervals as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: <label>_lower_<alpha>
         show_progress: boolean, optional
             since this is an iterative fitting algorithm, switching this to True will display some iteration details.
-        entry: an array, or pd.Series, of length n -- relative time when a subject entered the study. This is
-             useful for left-truncated (not left-censored) observations. If None, all members of the population
-             entered study when they were "born": time zero.
+        entry: an array, or pd.Series, of length n 
+            relative time when a subject entered the study. This is useful for left-truncated (not left-censored) observations. If None, all members of the population
+            entered study when they were "born": time zero.
 
         Returns
         -------
@@ -617,42 +622,103 @@ def fit(
 
     @_must_call_fit_first
     def survival_function_at_times(self, times, label=None):
+        """
+        Return a Pandas series of the predicted survival value at specific times.
+
+        Parameters
+        -----------
+        times: iterable or float
+          values to return the survival function at.
+        label: string, optional
+          Rename the series returned. Useful for plotting. 
+
+        Returns
+        --------
+        pd.Series
+
+        """
         label = coalesce(label, self._label)
         return pd.Series(self._survival_function(self._fitted_parameters_, times), index=_to_array(times), name=label)
 
     @_must_call_fit_first
     def cumulative_hazard_at_times(self, times, label=None):
+        """
+        Return a Pandas series of the predicted cumulative hazard value at specific times.
+
+        Parameters
+        -----------
+        times: iterable or float
+          values to return the cumulative hazard at.
+        label: string, optional
+          Rename the series returned. Useful for plotting. 
+
+        Returns
+        --------
+        pd.Series
+
+        """
         label = coalesce(label, self._label)
         return pd.Series(self._cumulative_hazard(self._fitted_parameters_, times), index=_to_array(times), name=label)
 
     @_must_call_fit_first
     def hazard_at_times(self, times, label=None):
+        """
+        Return a Pandas series of the predicted hazard at specific times.
+
+        Parameters
+        -----------
+        times: iterable or float
+          values to return the hazard at.
+        label: string, optional
+          Rename the series returned. Useful for plotting. 
+
+        Returns
+        --------
+        pd.Series
+
+        """
         label = coalesce(label, self._label)
         return pd.Series(self._hazard(self._fitted_parameters_, times), index=_to_array(times), name=label)
 
     @property
     @_must_call_fit_first
     def median_(self):
+        """ 
+        Return the unique time point, t, such that S(t) = 0.5. This is the "half-life" of the population, and a 
+        robust summary statistic for the population, if it exists. 
+        """
         return median_survival_times(self.survival_function_)
 
     @property
     @_must_call_fit_first
     def confidence_interval_(self):
+        """
+        The confidence interval of the cumulative hazard. This is an alias for ``confidence_interval_cumulative_hazard_``.
+        """
         return self._compute_confidence_bounds_of_cumulative_hazard(self.alpha, self._ci_labels)
 
     @property
     @_must_call_fit_first
     def confidence_interval_cumulative_hazard_(self):
+        """
+        The confidence interval of the cumulative hazard. This is an alias for ``confidence_interval_``.
+        """
         return self.confidence_interval_
 
     @property
     @_must_call_fit_first
     def confidence_interval_hazard_(self):
+        """
+        The confidence interval of the hazard.
+        """
         return self._compute_confidence_bounds_of_transform(self._hazard, self.alpha, self._ci_labels)
 
     @property
     @_must_call_fit_first
     def confidence_interval_survival_function_(self):
+        """
+        The confidence interval of the survival function.
+        """
         return self._compute_confidence_bounds_of_transform(self._survival_function, self.alpha, self._ci_labels)
 
     @_must_call_fit_first
diff --git a/lifelines/fitters/aalen_johansen_fitter.py b/lifelines/fitters/aalen_johansen_fitter.py
index 05ceefa54..2fc9df1fc 100644
--- a/lifelines/fitters/aalen_johansen_fitter.py
+++ b/lifelines/fitters/aalen_johansen_fitter.py
@@ -14,14 +14,11 @@ class AalenJohansenFitter(UnivariateFitter):
     """Class for fitting the Aalen-Johansen estimate for the cumulative incidence function in a competing risks framework.
     Treating competing risks as censoring can result in over-estimated cumulative density functions. Using the Kaplan
     Meier estimator with competing risks as censored is akin to estimating the cumulative density if all competing risks
-    had been prevented. If you are interested in learning more, we recommend the following open-access
-    paper; Edwards JK, Hester LL, Gokhale M, Lesko CR. Methodologic Issues When Estimating Risks in
-    Pharmacoepidemiology. Curr Epidemiol Rep. 2016;3(4):285-296.
+    had been prevented.
 
     Aalen-Johansen cannot deal with tied times. We can get around this by randomy jittering the event times
     slightly. This will be done automatically and generates a warning.
 
-    AalenJohansenFitter(alpha=0.95, jitter_level=0.00001, seed=None, calculate_variance=True)
 
     Parameters
     ----------
@@ -40,6 +37,17 @@ class AalenJohansenFitter(UnivariateFitter):
         computationally intensive. For some procedures, like bootstrapping, the variance is not necessary. To reduce
         computation time during these procedures, `calculate_variance` can be set to `False` to skip the variance
         calculation.
+
+    Example
+    -------
+    >>> AalenJohansenFitter(alpha=0.95, jitter_level=0.00001, seed=None, calculate_variance=True)
+
+
+    References
+    ----------
+    If you are interested in learning more, we recommend the following open-access
+    paper; Edwards JK, Hester LL, Gokhale M, Lesko CR. Methodologic Issues When Estimating Risks in
+    Pharmacoepidemiology. Curr Epidemiol Rep. 2016;3(4):285-296.
     """
 
     def __init__(self, jitter_level=0.0001, seed=None, alpha=0.95, calculate_variance=True):
@@ -85,7 +93,7 @@ def fit(
         Returns
         -------
         self : AalenJohansenFitter
-          self, with new properties like 'cumulative_incidence_'.
+          self, with new properties like ``cumulative_incidence_``.
         """
         # Checking for tied event times
         ties = self._check_for_duplicates(durations=durations, events=event_observed)
diff --git a/lifelines/fitters/breslow_fleming_harrington_fitter.py b/lifelines/fitters/breslow_fleming_harrington_fitter.py
index 926a7a251..11fea4d41 100644
--- a/lifelines/fitters/breslow_fleming_harrington_fitter.py
+++ b/lifelines/fitters/breslow_fleming_harrington_fitter.py
@@ -23,7 +23,7 @@ class BreslowFlemingHarringtonFitter(UnivariateFitter):
     Parameters
     ----------
     alpha: float
-        The alpha value associated with the confidence intervals.
+      The alpha value associated with the confidence intervals.
 
     """
 
@@ -56,13 +56,12 @@ def fit(
             the alpha value in the confidence intervals. Overrides the initializing
            alpha for this call to fit only.
         ci_labels: iterable
-            add custom column names to the generated confidence intervals
-              as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: <label>_lower_<alpha>
+            add custom column names to the generated confidence intervals as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: <label>_lower_<alpha>
 
 
         Returns
         -------
-          self, with new properties like 'survival_function_'.
+          self, with new properties like ``survival_function_``.
 
         """
         self._label = label
diff --git a/lifelines/fitters/cox_time_varying_fitter.py b/lifelines/fitters/cox_time_varying_fitter.py
index acd8e4566..f084a97ca 100644
--- a/lifelines/fitters/cox_time_varying_fitter.py
+++ b/lifelines/fitters/cox_time_varying_fitter.py
@@ -46,13 +46,14 @@
     coalesce,
 )
 
+__all__ = ["CoxTimeVaryingFitter"]
 
-class CoxTimeVaryingFitter(BaseFitter):
 
-    """
+class CoxTimeVaryingFitter(BaseFitter):
+    r"""
     This class implements fitting Cox's time-varying proportional hazard model:
 
-        .. math::  h(t|x(t)) = h_0(t)*exp(x(t)'*beta)
+        .. math::  h(t|x(t)) = h_0(t) \exp(x(t)' \beta)
 
     Parameters
     ----------
diff --git a/lifelines/fitters/coxph_fitter.py b/lifelines/fitters/coxph_fitter.py
index 5e19ba954..291a0620e 100644
--- a/lifelines/fitters/coxph_fitter.py
+++ b/lifelines/fitters/coxph_fitter.py
@@ -5,6 +5,7 @@
 import time
 from datetime import datetime
 import warnings
+from textwrap import dedent
 import numpy as np
 import pandas as pd
 
@@ -49,8 +50,11 @@
     string_justify,
     format_p_value,
     format_floats,
+    dataframe_interpolate_at_times,
 )
 
+__all__ = ["CoxPHFitter"]
+
 
 class BatchVsSingle:
     @staticmethod
@@ -1317,6 +1321,7 @@ def predict_cumulative_hazard(self, X, times=None):
                     left_index=True,
                 )
         else:
+
             c_0 = self.baseline_cumulative_hazard_
             v = self.predict_partial_hazard(X)
             col = _get_index(v)
@@ -1324,7 +1329,7 @@ def predict_cumulative_hazard(self, X, times=None):
 
         if times is not None:
             # non-linear interpolations can push the survival curves above 1 and below 0.
-            return cumulative_hazard_.reindex(cumulative_hazard_.index.union(times)).interpolate("index").loc[times]
+            return dataframe_interpolate_at_times(cumulative_hazard_, times)
         return cumulative_hazard_
 
     def predict_survival_function(self, X, times=None):
@@ -1451,7 +1456,6 @@ def _compute_baseline_hazard(self, X, durations, event_observed, weights, name):
             ind_hazards.groupby("event_at")[0].sum().sort_index(ascending=False).cumsum()
         )
         ind_hazards_summed_over_durations.name = "hazards"
-
         event_table = survival_table_from_events(durations, event_observed, weights=weights)
         event_table = event_table.join(ind_hazards_summed_over_durations)
         baseline_hazard = pd.DataFrame(event_table["observed"] / event_table["hazards"], columns=[name]).fillna(0)
@@ -1605,7 +1609,7 @@ def plot_covariate_groups(self, covariate, values, **kwargs):
         return axes
 
     def check_assumptions(
-        self, training_df, advice=True, show_plots=True, p_value_threshold=0.05, plot_n_bootstraps=10
+        self, training_df, advice=True, show_plots=False, p_value_threshold=0.05, plot_n_bootstraps=10
     ):
         """
         Use this function to test the proportional hazards assumption. See iterative usage example at 
@@ -1620,11 +1624,13 @@ def check_assumptions(
         advice: boolean, optional
             display advice as output to the user's screen
         show_plots: boolean, optional
-            display plots of the scaled schoenfeld residuals and loess curves. This is an eyeball test for violations
+            display plots of the scaled schoenfeld residuals and loess curves. This is an eyeball test for violations.
+            This will slow down the function significantly. 
         p_value_threshold: float, optional
             the threshold to use to alert the user of violations. See note below. 
         plot_n_bootstraps:
-            in the plots displayed, also display plot_n_bootstraps bootstrapped loess curves. 
+            in the plots displayed, also display plot_n_bootstraps bootstrapped loess curves. This will slow down
+            the function significantly. 
     
         
         Examples
@@ -1643,8 +1649,12 @@ def check_assumptions(
         -------
         The ``p_value_threshold`` is arbitrarily set at 0.05. Under the null, some covariates
         will be below the threshold (i.e. by chance). This is compounded when there are many covariates. 
+        
+        Similarly, when there are lots of observations, even minor deviances from the proportional hazard 
+        assumption will be flagged. 
+
         With that in mind, it's best to use a combination of statistical tests and eyeball tests to 
-        determine violations. 
+        determine the most serious violations. 
 
         
         References
@@ -1653,15 +1663,21 @@ def check_assumptions(
         http://www.mwsug.org/proceedings/2006/stats/MWSUG-2006-SD08.pdf
         http://eprints.lse.ac.uk/84988/1/06_ParkHendry2015-ReassessingSchoenfeldTests_Final.pdf
         """
+
+        if not training_df.index.is_unique:
+            raise IndexError(
+                "`training_df` index should be unique for this exercise. Please make it unique or use `.reset_index(drop=True)` to force a unique index"
+            )
+
         residuals = self.compute_residuals(training_df, kind="scaled_schoenfeld")
         test_results = proportional_hazard_test(
-            self, training_df, time_transform="all", precomputed_residuals=residuals
+            self, training_df, time_transform=["rank", "km"], precomputed_residuals=residuals
         )
 
-        results_and_duration = residuals.join(training_df[self.duration_col])
+        residuals_and_duration = residuals.join(training_df[self.duration_col])
 
         counter = 0
-        n = results_and_duration.shape[0]
+        n = residuals_and_duration.shape[0]
 
         for variable in self.hazards_.columns:
             minumum_observed_p_value = test_results.summary.loc[variable, "p"].min()
@@ -1671,13 +1687,31 @@ def check_assumptions(
             counter += 1
 
             if counter == 1:
-                print()
+                if advice:
+                    print(
+                        dedent(
+                            """
+                    The ``p_value_threshold`` is set at %.3f. Even under the null hypothesis of no violations, some covariates
+                    will be below the threshold (i.e. by chance). This is compounded when there are many covariates. 
+
+                    Similarly, when there are lots of observations, even minor deviances from the proportional hazard 
+                    assumption will be flagged. 
+
+                    With that in mind, it's best to use a combination of statistical tests and eyeball tests to 
+                    determine the most serious violations. 
+
+                    """
+                            % p_value_threshold
+                        )
+                    )
+
                 test_results.print_summary()
                 print()
 
+            print()
             print(
-                "%d. Variable '%s' failed the non-proportional test with threshold value %0.2f (p=%.4f.)"
-                % (counter, variable, p_value_threshold, minumum_observed_p_value)
+                "%d. Variable '%s' failed the non-proportional test: p-value is %s."
+                % (counter, variable, format_p_value(4)(minumum_observed_p_value))
             )
 
             if advice:
@@ -1689,18 +1723,18 @@ def check_assumptions(
                 # This should capture dichotomous / low cardinality values.
                 if n_uniques <= 10 and value_counts.min() >= 4:
                     print(
-                        "   Advice: with so few unique values (only {0}), you can try `strata=['{1}']` in the call in `.fit`. See documentation here: https://lifelines.readthedocs.io/en/latest/jupyter_notebooks/Proportional%20hazard%20assumption.html".format(
+                        "   Advice: with so few unique values (only {0}), you can try `strata=['{1}']` in the call in `.fit`. See documentation in link [A] and [B] below.".format(
                             n_uniques, variable
                         )
                     )
                 else:
                     print(
-                        """   Advice: try binning the variable '{var}' using pd.cut, and then specify it in `strata=['{var}']` in the call in `.fit`. See more documentation here: https://lifelines.readthedocs.io/en/latest/jupyter_notebooks/Proportional%20hazard%20assumption.html""".format(
+                        """   Advice: try binning the variable '{var}' using pd.cut, and then specify it in `strata=['{var}']` in the call in `.fit`. See documentation in link [A] and [B] below.""".format(
                             var=variable
                         )
                     )
                     print(
-                        """   Advice: try adding an interaction term with your time variable. See more documentation here: https://lifelines.readthedocs.io/en/latest/jupyter_notebooks/Proportional%20hazard%20assumption.html""".format(
+                        """   Advice: try adding an interaction term with your time variable. See documentation in link [A] and specifically link [C] below.""".format(
                             var=variable
                         )
                     )
@@ -1717,8 +1751,9 @@ def check_assumptions(
 
                     ax = fig.add_subplot(2, 2, i)
 
-                    y = results_and_duration[variable]
+                    y = residuals_and_duration[variable]
                     tt = transformer(self.durations, self.event_observed, self.weights)[self.event_observed.values]
+
                     ax.scatter(tt, y, alpha=0.75)
 
                     y_lowess = lowess(tt.values, y.values)
@@ -1741,6 +1776,18 @@ def check_assumptions(
                 plt.tight_layout()
                 plt.subplots_adjust(top=0.90)
 
+        if advice and counter > 0:
+            print(
+                dedent(
+                    """
+                ---
+                [A]  https://lifelines.readthedocs.io/en/latest/jupyter_notebooks/Proportional%20hazard%20assumption.html
+                [B]  https://lifelines.readthedocs.io/en/latest/Survival%20Regression.html#checking-the-proportional-hazards-assumption
+                [C]  https://lifelines.readthedocs.io/en/latest/jupyter_notebooks/Proportional%20hazard%20assumption.html#Option-2:-introduce-time-varying-covariates
+            """
+                )
+            )
+
         if counter == 0:
             print("Proportional hazard assumption looks okay.")
 
diff --git a/lifelines/fitters/exponential_fitter.py b/lifelines/fitters/exponential_fitter.py
index 365fb2e5f..ee63551a7 100644
--- a/lifelines/fitters/exponential_fitter.py
+++ b/lifelines/fitters/exponential_fitter.py
@@ -9,20 +9,18 @@ class ExponentialFitter(KnownModelParametericUnivariateFitter):
     This class implements an Exponential model for univariate data. The model has parameterized
     form:
 
-    .. math::  S(t) = exp(-(\lambda*t)),   \lambda >0
+    .. math::  S(t) = \exp(-\lambda t),   \lambda >0
 
     which implies the cumulative hazard rate is
 
-    .. math::  H(t) = \lambda*t
+    .. math::  H(t) = \lambda t
 
     and the hazard rate is:
 
     .. math::  h(t) = \lambda
 
-    After calling the `.fit` method, you have access to properties like:
-     'survival_function_', 'lambda_', 'cumulative_hazard_'
-
-    A summary of the fit is available with the method 'print_summary()'
+    After calling the `.fit` method, you have access to properties like: ``survival_function_``, ``lambda_``, ``cumulative_hazard_``.
+    A summary of the fit is available with the method ``print_summary()``.
 
     Notes
     -----
diff --git a/lifelines/fitters/kaplan_meier_fitter.py b/lifelines/fitters/kaplan_meier_fitter.py
index 419b26f5d..b41d48d8d 100644
--- a/lifelines/fitters/kaplan_meier_fitter.py
+++ b/lifelines/fitters/kaplan_meier_fitter.py
@@ -75,7 +75,7 @@ def fit(
         Returns
         -------
         self: KaplanMeierFitter
-          self with new properties like 'survival_function_'.
+          self with new properties like ``survival_function_``.
 
         """
 
diff --git a/lifelines/fitters/log_logistic_fitter.py b/lifelines/fitters/log_logistic_fitter.py
index 53403a900..d6d84813a 100644
--- a/lifelines/fitters/log_logistic_fitter.py
+++ b/lifelines/fitters/log_logistic_fitter.py
@@ -11,15 +11,17 @@ class LogLogisticFitter(KnownModelParametericUnivariateFitter):
     This class implements a Log-Logistic model for univariate data. The model has parameterized
     form:
 
-    .. math::  S(t) = (1 + (t/\alpha)^{\beta})^{-1},   \alpha > 0, \beta > 0,
+    .. math::  S(t) = \left(1 + \left(\frac{t}{\alpha}\right)^{\beta}\right)^{-1},   \alpha > 0, \beta > 0,
 
     and the hazard rate is:
 
-    .. math::  h(t) = (\beta/\alpha)(t / \alpha) ^ {\beta-1} / (1 + (t/\alpha)^{\beta})
+    .. math::  h(t) = \frac{\left(\frac{\beta}{\alpha}\right)\left(\frac{t}{\alpha}\right) ^ {\beta-1}}{\left(1 + \left(\frac{t}{\alpha}\right)^{\beta}\right)}
 
-    After calling the `.fit` method, you have access to properties like:
-    ``cumulative_hazard_``, ``plot``, ``survival_function_``, ``alpha_`` and ``beta_``.
+    and the cumulative hazard is:
 
+    .. math:: H(t) = \log\left(\left(\frac{t}{\alpha}\right) ^ {\beta} + 1\right)
+
+    After calling the `.fit` method, you have access to properties like: ``cumulative_hazard_``, ``plot``, ``survival_function_``, ``alpha_`` and ``beta_``.
     A summary of the fit is available with the method 'print_summary()'
     
     Examples
@@ -42,4 +44,4 @@ def median_(self):
 
     def _cumulative_hazard(self, params, times):
         alpha_, beta_ = params
-        return np.log((times / alpha_) ** beta_ + 1)
+        return np.log1p((times / alpha_) ** beta_)
diff --git a/lifelines/fitters/log_normal_fitter.py b/lifelines/fitters/log_normal_fitter.py
index 94e581694..214e2000f 100644
--- a/lifelines/fitters/log_normal_fitter.py
+++ b/lifelines/fitters/log_normal_fitter.py
@@ -12,18 +12,15 @@ class LogNormalFitter(KnownModelParametericUnivariateFitter):
     This class implements an Log Normal model for univariate data. The model has parameterized
     form:
 
-    .. math::  S(t) = 1 - \Phi((log(t) - \mu)/\sigma),   \sigma >0
+    .. math::  S(t) = 1 - \Phi((\log(t) - \mu)/\sigma),   \sigma >0
 
     where :math:`\Phi` is the CDF of a standard normal random variable. 
     This implies the cumulative hazard rate is
 
-    .. math::  H(t) = -log(1 - \Phi((log(t) - \mu)/\sigma))
+    .. math::  H(t) = -\log(1 - \Phi((\log(t) - \mu)/\sigma))
 
-
-    After calling the `.fit` method, you have access to properties like:
-     'survival_function_', 'mu_', 'sigma_'
-
-    A summary of the fit is available with the method 'print_summary()'
+    After calling the `.fit` method, you have access to properties like: ``survival_function_``, ``mu_``, ``sigma_``.
+    A summary of the fit is available with the method ``print_summary()``.
 
     """
 
@@ -39,4 +36,4 @@ def _cumulative_hazard(self, params, times):
         Z = (np.log(times) - mu_) / sigma_
         cdf = norm.cdf(Z, loc=0, scale=1)
         cdf = np.clip(cdf, 0.0, 1 - 1e-14)
-        return -np.log(1 - cdf)
+        return -np.log1p(-cdf)
diff --git a/lifelines/fitters/nelson_aalen_fitter.py b/lifelines/fitters/nelson_aalen_fitter.py
index 3db7f4c74..c1084c626 100644
--- a/lifelines/fitters/nelson_aalen_fitter.py
+++ b/lifelines/fitters/nelson_aalen_fitter.py
@@ -25,8 +25,12 @@ class NelsonAalenFitter(UnivariateFitter):
 
     NelsonAalenFitter(alpha=0.95, nelson_aalen_smoothing=True)
 
-    alpha: The alpha value associated with the confidence intervals.
-    nelson_aalen_smoothing: If the event times are naturally discrete (like discrete years, minutes, etc.)
+    Parameters
+    ----------
+    alpha: float, optional
+        The alpha value associated with the confidence intervals.
+    nelson_aalen_smoothing: bool, optional
+        If the event times are naturally discrete (like discrete years, minutes, etc.)
       then it is advisable to turn this parameter to False. See [1], pg.84.
 
     Notes
@@ -79,8 +83,7 @@ def fit(
             the alpha value in the confidence intervals. Overrides the initializing
            alpha for this call to fit only.
         ci_labels: iterable
-            add custom column names to the generated confidence intervals
-              as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: <label>_lower_<alpha>
+            add custom column names to the generated confidence intervals as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: <label>_lower_<alpha>
         weights: n array, or pd.Series, of length n
             if providing a weighted dataset. For example, instead
             of providing every subject as a single element of `durations` and `event_observed`, one could
@@ -88,7 +91,7 @@ def fit(
 
         Returns
         -------
-          self, with new properties like 'cumulative_hazard_'.
+          self, with new properties like ``cumulative_hazard_``.
 
         """
 
@@ -211,7 +214,7 @@ def smoothed_hazard_confidence_intervals_(self, bandwidth, hazard_=None):
           bandwidth: float
             the bandwith to use in the Epanechnikov kernel. > 0
           hazard_: numpy array
-            a computed (n,) numpy array of estimated hazard rates. If none, uses naf.smoothed_hazard_
+            a computed (n,) numpy array of estimated hazard rates. If none, uses ``smoothed_hazard_``
         """
         if hazard_ is None:
             hazard_ = self.smoothed_hazard_(bandwidth).values[:, 0]
diff --git a/lifelines/fitters/piecewise_exponential_fitter.py b/lifelines/fitters/piecewise_exponential_fitter.py
index 69508ab1b..d1562d462 100644
--- a/lifelines/fitters/piecewise_exponential_fitter.py
+++ b/lifelines/fitters/piecewise_exponential_fitter.py
@@ -17,13 +17,11 @@ class PiecewiseExponentialFitter(KnownModelParametericUnivariateFitter):
                         ... 
                       \end{cases}
 
-    You specify the breakpoints, :math:`\tau_i`, and lifelines will find the 
+    You specify the breakpoints, :math:`\tau_i`, and *lifelines* will find the 
     optional values for the parameters. 
 
-    After calling the `.fit` method, you have access to properties like:
-     'survival_function_', 'plot', 'cumulative_hazard_'
-
-    A summary of the fit is available with the method 'print_summary()'
+    After calling the `.fit` method, you have access to properties like: ``survival_function_``, ``plot``, ``cumulative_hazard_``.
+    A summary of the fit is available with the method ``print_summary()``.
 
     """
 
diff --git a/lifelines/fitters/weibull_fitter.py b/lifelines/fitters/weibull_fitter.py
index 03557fb76..1b2e38fbe 100644
--- a/lifelines/fitters/weibull_fitter.py
+++ b/lifelines/fitters/weibull_fitter.py
@@ -11,7 +11,7 @@ class WeibullFitter(KnownModelParametericUnivariateFitter):
     This class implements a Weibull model for univariate data. The model has parameterized
     form:
 
-    .. math::  S(t) = exp(-(\lambda t)^\rho),   \lambda > 0, \rho > 0,
+    .. math::  S(t) = \exp(-(\lambda t)^\rho),   \lambda > 0, \rho > 0,
 
     which implies the cumulative hazard rate is
 
@@ -21,10 +21,8 @@ class WeibullFitter(KnownModelParametericUnivariateFitter):
 
     .. math::  h(t) = \rho \lambda(\lambda t)^{\rho-1}
 
-    After calling the `.fit` method, you have access to properties like:
-    ``cumulative_hazard_``, ``survival_function_``, ``lambda_`` and ``rho_``.
-
-    A summary of the fit is available with the method 'print_summary()'
+    After calling the `.fit` method, you have access to properties like: ``cumulative_hazard_``, ``survival_function_``, ``lambda_`` and ``rho_``.
+    A summary of the fit is available with the method ``print_summary()``.
     
     Examples
     --------
diff --git a/lifelines/plotting.py b/lifelines/plotting.py
index 5589493e4..c15066e09 100644
--- a/lifelines/plotting.py
+++ b/lifelines/plotting.py
@@ -4,6 +4,8 @@
 import numpy as np
 from lifelines.utils import coalesce
 
+__all__ = ["add_at_risk_counts", "plot_lifetimes"]
+
 
 def is_latex_enabled():
     """
@@ -73,43 +75,41 @@ def add_at_risk_counts(*fitters, **kwargs):
     """
     Add counts showing how many individuals were at risk at each time point in
     survival/hazard plots.
-
-    Arguments:
+    
+    Parameters
+    ----------
+    fitters:
       One or several fitters, for example KaplanMeierFitter,
       NelsonAalenFitter, etc...
 
-    Keyword arguments (all optional):
-      ax: The axes to add the labels to. Default is the current axes.
-      fig: The figure of the axes. Default is the current figure.
-      labels: The labels to use for the fitters. Default is whatever was
-              specified in the fitters' fit-function. Giving 'None' will
-              hide fitter labels.
 
-    Returns:
+    Returns
+    --------
       ax: The axes which was used.
 
-    Examples:
-        # First train some fitters and plot them
-        fig = plt.figure()
-        ax = plt.subplot(111)
-
-        f1 = KaplanMeierFitter()
-        f1.fit(data)
-        f1.plot(ax=ax)
-
-        f2 = KaplanMeierFitter()
-        f2.fit(data)
-        f2.plot(ax=ax)
-
-        # There are equivalent
-        add_at_risk_counts(f1, f2)
-        add_at_risk_counts(f1, f2, ax=ax, fig=fig)
-
-        # This overrides the labels
-        add_at_risk_counts(f1, f2, labels=['fitter one', 'fitter two'])
-
-        # This hides the labels
-        add_at_risk_counts(f1, f2, labels=None)
+    Examples
+    --------
+    >>> # First train some fitters and plot them
+    >>> fig = plt.figure()
+    >>> ax = plt.subplot(111)
+    >>>
+    >>> f1 = KaplanMeierFitter()
+    >>> f1.fit(data)
+    >>> f1.plot(ax=ax)
+    >>>
+    >>> f2 = KaplanMeierFitter()
+    >>> f2.fit(data)
+    >>> f2.plot(ax=ax)
+    >>>
+    >>> # These are equivalent
+    >>> add_at_risk_counts(f1, f2)
+    >>> add_at_risk_counts(f1, f2, ax=ax, fig=fig)
+    >>>
+    >>> # This overrides the labels
+    >>> add_at_risk_counts(f1, f2, labels=['fitter one', 'fitter two'])
+    >>>
+    >>> # This hides the labels
+    >>> add_at_risk_counts(f1, f2, labels=None)
     """
     from matplotlib import pyplot as plt
 
@@ -181,12 +181,12 @@ def plot_lifetimes(
     **kwargs
 ):
     """
-    Retuns a lifetime plot, see examples: https://lifelines.readthedocs.io/en/latest/Survival%20Analysis%20intro.html#censorship
+    Returns a lifetime plot, see examples: https://lifelines.readthedocs.io/en/latest/Survival%20Analysis%20intro.html#Censoring
     
     Parameters
     -----------
     durations: (n,) numpy array or pd.Series
-       duration subject was observed for.
+      duration subject was observed for.
     event_observed: (n,) numpy array or pd.Series
       array of booleans: True if event observed, else False.
     entry: (n,) numpy array or pd.Series 
diff --git a/lifelines/statistics.py b/lifelines/statistics.py
index ff516d0b9..8e5eac398 100644
--- a/lifelines/statistics.py
+++ b/lifelines/statistics.py
@@ -644,10 +644,6 @@ class TimeTransformers:
     def get(self, key_or_callable):
         return self.TIME_TRANSFOMERS.get(key_or_callable, key_or_callable)
 
-    def __iter__(self):
-        for key, item in self.TIME_TRANSFOMERS.items():
-            yield key, item
-
 
 def proportional_hazard_test(
     fitted_cox_model, training_df, time_transform="rank", precomputed_residuals=None, **kwargs
@@ -662,9 +658,9 @@ def proportional_hazard_test(
         but later CoxTimeVaryingFitter, too.
     training_df: DataFrame
         the DataFrame used in the call to the Cox model's ``fit``. 
-    time_transform: vectorized function or string, optional (default='rank')
+    time_transform: vectorized function, list, or string, optional (default='rank')
         {'all', 'km', 'rank', 'identity', 'log'} 
-        One of the strings above, or a function to transform the time (must accept (time, durations, weights) however). 'all' will present all the transforms. 
+        One of the strings above, a list of strings, or a function to transform the time (it must accept the arguments (durations, events, weights)). 'all' will present all the transforms.
     precomputed_residuals: DataFrame, optional
         specify the residuals, if already computed. 
     kwargs: 
@@ -697,10 +693,14 @@ def compute_statistic(times, resids):
         return T
 
     if time_transform == "all":
+        time_transform = list(TimeTransformers.TIME_TRANSFOMERS.keys())
+
+    if isinstance(time_transform, list):
 
         result = StatisticalResult([], [], [])
 
-        for transform_name, transform in TimeTransformers():
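+        # pair each requested entry with its transform; ``get`` returns entries that are not known names unchanged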
+        for transform_name, transform in ((_, TimeTransformers().get(_)) for _ in time_transform):
             times = transform(durations, events, weights)[events.values]
             T = compute_statistic(times, scaled_resids)
             p_values = _to_array([chisq_test(t, 1) for t in T])
diff --git a/lifelines/utils/__init__.py b/lifelines/utils/__init__.py
index bf4aec374..7fc5f4586 100644
--- a/lifelines/utils/__init__.py
+++ b/lifelines/utils/__init__.py
@@ -18,6 +18,7 @@
     "qth_survival_time",
     "median_survival_times",
     "survival_table_from_events",
+    "group_survival_table_from_events",
     "datetimes_to_durations",
     "concordance_index",
     "k_fold_cross_validation",
@@ -34,7 +35,6 @@ class StatError(Exception):
 
 class ConvergenceError(ValueError):
     # inherits from ValueError for backwards compatilibity reasons
-
     def __init__(self, msg, original_exception=""):
         super(ConvergenceError, self).__init__(msg + (": %s" % original_exception))
         self.original_exception = original_exception
@@ -64,7 +64,7 @@ def qth_survival_times(q, survival_functions, cdf=False):
 
     Returns
     -------
-      v: float, or DataFrame
+    float, or DataFrame
          if d==1, returns a float, np.inf if infinity.
          if d > 1, an DataFrame containing the first times the value was crossed.
 
@@ -74,14 +74,18 @@ def qth_survival_times(q, survival_functions, cdf=False):
     """
     # pylint: disable=cell-var-from-loop,misplaced-comparison-constant,no-else-return
     q = pd.Series(q)
+
     if not ((q <= 1).all() and (0 <= q).all()):
         raise ValueError("q must be between 0 and 1")
 
     survival_functions = pd.DataFrame(survival_functions)
     if survival_functions.shape[1] == 1 and q.shape == (1,):
-        return survival_functions.apply(lambda s: qth_survival_time(q[0], s, cdf=cdf)).iloc[0]
+        q = q[0]
+        return survival_functions.apply(lambda s: qth_survival_time(q, s, cdf=cdf)).iloc[0]
     else:
-        survival_times = pd.DataFrame({_q: survival_functions.apply(lambda s: qth_survival_time(_q, s)) for _q in q}).T
+        survival_times = pd.DataFrame(
+            {_q: survival_functions.apply(lambda s: qth_survival_time(_q, s, cdf=cdf)) for _q in q}
+        ).T
 
         #  Typically, one would expect that the output should equal the "height" of q.
         #  An issue can arise if the Series q contains duplicate values. We solve
@@ -106,13 +110,13 @@ def qth_survival_time(q, survival_function, cdf=False):
 
     Returns
     -------
-      v: float
+    float
 
     See Also
     --------
     qth_survival_times, median_survival_times
     """
-    if isinstance(survival_function, pd.DataFrame):
+    if type(survival_function) is pd.DataFrame:  # pylint: disable=unidiomatic-typecheck
         if survival_function.shape[1] > 1:
             raise ValueError(
                 "Expecting a dataframe (or series) with a single column. Provide that or use utils.qth_survival_times."
@@ -123,11 +127,11 @@ def qth_survival_time(q, survival_function, cdf=False):
     if cdf:
         if survival_function.iloc[0] > q:
             return np.inf
-        v = (survival_function <= q).idxmin(0)
+        v = survival_function.index[survival_function.searchsorted(q)]
     else:
         if survival_function.iloc[-1] > q:
             return np.inf
-        v = (survival_function <= q).idxmax(0)
+        v = survival_function.index[(-survival_function).searchsorted(-q)]
     return v
 
 
@@ -277,13 +281,13 @@ def survival_table_from_events(
 
     Returns
     -------
-    output: DataFrame
-        Pandas DataFrame with index as the unique times or intervals in event_times. The columns named
-        'removed' refers to the number of individuals who were removed from the population
-        by the end of the period. The column 'observed' refers to the number of removed
-        individuals who were observed to have died (i.e. not censored.) The column
-        'censored' is defined as 'removed' - 'observed' (the number of individuals who
-         left the population due to event_observed)
+    DataFrame
+      Pandas DataFrame with index as the unique times or intervals in event_times. The columns named
+      'removed' refers to the number of individuals who were removed from the population
+      by the end of the period. The column 'observed' refers to the number of removed
+      individuals who were observed to have died (i.e. not censored.) The column
+      'censored' is defined as 'removed' - 'observed' (the number of individuals who
+      left the population due to event_observed)
 
     Example
     -------
@@ -448,6 +452,17 @@ def datetimes_to_durations(
         array of floats representing the durations with time units given by freq.
     C: numpy array
         boolean array of event observations: 1 if death observed, 0 else.
+    
+    Examples
+    --------
+    >>> from lifelines.utils import datetimes_to_durations
+    >>> 
+    >>> start_dates = ['2015-01-01', '2015-04-01', '2014-04-05']
+    >>> end_dates = ['2016-02-02', None, '2014-05-06']
+    >>>
+    >>> T, E = datetimes_to_durations(start_dates, end_dates, freq="D")
+    >>> T # array([ 397., 1414.,   31.])
+    >>> E # array([ True, False,  True])
 
     """
     fill_date = pd.to_datetime(fill_date)
@@ -548,43 +563,43 @@ def k_fold_cross_validation(
     Parameters
     ----------
     fitters: model
-        one or several objects which possess a method:
-        fit(self, data, duration_col, event_col)
-        Note that the last two arguments will be given as keyword arguments,
-        and that event_col is optional. The objects must also have
-        the "predictor" method defined below.
+      one or several objects which possess a method:
+      fit(self, data, duration_col, event_col)
+      Note that the last two arguments will be given as keyword arguments,
+      and that event_col is optional. The objects must also have
+      the "predictor" method defined below.
     df: DataFrame
-        a Pandas dataframe with necessary columns `duration_col` and `event_col`, plus
-        other covariates. `duration_col` refers to the lifetimes of the subjects. `event_col`
-        refers to whether the 'death' events was observed: 1 if observed, 0 else (censored).
+      a Pandas dataframe with necessary columns `duration_col` and `event_col`, plus
+      other covariates. `duration_col` refers to the lifetimes of the subjects. `event_col`
+      refers to whether the 'death' events was observed: 1 if observed, 0 else (censored).
     duration_col: (n,) array
-        the column in dataframe that contains the subjects lifetimes.
+      the column in dataframe that contains the subjects lifetimes.
     event_col: (n,) array
-        the column in dataframe that contains the subject's death observation. If left
-        as None, assumes all individuals are non-censored.
+      the column in dataframe that contains the subject's death observation. If left
+      as None, assumes all individuals are non-censored.
     k: int
-        the number of folds to perform. n/k data will be withheld for testing on.
+      the number of folds to perform. n/k data will be withheld for testing on.
     evaluation_measure: function
-        a function that accepts either (event_times, predicted_event_times),
-        or (event_times, predicted_event_times, event_observed)
-        and returns something (could be anything).
-        Default: statistics.concordance_index: (C-index)
-        between two series of event times
+      a function that accepts either (event_times, predicted_event_times),
+      or (event_times, predicted_event_times, event_observed)
+      and returns something (could be anything).
+      Default: statistics.concordance_index: (C-index)
+      between two series of event times
     predictor: string
-       a string that matches a prediction method on the fitter instances.
-       For example, "predict_expectation" or "predict_percentile".
-       Default is "predict_expectation"
-       The interface for the method is:
-           predict(self, data, **optional_kwargs)
+      a string that matches a prediction method on the fitter instances.
+      For example, "predict_expectation" or "predict_percentile".
+      Default is "predict_expectation"
+      The interface for the method is:
+          predict(self, data, **optional_kwargs)
     fitter_kwargs: 
-        keyword args to pass into fitter.fit method
+      keyword args to pass into fitter.fit method
     predictor_kwargs: 
-        keyword args to pass into predictor-method.
+      keyword args to pass into predictor-method.
 
     Returns
     -------
     results: list
-        (k,1) list of scores for each fold. The scores can be anything.
+      (k,1) list of scores for each fold. The scores can be anything.
     """
     # Make sure fitters is a list
     try:
@@ -1316,7 +1331,7 @@ def format_floats(decimals):
 
 
 def dataframe_interpolate_at_times(df, times):
-    return df.reindex(df.index.union(_to_array(times))).interpolate("index").loc[times].squeeze()
+    return df.reindex(df.index.union(_to_array(times))).interpolate(method="index").loc[times].squeeze()
 
 
 string_justify = lambda width: lambda s: s.rjust(width, " ")
diff --git a/lifelines/utils/concordance.py b/lifelines/utils/concordance.py
index c3efc6433..2a64bef49 100644
--- a/lifelines/utils/concordance.py
+++ b/lifelines/utils/concordance.py
@@ -29,12 +29,20 @@ def concordance_index(event_times, predicted_scores, event_observed=None):
     c-index: float
       a value between 0 and 1.
 
-    Notes
+    References
     -----
     Harrell FE, Lee KL, Mark DB. Multivariable prognostic models: issues in
     developing models, evaluating assumptions and adequacy, and measuring and
     reducing errors. Statistics in Medicine 1996;15(4):361-87.
 
+    Examples
+    --------
+
+    >>> from lifelines.utils import concordance_index
+    >>> cph = CoxPHFitter().fit(df, 'T', 'E')
+    >>> concordance_index(df['T'], -cph.predict_partial_hazard(df), df['E'])
+
+
     """
     event_times = np.asarray(event_times, dtype=float)
     predicted_scores = np.asarray(predicted_scores, dtype=float)
diff --git a/lifelines/version.py b/lifelines/version.py
index 5d5c383a6..f9e8b144b 100644
--- a/lifelines/version.py
+++ b/lifelines/version.py
@@ -1,4 +1,4 @@
 # -*- coding: utf-8 -*-
 from __future__ import unicode_literals
 
-__version__ = "0.18.5"
+__version__ = "0.18.6"
diff --git a/perf_tests/cp_perf_test.py b/perf_tests/cp_perf_test.py
index 101d0adae..ed9ec78ec 100644
--- a/perf_tests/cp_perf_test.py
+++ b/perf_tests/cp_perf_test.py
@@ -12,9 +12,11 @@
 
     df = load_rossi()
     df = pd.concat([df] * 20)
+    # df = df.reset_index()
     # df['week'] = np.random.exponential(1, size=df.shape[0])
     cp = CoxPHFitter()
-    start_time = time.time()
     cp.fit(df, duration_col="week", event_col="arrest", batch_mode=True)
+    start_time = time.time()
+    print(cp.predict_median(df))
     print("--- %s seconds ---" % (time.time() - start_time))
     cp.print_summary(4)
diff --git a/tests/test_estimation.py b/tests/test_estimation.py
index 8323562e4..9389fdcc2 100644
--- a/tests/test_estimation.py
+++ b/tests/test_estimation.py
@@ -564,7 +564,7 @@ def test_lnf_inference_with_really_small_sigma(self, lnf):
         assert abs(sigma / lnf.sigma_ - 1) < 0.05
 
     def test_lnf_inference_no_censorship(self, lnf):
-        N = 250000
+        N = 800000
         mu = 10 * np.random.randn()
         sigma = np.random.exponential(10)
 
@@ -2688,6 +2688,14 @@ def test_what_happens_to_nans(self, rossi, cph):
         with pytest.raises(TypeError):
             cph.fit(rossi, duration_col="week", event_col="arrest")
 
+    def test_check_assumptions_fails_for_nonunique_index(self, cph, rossi):
+
+        cph.fit(rossi, "week", "arrest")
+
+        rossi.index = np.ones(rossi.shape[0])
+        with pytest.raises(IndexError):
+            cph.check_assumptions(rossi)
+
 
 class TestAalenAdditiveFitter:
     @pytest.fixture()
diff --git a/tests/test_statistics.py b/tests/test_statistics.py
index f940d7385..b44298e25 100644
--- a/tests/test_statistics.py
+++ b/tests/test_statistics.py
@@ -408,3 +408,36 @@ def test_proportional_hazard_test_with_kmf_with_some_censorship_and_weights():
         cph.fit(df, "T", "E", weights_col="w")
         results = stats.proportional_hazard_test(cph, df)
         npt.assert_allclose(results.summary.loc["var1"]["test_statistic"], 0.916, rtol=1e-2)
+
+
+def test_proportional_hazard_test_with_all():
+
+    df = pd.DataFrame(
+        {
+            "var1": [0.209325, 0.693919, 0.443804, 0.065636, 0.386294],
+            "T": [5.269797, 6.601666, 7.335846, 11.684092, 12.678458],
+            "E": [1, 1, 1, 0, 1],
+        }
+    )
+
+    cph = CoxPHFitter()
+    cph.fit(df, "T", "E")
+    results = stats.proportional_hazard_test(cph, df, time_transform="all")
+    assert results.summary.shape[0] == 1 * 4
+
+
+def test_proportional_hazard_test_with_list():
+
+    df = pd.DataFrame(
+        {
+            "var1": [0.209325, 0.693919, 0.443804, 0.065636, 0.386294],
+            "var2": [1, 0, 1, 0, 1],
+            "T": [5.269797, 6.601666, 7.335846, 11.684092, 12.678458],
+            "E": [1, 1, 1, 0, 1],
+        }
+    )
+
+    cph = CoxPHFitter()
+    cph.fit(df, "T", "E")
+    results = stats.proportional_hazard_test(cph, df, time_transform=["rank", "km"])
+    assert results.summary.shape[0] == 2 * 2