SurvivalDNN Usage Example¶

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
np.random.seed(42)

Data¶

In this simple example, suppose a widget factory produces widgets of varying length, width, and widget factor. We observe these widget-level characteristics as features $X$, as well as the widgets' failure times $Y$. The goal is to draw inferences or make estimates about the distribution $P(Y > t|X)$.

In [2]:
def generate_synthetic_data(n=100):
    # Observed features
    length = np.random.uniform(1., 8., size=n)
    width = np.random.uniform(0.5, 4., size=n)
    widget_factor = np.random.uniform(0.2, 2., size=n)
    X = np.stack([length, width, widget_factor], axis=-1)

    # True DGP (unobserved)
    epsilon = np.random.normal(0, 0.1, size=n)
    U = 1 - 0.1*length - 0.1*width - widget_factor + epsilon
    rate = np.exp(U)

    # Observed outcomes
    Y = np.exp(-rate) * 10

    return X, Y

X, Y = generate_synthetic_data(n=10000)
In [3]:
plt.hist(Y)
plt.title('Distribution of Widget Time-Until-Failure')
plt.xlabel('Years')
plt.show()
[Figure: histogram of widget time-until-failure, in years]

Model¶

In [4]:
from survivaldnn import SurvivalDNNModel
In [5]:
model = SurvivalDNNModel()

Discretization¶

One important consideration is numSupport, which determines the number of support points used to discretize the outcome space. The output of the neural network is of the form $$ P(Y > t_1|X),\; P(Y > t_2|X),\; \ldots,\; P(Y > t_{\text{numSupport}}|X). $$ If numSupport is too small, too many observations are combined into each bin and we lose precision. If it is too large, some bins may contain very few observations and we lose efficiency or get noisy estimates.

In [6]:
# Internally, this is used to determine the support points
# t_1, t_2, ..., t_{numSupport}
support = model.discretize_outcome_support(Y, numSupport=10)
support
Out[6]:
array([1.32513751, 3.83058098, 4.6781604 , 5.39642685, 6.00376299,
       6.57914055, 7.09105098, 7.54190942, 7.99987867, 9.00493482])
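The support points track the spread of $Y$. One common way to choose such points is via empirical quantiles, sketched below with plain numpy; this is only an illustration of the idea, not necessarily how discretize_outcome_support is implemented internally.

# Hypothetical quantile-based discretization -- an illustration of the
# general idea, not SurvivalDNN's actual implementation
numSupport = 10
probs = np.linspace(0, 1, numSupport + 2)[1:-1]  # interior quantile levels
np.quantile(Y, probs)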

Compilation¶

Next we compile the neural network model by specifying its architecture, regularization, loss function, and other hyperparameters. The default is a fully-connected residual network with batch normalization, leaky ReLU activations, and the Adam optimizer. For additional documentation, see help(model.compile).

In [7]:
numFeatures = X.shape[-1]
model.compile(numFeatures=numFeatures,
              numSupport=100,
              loss='loglik',
              architecture='resnet',
              layers=5)
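For intuition about the default architecture, a fully-connected residual block with batch normalization and leaky ReLU might look like the Keras sketch below. This is a generic illustration of the pattern, not SurvivalDNN's actual internals.

# Illustrative only: a generic fully-connected residual block with
# batch normalization and leaky ReLU (not SurvivalDNN's internals)
import tensorflow as tf

def residual_block(x, units):
    h = tf.keras.layers.Dense(units)(x)
    h = tf.keras.layers.BatchNormalization()(h)
    h = tf.keras.layers.LeakyReLU()(h)
    return tf.keras.layers.Add()([x, h])  # skip connection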

Train¶

Finally we can train the model on the dataset. The previous step in this example specified that we are minimizing the negative log-likelihood. For more prediction-focused tasks, where the emphasis is on point estimates, alternative loss functions include mse or custom callables, as sketched below.
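A custom callable might look like the following. The exact (y_true, y_pred) signature expected by SurvivalDNNModel is an assumption here, based on common Keras conventions; check help(model.compile) before relying on it.

# Hypothetical custom loss; the (y_true, y_pred) signature is assumed,
# following common Keras conventions
import tensorflow as tf

def my_mse(y_true, y_pred):
    return tf.reduce_mean(tf.square(y_true - y_pred))

# model.compile(..., loss=my_mse)  # instead of loss='loglik'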

In [8]:
# Standardize features
X = (X - X.mean(axis=0)) / X.std(axis=0)
In [9]:
# Train the model
model.fit(X, Y,
          epochs=2000)

Inference¶

After training, we can then estimate statistics of interest from the learned distribution $\hat{P}(Y > t|X)$.

Point Estimates/Predictions¶

Estimation of $\hat{\mathbb{E}}_n[Y|X=x]$ can be done with .predict.

In the widget factory application, this is the expected failure time for a given widget with features $x$.
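This works because, for a nonnegative outcome, the mean is recoverable from the survival curve alone: $$ \hat{\mathbb{E}}_n[Y|X=x] = \int_0^\infty \hat{P}(Y > t|X=x)\,dt, $$ which can be approximated by a sum over the discretized support points.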

In [10]:
Y_hat = model.predict(X)
In [11]:
def compare_predictions(res):
    # Scatter true vs. predicted failure times, with the 45-degree
    # line indicating perfect prediction
    fig, ax = plt.subplots(figsize=(12, 7))
    ax.set_xlim((0, 10))
    ax.set_ylim((0, 10))
    res.plot.scatter(x='True', y='Predicted', ax=ax)
    a, b = res.min().min(), res.max().max()
    plt.plot([a, b], [a, b], 'r--', lw=2, label='Perfect Prediction')
    plt.legend()
    plt.show()
In [12]:
res = pd.DataFrame(np.stack([Y, Y_hat], axis=-1), columns=['True', 'Predicted'])
compare_predictions(res)
[Figure: scatter of true vs. predicted failure times, with the perfect-prediction line]

Conditional Point Estimates/Predictions¶

In some scenarios, we know that at least $t$ time has already passed without failure, and we may wish to incorporate this information to improve our estimates. Estimation of $\hat{\mathbb{E}}_n[Y|X=x, Y>t]$ can be done with .predict_conditional.

In the widget factory application, this is the expected failure time for a given widget with features $x$ given that at least $t$ time has already passed.
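The same identity as above, restricted to the surviving tail, gives $$ \hat{\mathbb{E}}_n[Y|X=x, Y>t] = t + \frac{1}{\hat{P}(Y > t|X=x)} \int_t^\infty \hat{P}(Y > u|X=x)\,du, $$ so conditioning amounts to renormalizing the tail of the same estimated survival curve; no refitting should be required.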

In [13]:
# Suppose we inspected widgets halfway and
# observed they haven't failed yet
elapsed = Y / 2
Y_hat_cond = model.predict_conditional(X, elapsed)
In [14]:
res = pd.DataFrame(np.stack([Y, Y_hat_cond], axis=-1), columns=['True', 'Predicted'])
compare_predictions(res)
[Figure: scatter of true vs. conditionally predicted failure times, with the perfect-prediction line]

Survival Function¶

The survival function $S(t|X) = P(Y \geq t|X)$ can be estimated and plotted with .predict_survival_function and .plot_survival_function.

In [15]:
survFunc, support = model.predict_survival_function(X[:100,:])
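The returned arrays can also be used directly. For instance, the sketch below approximately recovers point predictions by integrating each survival curve over the support grid; it assumes survFunc has shape (n_observations, len(support)) and ignores any probability mass below the first support point.

# Sketch: approximate E[Y|X] by trapezoidal integration of each
# discretized survival curve over the support grid; assumes survFunc
# has shape (n_observations, len(support))
dt = np.diff(support)
Y_hat_manual = np.sum(0.5 * (survFunc[:, 1:] + survFunc[:, :-1]) * dt, axis=-1)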
In [16]:
model.plot_survival_function(X[:100,:])
[Figure: estimated survival curves for the first 100 widgets]

Cumulative Distribution Function¶

The closely related CDF $P(Y < t|X)$ can be plotted with .plot_distribution.
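Since the CDF at each support point is just the complement of the survival function, it can also be recovered manually from the arrays returned by .predict_survival_function above:

# The CDF is the complement of the discretized survival curve
cdf = 1.0 - survFunc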

In [17]:
model.plot_distribution(X[:100,:])
[Figure: estimated CDF curves for the first 100 widgets]