!pip install https://github.com/vankesteren/tensorsem/archive/master.zip
!pip install deepirtools


import torch
import tensorsem as ts
import deepirtools

import pandas as pd
from pathlib import Path
import sys
import os
import urllib.request
import shutil
import numpy as np
import itertools
import timeit

deepirtools.manual_seed(123) # Set seed for reproducibility.
                             # This sets seeds for PyTorch, NumPy, and the Python module "random".


data_dir = Path("./data")  # Directory where the data is stored.
lr = 0.01  # Learning rate for stochastic gradient optimizer.
tol = 1e-20  # Loss change tolerance.
max_iter = 5000  # Maximum number of epochs (i.e., full passes through the data set) allowed.

opts = ts.SemOptions.from_file(data_dir / "hs_mod.pkl")  # This defines starting values, constraints, free parameters,
                                                         # and parameter shapes. You need to specify this for every
                                                         # model you fit, which is unwieldly but gives you a decent
                                                         # amount of control.
df = pd.read_csv(data_dir / "hs.csv")[opts.ov_names]  # Read in data and order columns.
df -= df.mean(0)  # Center the data.
sample_size, n_items = df.shape

data = torch.tensor(df.values, dtype = torch.float64, requires_grad = False)

model = ts.StructuralEquationModel(opt = opts, dtype = torch.float64)  # Create the model.
optimizer = torch.optim.Adam(model.parameters(), lr = lr)  # Create stochastic gradient optimizer.
lls = []  # For saving the log-likelihood values during fitting.
start = timeit.default_timer()
for epoch in range(max_iter):
    if epoch % 100 == 1:
        print("Epoch: {:d}".format(epoch), " mean loss: {:.2f}".format(lls[-1] / sample_size))
    optimizer.zero_grad() 
    Sigma = model()  # This computes the model-implied covariance matrix.
    loss = ts.mvn_negloglik(data, Sigma)  # Compute the negative log-likelihood.
    lls.append(-loss.item())
    loss.backward()
    optimizer.step()
    if epoch > 1:
        if abs(lls[-1] - lls[-2]) < tol: # Stop if log-likelihood hasn't changed more than tolerance.
            break
stop = timeit.default_timer()
print("Fitting ended in {:.2f} seconds".format(stop-start, ))

Epoch: 1  mean loss: -13.19
Epoch: 101  mean loss: -12.42
Epoch: 201  mean loss: -12.42
Epoch: 301  mean loss: -12.42
Fitting ended in 0.47 seconds


print("\nLoadings:\n", model.Lam.data,
      "\n\nFactor covariance matrix:\n", model.Psi.data,
      "\n\nResidual covariance matrix:\n", model.Tht.data)

Loadings:
 tensor([[0.8996, 0.0000, 0.0000],
        [0.4979, 0.0000, 0.0000],
        [0.6562, 0.0000, 0.0000],
        [0.0000, 0.9897, 0.0000],
        [0.0000, 1.1016, 0.0000],
        [0.0000, 0.9166, 0.0000],
        [0.0000, 0.0000, 0.6195],
        [0.0000, 0.0000, 0.7309],
        [0.0000, 0.0000, 0.6700]], dtype=torch.float64) 

Factor covariance matrix:
 tensor([[1.0000, 0.4585, 0.4705],
        [0.4585, 1.0000, 0.2830],
        [0.4705, 0.2830, 1.0000]], dtype=torch.float64) 

Residual covariance matrix:
 tensor([[0.5491, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 1.1338, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8443, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.3712, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.4463, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.3562, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.7994, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.4877, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.5661]],
       dtype=torch.float64)


Q = torch.block_diag(*[torch.ones([3, 1])] * 3) # Binary matrix imposing simple structure on the loadings.

model = deepirtools.IWAVE(
    model_type = "normal", # Normal linear factor model.
    learning_rate = lr,
    Q = Q,
    ints_mask = torch.zeros(9), # Constrain all intercepts to zero.
    inference_net_sizes = [20], # Hidden layer size for inference neural network.
    latent_size = 3, # Number of latent variables.
    n_items = 9,
    correlated_factors = [0, 1, 2], # Which factors should be correlated.
    n_intervals = 10 # This is the convergence criterion for I-WAVE.
)
model.fit(data,
          batch_size = sample_size, # We are doing full sample gradient descent rather than
                                    # sampling mini-batches of observations. If requested, DeepIRTools
                                    # handles mini-batch sampling behind the scenes.
          iw_samples = 100) # Increasing iw_samples improves the approximation to the
                            # exact log-likelihood.

Initializing model parameters
Initialization ended in  0.0  seconds

Fitting started
Epoch =     1100 Iter. =     1101 Cur. loss =   12.40   Intervals no change =   10
Fitting ended in  27.78  seconds


print("\nLoadings:\n", model.loadings,
      "\n\nFactor covariance matrix:\n", model.cov,
      "\n\nResidual covariance matrix:\n", model.residual_std.pow(2).diag())

Loadings:
 tensor([[0.9006, 0.0000, 0.0000],
        [0.4951, 0.0000, 0.0000],
        [0.6510, 0.0000, 0.0000],
        [0.0000, 0.9934, 0.0000],
        [0.0000, 1.1054, 0.0000],
        [0.0000, 0.9125, 0.0000],
        [0.0000, 0.0000, 0.6221],
        [0.0000, 0.0000, 0.7278],
        [0.0000, 0.0000, 0.6708]]) 

Factor covariance matrix:
 tensor([[1.0000, 0.4604, 0.4658],
        [0.4604, 1.0000, 0.2784],
        [0.4658, 0.2784, 1.0000]]) 

Residual covariance matrix:
 tensor([[0.5460, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 1.1346, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8484, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.3692, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.4464, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.3568, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.7979, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.4894, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.5637]])


# Download data.
filepath = "./data/IPIP-FFM-data-8Nov2018/data-final.csv"
if not os.path.exists(filepath):
    os.makedirs(os.path.dirname("./data/"), exist_ok=True)
    urllib.request.urlretrieve("https://openpsychometrics.org/_rawdata/IPIP-FFM-data-8Nov2018.zip",
                               "./data/ipip-ffm.zip")
    shutil.unpack_archive("./data/ipip-ffm.zip", "./data/")

# Pre-processing.
df = pd.read_csv(filepath, sep = "\t", header = 0)
df = df[df["IPC"] == 1] # Drop multiple submissions from same IP address.
df.iloc[:, :100] = df.iloc[:, :100].dropna() # Drop people with all NaN responses.
df = df[df.iloc[:, 0:50].sum(1) > 0] # Drop people with all missing responses.
df = df[(df["country"] != "NONE") & (~df["country"].isna())] # Drop people for whom no country was recorded.
rc_items = ["EXT2", "EXT4", "EXT6", "EXT8", "EXT10", "AGR1", "AGR3", "AGR5", "AGR7",
            "CSN2", "CSN4", "CSN6", "CSN8", "EST2", "EST4", "OPN2", "OPN4", "OPN6"]
df[rc_items] = ((1 - df[rc_items] / 5) * 5 + 1).mask(lambda col: col == 6, 0) # Reverse-code reverse-coded items.
Y = torch.from_numpy(df.iloc[:, :50].to_numpy()) - 1 # Collect item responses.
T = torch.from_numpy(df.iloc[:, 50:100].to_numpy()) / 1000 # Collect response times in seconds.

missing_mask = 1 * (Y != -1)
Y[Y == -1] = 0
T[T == 0] = 1e-7 # Set zero response times (which indicate missingness) to a small value.

keeps = (((T < 0).sum(dim = 1) == 0) & ((T > 100).sum(dim = 1) == 0)) # Drop negative or overly long response times
                                                                      # and missing baseline covariates.
Y, T, missing_mask = Y[keeps], T[keeps], missing_mask[keeps]

print(Y.shape) # Matrix of shape (sample_size, n_items).

torch.Size([621307, 50])


lr = 0.01  # Learning rate for stochastic gradient optimizer.

batch_size = 100
checker = deepirtools.utils.ConvergenceChecker(n_intervals = 50,   # This determines convergence for stochastic
                                               log_interval = 100) # gradient optimizers by smoothing over intervals.

# As noted above, this is pretty unwieldly, but does provide a lot of control.
# This object is called a dictionary. It is a container for key : object pairs where
# key is a string and object is some object. Here, we're providing starting values,
# free values (i.e., which values should be estimated), fixed values, parameter shapes,
# and variable names, respectively.
opt_dict = {"delta_start" : (([1.] * 10 + [0.] * 50) * 4 + [1.] * 10 +
                             list(itertools.chain.from_iterable([[1.] + [0.] * (50 - i) for i in range(1, 51)])) +
                             list(itertools.chain.from_iterable([[1.] + [0.] * (5 - i) for i in range(1, 6)])) +
                             [0.] * 25
                            ),
            "delta_free" : (([1.] * 10 + [0.] * 50) * 4 + [1.] * 10 +
                            list(itertools.chain.from_iterable([[1.] + [0.] * (50 - i) for i in range(1, 51)])) +
                            list(itertools.chain.from_iterable([[0.] + [1.] * (5 - i) for i in range(1, 6)])) +
                            [0.] * 25
                           ),
            "delta_value" : ([0.] * (250 + 1275) + 
                             list(itertools.chain.from_iterable([[1.] + [0.] * (5 - i) for i in range(1, 6)])) +
                             [0.] * 25),
            "delta_sizes" : [250, 1275, 15, 25], 
            "psi_shape" : [5, 5],
            "b_0_shape" : [5, 5],
            "lam_shape" : [50, 5],
            "tht_shape" : [50, 50],
            "ov_names" : ["x" + str(i) for i in range(1, 51)]
           }

opts = ts.SemOptions.from_dict(opt_dict) # Create the SemOptions object from our dictionary.
data = Y - Y.mean(dim = 0)
data = data[missing_mask.sum(dim = 1).eq(50)] # Listwise delete observations with missing values.
print(data.shape)                             # DeepIRTools can handle missingness, but it's not straightforward with
                                              # Tensorsem (to my knowledge).
sample_size, n_items = data.shape

model = ts.StructuralEquationModel(opt = opts, dtype = torch.float64)
optimizer = torch.optim.Adam(model.parameters(), lr = lr)
lls = []
epoch = 0
start = timeit.default_timer()
while not checker.converged:
    for fit_iter in range(sample_size // batch_size):
        idxs = np.random.choice(sample_size, size = batch_size, replace = False) # Indices for random sample.
        batch = data[idxs] # Select the random sample.
        optimizer.zero_grad()
        Sigma = model()
        loss = ts.mvn_negloglik(batch, Sigma)
        lls.append(-loss.item())
        loss.backward()
        optimizer.step()
        
        checker.check_convergence(epoch, len(lls), loss.item())
        if checker.converged:
            break
    epoch += 1
stop = timeit.default_timer()
print("\nFitting ended in {:.2f} seconds".format(stop-start, ))

torch.Size([540952, 50])
Epoch =        1 Iter. =     7401 Cur. loss = 7003.08   Intervals no change =   50
Fitting ended in 110.59 seconds


print("\nLoadings:\n", model.Lam.data,
      "\n\nFactor covariance matrix:\n", model.Psi.data,
      "\n\nResidual covariance matrix:\n", model.Tht.data)

Loadings:
 tensor([[0.8412, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.9280, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.7921, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.8976, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.9588, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.7761, 0.0000, 0.0000, 0.0000, 0.0000],
        [1.0249, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.7633, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.8413, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.9098, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.8959, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.6754, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.6496, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.5616, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.6413, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.9654, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.9333, 0.0000, 0.0000, 0.0000],
        [0.0000, 1.0069, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.8788, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.9016, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.6814, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.6516, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.4834, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8624, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8121, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.6902, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.7855, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.6051, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8109, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.4859, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.6712, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.8292, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.4066, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.8188, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.7608, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.9239, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.5439, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.6448, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.7247, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.4709, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5825],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5803],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5876],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5154],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.6291],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.6012],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.3914],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5950],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.2998],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.7292]], dtype=torch.float64) 

Factor covariance matrix:
 tensor([[ 1.0000, -0.2188,  0.3302,  0.1150,  0.2410],
        [-0.2188,  1.0000, -0.0069, -0.2994, -0.0926],
        [ 0.3302, -0.0069,  1.0000,  0.0850,  0.1103],
        [ 0.1150, -0.2994,  0.0850,  1.0000,  0.0601],
        [ 0.2410, -0.0926,  0.1103,  0.0601,  1.0000]], dtype=torch.float64) 

Residual covariance matrix:
 tensor([[0.7902, 0.0000, 0.0000,  ..., 0.0000, 0.0000, 0.0000],
        [0.0000, 0.8151, 0.0000,  ..., 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.7605,  ..., 0.0000, 0.0000, 0.0000],
        ...,
        [0.0000, 0.0000, 0.0000,  ..., 1.0678, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000,  ..., 0.0000, 0.7933, 0.0000],
        [0.0000, 0.0000, 0.0000,  ..., 0.0000, 0.0000, 0.4377]],
       dtype=torch.float64)


Q = torch.block_diag(*[torch.ones([10, 1])] * 5)

model = deepirtools.IWAVE(model_type = "normal",
                          learning_rate = lr,
                          Q = Q,
                          ints_mask = torch.zeros(n_items),
                          latent_size = 5,
                          n_items = n_items,
                          correlated_factors = [0, 1, 2, 3, 4],
                          n_intervals = 50
                         )
model.fit(data, batch_size = 100, iw_samples = 20)

Initializing model parameters
Initialization ended in  0.0  seconds

Fitting started
Epoch =        1 Iter. =     8901 Cur. loss =   72.33   Intervals no change =   50
Fitting ended in  71.8  seconds


print("\nLoadings:\n", model.loadings,
      "\n\nFactor covariance matrix:\n", model.cov,
      "\n\nResidual covariance matrix:\n", model.residual_std.pow(2).diag())

Loadings:
 tensor([[0.8761, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.9460, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.8202, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.9295, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.9256, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.7333, 0.0000, 0.0000, 0.0000, 0.0000],
        [1.0365, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.6733, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.7923, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.9434, 0.0000, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.9173, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.6535, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.6673, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.4805, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.6543, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.9212, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.9338, 0.0000, 0.0000, 0.0000],
        [0.0000, 1.0045, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.8527, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.8556, 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.7103, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.6635, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.4515, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8681, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8283, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.6733, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.7649, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.6031, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.8198, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.4855, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.6741, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.8271, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.3547, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.7507, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.7548, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.9388, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.5886, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.6112, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.7413, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.4456, 0.0000],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5532],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5902],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5897],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5550],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5843],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5948],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.4048],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.5883],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.3053],
        [0.0000, 0.0000, 0.0000, 0.0000, 0.7160]]) 

Factor covariance matrix:
 tensor([[ 1.0000, -0.2493,  0.3579,  0.0751,  0.2274],
        [-0.2493,  1.0000, -0.0103, -0.2530, -0.1102],
        [ 0.3579, -0.0103,  1.0000,  0.1108,  0.1663],
        [ 0.0751, -0.2530,  0.1108,  1.0000,  0.0274],
        [ 0.2274, -0.1102,  0.1663,  0.0274,  1.0000]]) 

Residual covariance matrix:
 tensor([[0.7743, 0.0000, 0.0000,  ..., 0.0000, 0.0000, 0.0000],
        [0.0000, 0.8230, 0.0000,  ..., 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.7074,  ..., 0.0000, 0.0000, 0.0000],
        ...,
        [0.0000, 0.0000, 0.0000,  ..., 1.1188, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000,  ..., 0.0000, 0.7851, 0.0000],
        [0.0000, 0.0000, 0.0000,  ..., 0.0000, 0.0000, 0.4416]])

Foundations of Deep Learning for the Social Sciences:
Day 2 Python Tutorial

Holzinger-Swineford Example¶

Big-Five Personality Factors Example¶

Foundations of Deep Learning for the Social Sciences:Day 2 Python Tutorial

Holzinger-Swineford Example¶

Big-Five Personality Factors Example¶

Foundations of Deep Learning for the Social Sciences:
Day 2 Python Tutorial