diff --git a/RidgeSC/cross_validation.py b/RidgeSC/cross_validation.py
index b452bb5..eb07a42 100644
--- a/RidgeSC/cross_validation.py
+++ b/RidgeSC/cross_validation.py
@@ -1,4 +1,3 @@
-
 from RidgeSC.fit_fold import  fold_v_matrix, fold_score
 from RidgeSC.fit_loo import  loo_v_matrix, loo_score, loo_weights
 from RidgeSC.fit_ct import  ct_v_matrix, ct_score
@@ -409,19 +408,19 @@ def repeatfunc(func, times=None, *args):
         return itertools.starmap(func, itertools.repeat(args))
     return itertools.starmap(func, itertools.repeat(args, times))
 
-def _gen_placebo_stats_from_diffs(N, effect_vec, std_effect_vec, joint_effect, joint_std_effect,
+def _gen_placebo_stats_from_diffs(N1, effect_vec, std_effect_vec, joint_effect, joint_std_effect,
                                  control_effect_vecs, control_std_effect_vecs, control_joint_effects, control_joint_std_effects,
                                  max_n_pl = 1000000, ret_pl = False, ret_CI=False, level=0.95):
     #ret_p1s=False
     keep_pl = ret_pl or ret_CI
-    C = control_effect_vecs.shape[0]
+    N0 = control_effect_vecs.shape[0]
     T1 = len(effect_vec)
-    n_pl = _ncr(C, N)
+    n_pl = _ncr(N0, N1)
     if (max_n_pl > 0 & n_pl > max_n_pl): #randomize
-        comb_iter = itertools.combinations(range(C), N)
+        comb_iter = itertools.combinations(range(N0), N1)
         comb_len = max_n_pl
     else:
-        comb_iter = repeatfunc(random_combination, n_pl, range(C), N)
+        comb_iter = repeatfunc(random_combination, n_pl, range(N0), N1)
         comb_len = n_pl
     placebo_effect_vecs = None
     if keep_pl:
@@ -483,13 +482,13 @@ def _gen_placebo_stats_from_diffs(N, effect_vec, std_effect_vec, joint_effect, j
 
 def estimate_effects(X, Y_pre, Y_post, treated_units, max_n_pl = 1000000, ret_pl = False, ret_CI=False, level=0.95, **kwargs):
     #TODO: Cleanup returning placebo distribution (incl pre?)
-    N = len(treated_units)
+    N1 = len(treated_units)
     X_and_Y_pre = np.hstack( ( X, Y_pre,) )
-    C_N = X_and_Y_pre.shape[0]
-    #C = C_N - N
+    N = X_and_Y_pre.shape[0]
+    #N0 = N - N1
     #T1 = Y_post.shape[1]
-    control_units = list(set(range(C_N)) - set(treated_units)) 
-    all_units = list(range(C_N))
+    control_units = list(set(range(N)) - set(treated_units)) 
+    all_units = list(range(N))
     Y_post_c = Y_post[control_units, :]
     Y_post_tr = Y_post[treated_units, :]
     X_and_Y_pre_c = X_and_Y_pre[control_units, :]
@@ -537,7 +536,7 @@ def estimate_effects(X, Y_pre, Y_post, treated_units, max_n_pl = 1000000, ret_pl
     joint_effect = np.mean(joint_effects)
     joint_std_effect = np.mean(joint_effects / pre_tr_rmspes)
 
-    return _gen_placebo_stats_from_diffs(N, effect_vec, std_effect_vec, joint_effect, joint_std_effect,
+    return _gen_placebo_stats_from_diffs(N1, effect_vec, std_effect_vec, joint_effect, joint_std_effect,
                                  control_effect_vecs, control_std_effect_vecs, control_joint_effects, control_joint_std_effects,
                                  max_n_pl, ret_pl, ret_CI, level)
 
diff --git a/RidgeSC/fit_ct.py b/RidgeSC/fit_ct.py
index fa5af52..ed29faf 100644
--- a/RidgeSC/fit_ct.py
+++ b/RidgeSC/fit_ct.py
@@ -72,7 +72,7 @@ def ct_v_matrix(X,
         raise TypeError( "L2_PEN_W is not a number")
 
     # CONSTANTS
-    C, N, K = len(control_units), len(treated_units), X.shape[1]
+    N0, N1, K = len(control_units), len(treated_units), X.shape[1]
     if start is None: 
         start = zeros(K) # formerly: .1 * ones(K) 
     Y_treated = Y[treated_units,:]
@@ -106,7 +106,7 @@ def ct_v_matrix(X,
         weights, A, _, AinvB = _weights(dv)
         Ey = (Y_treated - weights.T.dot(Y_control)).getA()
         dGamma0_dV_term2 = zeros(K)
-        dPI_dV = zeros((C, N))
+        dPI_dV = zeros((N0, N1))
         #Ai = A.I
         for k in range(K):
             if verbose:  # for large sample sizes, linalg.solve is a huge bottle neck,
@@ -121,12 +121,12 @@ def ct_v_matrix(X,
 
     L2_PEN_W_mat = 2 * L2_PEN_W * diag(ones(X_control.shape[0]))
     def _weights(V):
-        weights = zeros((C, N))
+        weights = zeros((N0, N1))
         A = X_control.dot(2*V).dot(X_control.T) + L2_PEN_W_mat # 5
         B = X_treated.dot(2*V).dot(X_control.T).T # 6
         b = linalg.solve(A,B)
         if intercept:
-            weights = b + 1/C
+            weights = b + 1/N0
         else:
             weights = b
         return weights, A, B,b
@@ -154,7 +154,7 @@ def ct_v_matrix(X,
     #    _do_gradient_check()
     if intercept: 
         # not above, b/c Y_treated was already offset at the start
-        weights += 1/C 
+        weights += 1/N0 
     return weights, v_mat, ts_score, ts_loss, L2_PEN_W, opt
 
 def ct_weights(X, V, L2_PEN_W, treated_units = None, control_units = None, intercept = True):
@@ -166,7 +166,7 @@ def ct_weights(X, V, L2_PEN_W, treated_units = None, control_units = None, inter
     if control_units is None: 
         control_units = list(set(range(X.shape[0])) - set(treated_units)) 
 
-    C = len(control_units)
+    N0 = len(control_units)
     X_treated = X[treated_units,:]
     X_control = X[control_units,:]
 
@@ -175,7 +175,7 @@ def ct_weights(X, V, L2_PEN_W, treated_units = None, control_units = None, inter
 
     weights = linalg.solve(A,B)
     if intercept:
-        weights += 1/C
+        weights += 1/N0
     return weights.T
 
 def ct_score(Y, X, V, L2_PEN_W, LAMBDA = 0, treated_units = None, control_units = None,**kwargs):
diff --git a/RidgeSC/fit_fold.py b/RidgeSC/fit_fold.py
index 064e268..caf9fde 100644
--- a/RidgeSC/fit_fold.py
+++ b/RidgeSC/fit_fold.py
@@ -105,11 +105,11 @@ def fold_v_matrix(X,
                  (i, len(treated_units),len(split[0]), len(split[1]), ))
 
     # CONSTANTS
-    C, N, K = len(control_units), len(treated_units), X.shape[1]
+    N0, N1, K = len(control_units), len(treated_units), X.shape[1]
     if start is None: 
         start = zeros(K) # formerly: .1 * ones(K) 
-    assert N > 0, "No control units"
-    assert C > 0, "No treated units"
+    assert N1 > 0, "No control units"
+    assert N0 > 0, "No treated units"
     assert K > 0, "variables to fit (X.shape[1] == 0)"
 
     # CREATE THE INDEX THAT INDICATES THE ELIGIBLE CONTROLS FOR EACH TREATED UNIT
@@ -131,9 +131,9 @@ def fold_v_matrix(X,
     Y_control = Y[control_units,:]
 
     # INITIALIZE PARTIAL DERIVATIVES
-    dA_dV_ki = [ [None,] *N for i in range(K)]
-    dB_dV_ki = [ [None,] *N for i in range(K)]
-    b_i = [None,] *N 
+    dA_dV_ki = [ [None,] *N1 for i in range(K)]
+    dB_dV_ki = [ [None,] *N1 for i in range(K)]
+    b_i = [None,] *N1 
     for i, k in  itertools.product(range(len(splits)), range(K)): # TREATED unit i, moment k
         _, test = splits[i]
         Xc = X[in_controls[i], : ]
@@ -160,7 +160,7 @@ def fold_v_matrix(X,
         weights, A, _ = _weights(dv)
         Ey = (Y_treated - weights.T.dot(Y_control)).getA()
         dGamma0_dV_term2 = zeros(K)
-        dPI_dV = zeros((C, N))
+        dPI_dV = zeros((N0, N1))
         for k in range(K):
             if verbose:  # for large sample sizes, linalg.solve is a huge bottle neck,
                 print("Calculating gradient, for moment %s of %s" % (k ,K,))
@@ -176,7 +176,7 @@ def fold_v_matrix(X,
         return LAMBDA - 2 * dGamma0_dV_term2 
 
     def _weights(V):
-        weights = zeros((C, N))
+        weights = zeros((N0, N1))
         A = X.dot(V + V.T).dot(X.T) + 2 * L2_PEN_W * diag(ones(X.shape[0])) # 5
         B = X.dot(V + V.T).dot(X.T).T # 6
         for i, (_,test) in enumerate(splits):
@@ -235,7 +235,7 @@ def fold_weights(X,
             control_units = list(set(range(X.shape[0])) - set(treated_units)) 
     control_units = np.array(control_units)
     treated_units = np.array(treated_units)
-    [C, N] = [len(control_units), len(treated_units)]
+    [N0, N1] = [len(control_units), len(treated_units)]
 
     splits = grad_splits # for readability...
     try:
@@ -249,7 +249,7 @@ def fold_weights(X,
     in_controls = [list(set(control_units) - set(treated_units[test])) for _,test in splits]
     in_controls2 = [np.ix_(i,i) for i in in_controls] # this is a much faster alternative to A[:,index][index,:]
 
-    # index of the controls relative to the rows of the outgoing C x N matrix of weights
+    # index of the controls relative to the rows of the outgoing N0 x N1 matrix of weights
     ctrl_rng = np.arange(len(control_units))
     out_controls = [ctrl_rng[np.logical_not(np.isin(control_units, treated_units[test]))] for _,test in splits] 
     # this is non-trivial when there control units are also being predicted:
@@ -258,7 +258,7 @@ def fold_weights(X,
     # constants for indexing
     # X_control = X[control_units,:]
     # X_treat = X[treated_units,:]
-    weights = zeros((C, N))
+    weights = zeros((N0, N1))
 
     A = X.dot(V + V.T).dot(X.T) + 2 * L2_PEN_W * diag(ones(X.shape[0])) # 5
     B = X.dot(V + V.T).dot(X.T).T # 6
diff --git a/RidgeSC/fit_loo.py b/RidgeSC/fit_loo.py
index 4fe37fe..ea197e2 100644
--- a/RidgeSC/fit_loo.py
+++ b/RidgeSC/fit_loo.py
@@ -7,19 +7,19 @@ import warnings
 from RidgeSC.optimizers.cd_line_search import cdl_search
 warnings.filterwarnings('ignore')
 
-def complete_treated_control_list(C_N, treated_units = None, control_units = None):
+def complete_treated_control_list(N, treated_units = None, control_units = None):
     if treated_units is None: 
         if control_units is None: 
             # both not provided, include all samples as both treat and control unit.
-            control_units = list(range(C_N))
+            control_units = list(range(N))
             treated_units = control_units 
         else:
             # Set the treated units to the not-control units
-            treated_units = list(set(range(C_N)) - set(control_units))  
+            treated_units = list(set(range(N)) - set(control_units))  
     else:
         if control_units is None: 
             # Set the control units to the not-treated units
-            control_units = list(set(range(C_N)) - set(treated_units)) 
+            control_units = list(set(range(N)) - set(treated_units)) 
     return(treated_units, control_units)
 
 def loo_v_matrix(X,
@@ -90,11 +90,11 @@ def loo_v_matrix(X,
     assert not non_neg_weights, "Bounds not implemented"
 
     # CONSTANTS
-    C, N, K = len(control_units), len(treated_units), X.shape[1]
+    N0, N1, K = len(control_units), len(treated_units), X.shape[1]
     if start is None:
         start = zeros(K) # formerly: .1 * ones(K) 
-    assert N > 0, "No control units"
-    assert C > 0, "No treated units"
+    assert N1 > 0, "No control units"
+    assert N0 > 0, "No treated units"
     assert K > 0, "variables to fit (X.shape[1] == 0)"
 
     # CREATE THE INDEX THAT INDICATES THE ELIGIBLE CONTROLS FOR EACH TREATED UNIT
@@ -117,10 +117,10 @@ def loo_v_matrix(X,
     # only used by step-down method: X_control = X[control_units,:]
 
     # INITIALIZE PARTIAL DERIVATIVES
-    dA_dV_ki = [ [None,] *N for i in range(K)]
-    dB_dV_ki = [ [None,] *N for i in range(K)]
-    b_i = [None,] *N 
-    for i, k in  itertools.product(range(N), range(K)): # TREATED unit i, moment k
+    dA_dV_ki = [ [None,] *N1 for i in range(K)]
+    dB_dV_ki = [ [None,] *N1 for i in range(K)]
+    b_i = [None,] *N1 
+    for i, k in  itertools.product(range(N1), range(K)): # TREATED unit i, moment k
         Xc = X[in_controls[i], : ]
         Xt = X[treated_units[i], : ]
         dA_dV_ki [k][i] = Xc[:, k ].dot(Xc[:, k ].T) + Xc[:, k ].dot(Xc[:, k ].T) # 8
@@ -148,7 +148,7 @@ def loo_v_matrix(X,
         weights, A, _ = _weights(dv)
         Ey = (Y_treated - weights.T.dot(Y_control)).getA()
         dGamma0_dV_term2 = zeros(K)
-        dPI_dV = zeros((C, N))
+        dPI_dV = zeros((N0, N1))
         # if solve_method == "step-down": Ai_cache = all_subinverses(A)
         for k in range(K):
             if verbose:  # for large sample sizes, linalg.solve is a huge bottle neck,
@@ -171,7 +171,7 @@ def loo_v_matrix(X,
         return LAMBDA - 2 * dGamma0_dV_term2 
 
     def _weights(V):
-        weights = zeros((C, N))
+        weights = zeros((N0, N1))
         if solve_method == "step-down":
             raise NotImplementedError("The solve_method 'step-down' is currently not implemented")
             # A = X_control.dot(V + V.T).dot(X_control.T) + 2 * L2_PEN_W * diag(ones(X_control.shape[0])) # 5
@@ -227,14 +227,14 @@ def loo_weights(X, V, L2_PEN_W, treated_units = None, control_units = None, inte
     treated_units, control_units = complete_treated_control_list(X.shape[0], treated_units, control_units)
     control_units = np.array(control_units)
     treated_units = np.array(treated_units)
-    [C, N] = [len(control_units), len(treated_units)]
+    [N0, N1] = [len(control_units), len(treated_units)]
 
 
     # index with positions of the controls relative to the incoming data
     in_controls = [list(set(control_units) - set([trt_unit])) for trt_unit in treated_units]
     in_controls2 = [np.ix_(i,i) for i in in_controls] # this is a much faster alternative to A[:,index][index,:]
 
-    # index of the controls relative to the rows of the outgoing C x N matrix of weights
+    # index of the controls relative to the rows of the outgoing N0 x N1 matrix of weights
     ctrl_rng = np.arange(len(control_units))
     out_controls = [ctrl_rng[control_units != trt_unit] for trt_unit in treated_units] 
     # this is non-trivial when there control units are also being predicted:
@@ -243,7 +243,7 @@ def loo_weights(X, V, L2_PEN_W, treated_units = None, control_units = None, inte
     # constants for indexing
     # > only used by the step-down method (currently not implemented) X_control = X[control_units,:]
     # > only used by the step-down method (currently not implemented) X_treat = X[treated_units,:]
-    weights = zeros((C, N))
+    weights = zeros((N0, N1))
 
     if solve_method == "step-down":
         raise NotImplementedError("The solve_method 'step-down' is currently not implemented")
diff --git a/RidgeSC/tests.py b/RidgeSC/tests.py
index 05af795..da019b3 100644
--- a/RidgeSC/tests.py
+++ b/RidgeSC/tests.py
@@ -3,14 +3,14 @@ import numpy as np
 import random
 import RidgeSC as SC
 
-def ge_dgp(C,N,T0,T1,K,S,R,groups,group_scale,beta_scale,confounders_scale,model= "full"):
+def ge_dgp(N0,N1,T0,T1,K,S,R,groups,group_scale,beta_scale,confounders_scale,model= "full"):
     """
     From example-code.py
     """
 
     # COVARIATE EFFECTS
-    X_control = np.matrix(np.random.normal(0,1,((C)*groups, K+S+R)))
-    X_treated = np.matrix(np.random.normal(0,1,((N)*groups, K+S+R)))
+    X_control = np.matrix(np.random.normal(0,1,((N0)*groups, K+S+R)))
+    X_treated = np.matrix(np.random.normal(0,1,((N1)*groups, K+S+R)))
 
     # CAUSAL 
     b_cause = np.random.exponential(1,K)
@@ -26,19 +26,19 @@ def ge_dgp(C,N,T0,T1,K,S,R,groups,group_scale,beta_scale,confounders_scale,model
     # GROUP EFFECTS (hidden)
 
     Y_pre_group_effects = np.random.normal(0,group_scale,(groups,T0))
-    Y_pre_ge_control = Y_pre_group_effects[np.repeat(np.arange(groups),C)]
-    Y_pre_ge_treated = Y_pre_group_effects[np.repeat(np.arange(groups),N)]
+    Y_pre_ge_control = Y_pre_group_effects[np.repeat(np.arange(groups),N0)]
+    Y_pre_ge_treated = Y_pre_group_effects[np.repeat(np.arange(groups),N1)]
 
     Y_post_group_effects = np.random.normal(0,group_scale,(groups,T1))
-    Y_post_ge_control = Y_post_group_effects[np.repeat(np.arange(groups),C)]
-    Y_post_ge_treated = Y_post_group_effects[np.repeat(np.arange(groups),N)]
+    Y_post_ge_control = Y_post_group_effects[np.repeat(np.arange(groups),N0)]
+    Y_post_ge_treated = Y_post_group_effects[np.repeat(np.arange(groups),N1)]
 
     # RANDOM ERRORS
-    Y_pre_err_control = np.matrix(np.random.random( ( C*groups, T0, ) )) 
-    Y_pre_err_treated = np.matrix(np.random.random( ( N*groups, T0, ) )) 
+    Y_pre_err_control = np.matrix(np.random.random( ( N0*groups, T0, ) )) 
+    Y_pre_err_treated = np.matrix(np.random.random( ( N1*groups, T0, ) )) 
 
-    Y_post_err_control = np.matrix(np.random.random( ( C*groups, T1, ) )) 
-    Y_post_err_treated = np.matrix(np.random.random( ( N*groups, T1, ) )) 
+    Y_post_err_control = np.matrix(np.random.random( ( N0*groups, T1, ) )) 
+    Y_post_err_treated = np.matrix(np.random.random( ( N1*groups, T1, ) )) 
 
     # THE DATA GENERATING PROCESS
 
@@ -78,11 +78,11 @@ def ge_dgp(C,N,T0,T1,K,S,R,groups,group_scale,beta_scale,confounders_scale,model
     return X_control, X_treated, Y_pre_control, Y_pre_treated, Y_post_control, Y_post_treated
 
 
-def factor_dgp(C,N,T0,T1,K,R,F):
+def factor_dgp(N0,N1,T0,T1,K,R,F):
     
     # COVARIATE EFFECTS
-    X_control = np.matrix(np.random.normal(0,1,((C), K+R)))
-    X_treated = np.matrix(np.random.normal(0,1,((N), K+R)))
+    X_control = np.matrix(np.random.normal(0,1,((N0), K+R)))
+    X_treated = np.matrix(np.random.normal(0,1,((N1), K+R)))
  
     b_cause = np.random.exponential(1,K)
     b_cause *= b_cause.max()
@@ -90,8 +90,8 @@ def factor_dgp(C,N,T0,T1,K,R,F):
     beta = np.matrix(np.concatenate( ( b_cause , np.zeros(R)) ) ).T
 
     # FACTORS
-    Loadings_control = np.matrix(np.random.normal(0,1,((C), F)))
-    Loadings_treated = np.matrix(np.random.normal(0,1,((N), F)))
+    Loadings_control = np.matrix(np.random.normal(0,1,((N0), F)))
+    Loadings_treated = np.matrix(np.random.normal(0,1,((N1), F)))
 
     Factors_pre = np.matrix(np.random.normal(0,1,((F), T0)))
     Factors_post = np.matrix(np.random.normal(0,1,((F), T1)))
@@ -99,10 +99,10 @@ def factor_dgp(C,N,T0,T1,K,R,F):
     
     
     # RANDOM ERRORS
-    Y_pre_err_control = np.matrix(np.random.random( ( C, T0, ) )) 
-    Y_pre_err_treated = np.matrix(np.random.random( ( N, T0, ) )) 
-    Y_post_err_control = np.matrix(np.random.random( ( C, T1, ) )) 
-    Y_post_err_treated = np.matrix(np.random.random( ( N, T1, ) )) 
+    Y_pre_err_control = np.matrix(np.random.random( ( N0, T0, ) )) 
+    Y_pre_err_treated = np.matrix(np.random.random( ( N1, T0, ) )) 
+    Y_post_err_control = np.matrix(np.random.random( ( N0, T1, ) )) 
+    Y_post_err_treated = np.matrix(np.random.random( ( N1, T1, ) )) 
 
     # OUTCOMES
     Y_pre_control = X_control.dot(beta) + Loadings_control.dot(Factors_pre) + Y_pre_err_control
@@ -116,10 +116,10 @@ def factor_dgp(C,N,T0,T1,K,R,F):
 
 class TestDGPs(unittest.TestCase):
     def testFactorDGP(self):
-        N, C = 1,100
+        N1, N0 = 1,100
         T0,T1 = 20, 10
         K, R, F = 5, 5, 5
-        X_control, X_treated, Y_pre_control, Y_pre_treated, Y_post_control, Y_post_treated = factor_dgp(C,N,T0,T1,K,R,F)
+        X_control, X_treated, Y_pre_control, Y_pre_treated, Y_post_control, Y_post_treated = factor_dgp(N0,N1,T0,T1,K,R,F)
         
         Y_post = np.vstack( (Y_post_treated,Y_post_control, ) )
         X = np.vstack( (X_treated, X_control, ) )
diff --git a/example-code.py b/example-code.py
index 9d32778..3c79f3c 100644
--- a/example-code.py
+++ b/example-code.py
@@ -16,7 +16,7 @@ import numpy as np
 import random
 
 
-# def setup(C,N,T,K,g,gs,bs ): # controls (C), treated units (N) , time periods (T), Predictors (K), groups (g), g-scale, b-scale
+# def setup(N0,N1,T,K,g,gs,bs ): # controls (N0), treated units (N1) , time periods (T), Predictors (K), groups (g), g-scale, b-scale
 
 if __name__ == "__main__":
 
@@ -32,7 +32,7 @@ if __name__ == "__main__":
     np.random.seed(10101)
 
     # Controls (per group), Treated (per group), pre-intervention Time points,  post intervention time-periods
-    C,N,T0,T1 = 5,5,4,4
+    N0,N1,T0,T1 = 5,5,4,4
     # Causal Covariates, Confounders , Random Covariates 
     K,S,R = 7,4,5
     # Number of Groups, Scale of the Group Effect, (groups make the time series correlated for reasons other than the observed covariates...)
@@ -41,7 +41,7 @@ if __name__ == "__main__":
     beta_scale,confounders_scale = 4,1
 
     X_control, X_treated, Y_pre_control, Y_pre_treated, \
-        Y_post_control, Y_post_treated = ge_dgp(C,N,T0,T1,K,S,R,groups,group_scale,beta_scale,confounders_scale,model= "full")
+        Y_post_control, Y_post_treated = ge_dgp(N0,N1,T0,T1,K,S,R,groups,group_scale,beta_scale,confounders_scale,model= "full")
 
     # JOIN THE TREAT AND CONTROL DATA
     X = np.vstack( (X_control, X_treated,) )
@@ -53,8 +53,8 @@ if __name__ == "__main__":
     X_and_Y_pre_control = np.hstack( ( X_control, Y_pre_control,) )
 
     # IDENTIFIERS FOR TREAT AND CONTROL UNITS
-    # control_units = np.arange( C * groups )
-    # treated_units = np.arange( N * groups ) + C
+    # control_units = np.arange( N0 * groups )
+    # treated_units = np.arange( N1 * groups ) + N0
 
     # ------------------------------------------------------------
     # ------------------------------------------------------------