mind-inria
diff --git a/‎examples/plot_2D_simulation_example.py‎
Lines changed: 4 additions & 4 deletions b/‎examples/plot_2D_simulation_example.py‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎examples/plot_dcrt_example.py‎
Lines changed: 16 additions & 8 deletions b/‎examples/plot_dcrt_example.py‎
Lines changed: 16 additions & 8 deletions
diff --git a/‎examples/plot_importance_classification_iris.py‎
Lines changed: 1 addition & 1 deletion b/‎examples/plot_importance_classification_iris.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎examples/plot_knockoff_aggregation.py‎
Lines changed: 29 additions & 7 deletions b/‎examples/plot_knockoff_aggregation.py‎
Lines changed: 29 additions & 7 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 6 additions & 0 deletions b/‎pyproject.toml‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎src/hidimstat/_utils/exception.py‎
Lines changed: 12 additions & 0 deletions b/‎src/hidimstat/_utils/exception.py‎
Lines changed: 12 additions & 0 deletions
@@ -69,7 +69,7 @@
     ensemble_clustered_inference_pvalue,
 )
 from hidimstat.statistical_tools.p_values import zscore_from_pval
-from hidimstat._utils.scenario import multivariate_simulation
+from hidimstat._utils.scenario import multivariate_simulation_spatial
 
 #############################################################################
 # Specific plotting functions
@@ -167,12 +167,12 @@ def plot(maps, titles):
 shape = (40, 40)
 n_features = shape[1] * shape[0]
 roi_size = 4  # size of the edge of the four predictive regions
-sigma = 2.0  # noise standard deviation
+signal_noise_ratio = 10.0  # signal-to-noise ratio of the simulated data
 smooth_X = 1.0  # level of spatial smoothing introduced by the Gaussian filter
 
 # generating the data
-X_init, y, beta, epsilon, _, _ = multivariate_simulation(
-    n_samples, shape, roi_size, sigma, smooth_X, seed=1
+X_init, y, beta, epsilon = multivariate_simulation_spatial(
+    n_samples, shape, roi_size, signal_noise_ratio, smooth_X, seed=1
 )
 
 ##############################################################################
 
@@ -20,7 +20,7 @@
 from sklearn.linear_model import LassoCV
 
 from hidimstat import D0CRT
-from hidimstat._utils.scenario import multivariate_1D_simulation
+from hidimstat._utils.scenario import multivariate_simulation
 
 #############################################################################
 # Processing the computations
@@ -38,14 +38,20 @@
     # Number of relevant variables
     n_signal = 2
     # Signal-to-noise ratio
-    snr = 4
+    signal_noise_ratio = 4
     # Correlation coefficient
     rho = 0.8
     # Nominal false positive rate
     alpha = 5e-2
 
-    X, y, _, __ = multivariate_1D_simulation(
-        n_samples=n, n_features=p, support_size=n_signal, rho=rho, seed=sim_ind
+    X, y, beta_true, noise = multivariate_simulation(
+        n_samples=n,
+        n_features=p,
+        support_size=n_signal,
+        rho=rho,
+        signal_noise_ratio=signal_noise_ratio,
+        shuffle=True,
+        seed=sim_ind,
     )
 
     # Applying a reLu function on the outcome y to get non-linear relationships
@@ -58,8 +64,9 @@
     results_list.append(
         {
             "model": "Lasso",
-            "type-1 error": sum(pvals_lasso[n_signal:] < alpha) / (p - n_signal),
-            "power": sum(pvals_lasso[:n_signal] < alpha) / (n_signal),
+            "type-1 error": sum(pvals_lasso[np.logical_not(beta_true)] < alpha)
+            / (p - n_signal),
+            "power": sum(pvals_lasso[beta_true] < alpha) / (n_signal),
         }
     )
 
@@ -73,8 +80,9 @@
     results_list.append(
         {
             "model": "RF",
-            "type-1 error": sum(pvals_forest[n_signal:] < alpha) / (p - n_signal),
-            "power": sum(pvals_forest[:n_signal] < alpha) / (n_signal),
+            "type-1 error": sum(pvals_forest[np.logical_not(beta_true)] < alpha)
+            / (p - n_signal),  # normalise by the number of null features
+            "power": sum(pvals_forest[beta_true] < alpha) / (n_signal),
         }
     )
 
 
@@ -116,7 +116,7 @@ def run_one_fold(X, y, model, train_index, test_index, vim_name="CFI", groups=No
     GridSearchCV(SVC(kernel="rbf"), {"C": np.logspace(-3, 3, 10)}),
 ]
 cv = KFold(n_splits=5, shuffle=True, random_state=0)
-groups = {ft: i for i, ft in enumerate(dataset.feature_names)}
+groups = {ft: [i] for i, ft in enumerate(dataset.feature_names)}
 out_list = Parallel(n_jobs=5)(
     delayed(run_one_fold)(
         X, y, model, train_index, test_index, vim_name=vim_name, groups=groups
 
@@ -31,7 +31,7 @@
     model_x_knockoff_pvalue,
 )
 from hidimstat.statistical_tools.multiple_testing import fdp_power
-from hidimstat._utils.scenario import multivariate_1D_simulation_AR
+from hidimstat._utils.scenario import multivariate_simulation
 
 
 #############################################################################
@@ -49,14 +49,14 @@
 # Number of variables
 n_features = 150
 # Correlation parameter
-rho = 0.4
+rho = 0.5
 # Ratio of number of variables with non-zero coefficients over total
 # coefficients
 sparsity = 0.2
 # Desired controlled False Discovery Rate (FDR) level
 fdr = 0.1
 # signal-to-noise ratio
-snr = 10
+signal_noise_ratio = 10
 # number of repetitions for the bootstraps
 n_bootstraps = 25
 # seed for the random generator
@@ -73,11 +73,26 @@
 #######################################################################
 # Define the function for running the three procedures on the same data
 # ---------------------------------------------------------------------
-def single_run(n_samples, n_features, rho, sparsity, snr, fdr, n_bootstraps, seed=None):
+def single_run(
+    n_samples,
+    n_features,
+    rho,
+    sparsity,
+    signal_noise_ratio,
+    fdr,
+    n_bootstraps,
+    seed=None,
+):
     # Generate data
-    X, y, _, non_zero_index = multivariate_1D_simulation_AR(
-        n_samples, n_features, rho=rho, sparsity=sparsity, seed=seed, snr=snr
+    X, y, beta_true, noise = multivariate_simulation(
+        n_samples,
+        n_features,
+        rho=rho,
+        support_size=int(n_features * sparsity),
+        signal_noise_ratio=signal_noise_ratio,
+        seed=seed,
     )
+    non_zero_index = np.where(beta_true)[0]
 
     # Use model-X Knockoffs [1]
     selected, test_scores, threshold, X_tildes = model_x_knockoff(
@@ -165,7 +180,14 @@ def effect_number_samples(n_samples):
     parallel = Parallel(n_jobs, verbose=joblib_verbose)
     results = parallel(
         delayed(single_run)(
-            n_samples, n_features, rho, sparsity, snr, fdr, n_bootstraps, seed=seed
+            n_samples,
+            n_features,
+            rho,
+            sparsity,
+            signal_noise_ratio,
+            fdr,
+            n_bootstraps,
+            seed=seed,
         )
         for seed in seed_list
     )
 
@@ -110,3 +110,9 @@ markers = ["slow: marks tests as slow (deselect with '-m \"not slow\"')"]
 # pytest-timeout
 timeout = 60           # one individual test should not take more than 60s
 session_timeout = 1200 # all the tests should be run in 20 min
+
+[tool.pytest_env]
+OPENBLAS_NUM_THREADS = 1
+BLIS_NUM_THREADS = 1
+MKL_NUM_THREADS = 1
+OMP_NUM_THREADS = 1
@@ -0,0 +1,12 @@
+class InternalError(Exception):
+    """Error signalling an internal failure of the library.
+
+    Parameters
+    ----------
+    message: str
+        Message of explanation of the error
+    """
+
+    def __init__(self, message):
+        super().__init__(message)
+        self.message = message
Original file line number	Diff line number	Diff line change
`@@ -116,7 +116,7 @@ def run_one_fold(X, y, model, train_index, test_index, vim_name="CFI", groups=No`
`116`	`116`	`GridSearchCV(SVC(kernel="rbf"), {"C": np.logspace(-3, 3, 10)}),`
`117`	`117`	`]`
`118`	`118`	`cv = KFold(n_splits=5, shuffle=True, random_state=0)`
`119`		`-groups = {ft: i for i, ft in enumerate(dataset.feature_names)}`
	`119`	`+groups = {ft: [i] for i, ft in enumerate(dataset.feature_names)}`
`120`	`120`	`out_list = Parallel(n_jobs=5)(`
`121`	`121`	`delayed(run_one_fold)(`
`122`	`122`	`X, y, model, train_index, test_index, vim_name=vim_name, groups=groups`