diff --git a/structured_data_profiling/profiler/profiler.py b/structured_data_profiling/profiler/profiler.py index 587ab1c..f4dd3f8 100644 --- a/structured_data_profiling/profiler/profiler.py +++ b/structured_data_profiling/profiler/profiler.py @@ -119,7 +119,7 @@ def __init__( if n_samples is None: n_samples = int(0.1 * df.shape[0]) - samples = np.random.choice(df.shape[0], min(n_samples, df.shape[0])) + samples = np.random.choice(df.shape[0], min(n_samples, df.shape[0]), replace=False) self.n_samples = n_samples self.samples = samples