From 452412cba3d8401a82a7b718e57bfc6c3b0e6efc Mon Sep 17 00:00:00 2001
From: Vivian Miranda
Date: Thu, 2 Apr 2026 15:50:43 -0400
Subject: [PATCH] merge from main - fix bugs on dataset_generator

---
 emultraining/dataset_generator_baosn.py      | 1370 +++++++++++++++---
 emultraining/dataset_generator_baosn_copy.py |  268 ++++
 emultraining/dataset_generator_cmb.py        |  189 +--
 emultraining/dataset_generator_lensing.py    |  181 +--
 4 files changed, 1608 insertions(+), 400 deletions(-)
 create mode 100644 emultraining/dataset_generator_baosn_copy.py

diff --git a/emultraining/dataset_generator_baosn.py b/emultraining/dataset_generator_baosn.py
index ba0fdb4..8f19801 100644
--- a/emultraining/dataset_generator_baosn.py
+++ b/emultraining/dataset_generator_baosn.py
@@ -1,268 +1,1170 @@
 import numpy as np
-import cobaya
-from cobaya.yaml import yaml_load
+import emcee, argparse, os, sys, yaml, time, traceback
+import psutil, gc, math, copy, tempfile
 from cobaya.model import get_model
-import sys
-import os
-import platform
-import yaml
 from mpi4py import MPI
-from scipy.stats import qmc
-import copy
-import functools, iminuit, copy, argparse, random, time
-import emcee, itertools
+from pathlib import Path
+from getdist import loadMCSamples
+from collections import deque
+from contextlib import contextmanager
+from numpy.lib.format import open_memmap
+import contextlib, io
 from cobaya.likelihood import Likelihood
-from schwimmbad import MPIPool
+#-------------------------------------------------------------------------------
+#-------------------------------------------------------------------------------
+# Example of how to run this program
+#-------------------------------------------------------------------------------
+#-------------------------------------------------------------------------------
+# The script below computes data vectors for BAO/SN emulators.
+#
+# mpirun -n 10 --oversubscribe \
+#     python external_modules/code/emulators/emultrf/emultraining/dataset_generator_baosn.py \
+#     --root projects/example/ \
+#     --fileroot emulators/ \
+#     --nparams 10000 \
+#     --yaml 'w0wa_lowacc_mlp.yaml' \
+#     --datavsfile 'w0wa_lowacc_dvs_train' \
+#     --paramfile 'w0wa_lowacc_params_train' \
+#     --failfile 'w0wa_lowacc_params_failed_train' \
+#     --chain 0 \
+#     --unif 0 \
+#     --temp 64 \
+#     --maxcorr 0.15 \
+#     --freqchk 2000 \
+#     --loadchk 0 \
+#     --append 0 \
+#     --boundary 1.0 \
+#     --zhd 3.0 \
+#     --nzhd 600 \
+#     --zmax 1200.0 \
+#     --nzmax 200
+#
+#- The requested number of data vectors is given by the `--nparams` flag.
+#
+#- There are two possible sampling modes.
+#  - The option `--unif 1` sets the sampling to follow a uniform distribution (respecting parameter boundaries set in the YAML file)
+#  - The option `--unif 0` sets the sampling to follow a Gaussian distribution with the following options
+#    - The covariance matrix is set in the YAML file (keyword `params_covmat_file` inside the `train_args` block).
+#      For example, our provided YAML selects the Fisher-based *w0wa_fisher_covmat.txt* covariance matrix
+#    - Temperature reduces the curvature of the likelihood (effectively `cov -> T*cov`) and is set by the `--temp` flag
+#    - The correlations of the original covariance matrix are reduced to be less than `--maxcorr`.
+#
+#  Even with uniform sampling, the temperature parameter is needed to set hard boundaries on parameters with Gaussian priors.
+#
+#- For visualization purposes, setting `--chain 1` makes the script generate the training parameters without computing the data vectors.
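+#
+#- Note on `--temp` (an illustrative sketch, not part of the pipeline): dividing the
+#  Gaussian log-density by T, as done in `__param_logpost` below, is equivalent to
+#  sampling from a covariance rescaled by T. The numbers here are hypothetical:
+#
+#      import numpy as np
+#      cov = np.array([[0.04, 0.01], [0.01, 0.09]])   # hypothetical 2x2 covmat
+#      T = 64.0
+#      y = np.array([0.1, -0.2])                      # offset from the fiducial point
+#      lhs = -0.5 * (y @ np.linalg.inv(cov) @ y) / T  # tempered log-density
+#      rhs = -0.5 * (y @ np.linalg.inv(T * cov) @ y)  # untempered, with cov -> T*cov
+#      assert np.isclose(lhs, rhs)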
+#
+#- The output files are
+#
+#      # Distribution of training points ready to be plotted by GetDist
+#      w0wa_lowacc_params_train_baosn_64.1.txt
+#      w0wa_lowacc_params_train_baosn_64.covmat
+#      w0wa_lowacc_params_train_baosn_64.paramnames
+#      w0wa_lowacc_params_train_baosn_64.ranges
+#
+#      # Corresponding data vectors
+#      w0wa_lowacc_dvs_train_baosn_64.npy
+#      # Training parameters for which the data vector computation failed (or was not computed)
+#      w0wa_lowacc_params_failed_train_baosn_64.txt
+#
+#- The flags `--freqchk`, `--loadchk`, and `--append` are related to checkpoints.
+#  - The option `--freqchk` sets the frequency at which the code saves checkpoints (chk).
+#  - The options `--loadchk` and `--append` specify whether the code loads the parameters and data vectors from a chk.
+#    In the two cases below, the code determines which remaining data vectors to compute based on the flags saved in the `--failfile` file.
+#    - Case 1 (`--loadchk 1` and `--append 1`): the code loads params from the chk and appends `~nparams` models to it.
+#    - Case 2 (`--loadchk 1` and `--append 0`): the code loads the params from the chk and computes only the data vectors still flagged as failed.
+#
+#- The flags `--zhd`, `--nzhd`, `--zmax`, and `--nzmax` set the size of the data vector
+#-------------------------------------------------------------------------------
+#-------------------------------------------------------------------------------
+# Command line args
+#-------------------------------------------------------------------------------
+#-------------------------------------------------------------------------------
+parser = argparse.ArgumentParser(prog='dataset_generator_baosn')
 
-parser = argparse.ArgumentParser(prog='cos_uniform')
+parser.add_argument("--yaml",
+                    dest="yaml",
+                    help="The training YAML containing the train_args block",
+                    type=str,
+                    required=True)
+parser.add_argument("--root",
+                    dest="root",
+                    help="Project folder",
+                    type=str,
+                    required=True)
+parser.add_argument("--fileroot",
+                    dest="fileroot",
+                    help="Subfolder of the project folder containing the YAML and Fisher files",
+                    type=str,
+                    required=True)
+parser.add_argument("--datavsfile",
+                    dest="datavsfile",
+                    help="File to save data vectors",
+                    type=str,
+                    required=True)
+parser.add_argument("--paramfile",
+                    dest="paramfile",
+                    help="File to save parameters",
+                    type=str,
+                    required=True)
+parser.add_argument("--failfile",
+                    dest="failfile",
+                    help="File that flags which cosmo params failed to compute dvs",
+                    type=str,
+                    required=True)
+parser.add_argument("--chain",
+                    dest="chain",
+                    help="Only compute and output the train/test/val chain",
+                    type=int,
+                    choices=[0,1],
+                    default=0)
+parser.add_argument("--nparams",
+                    dest="nparams",
+                    help="Requested number of parameters",
+                    type=int,
+                    required=True)
+parser.add_argument("--unif",
+                    dest="unif",
+                    help="Choose between uniform and Fisher-based sampling",
+                    type=int,
+                    choices=[0,1],
+                    required=True)
+parser.add_argument("--temp",
+                    dest="temp",
+                    help="Temperature T applied to the sampling distribution (cov -> T*cov)",
+                    type=int)
+parser.add_argument("--maxcorr",
+                    dest="maxcorr",
+                    help="Max correlation allowed",
+                    type=float)
+parser.add_argument("--loadchk",
+                    dest="loadchk",
+                    help="Load from chk if it exists",
+                    type=int,
+                    choices=[0,1])
+parser.add_argument("--freqchk",
+                    dest="freqchk",
+                    help="Frequency at which checkpoints are saved",
+                    type=int)
+parser.add_argument("--append",
+                    dest="append",
+                    help="Append more models (only valid if loadchk == 1)",
+                    type=int,
+                    choices=[0,1])
+parser.add_argument("--boundary",
+                    dest="boundary",
+                    help="Boundary setup: test/val requires boundaries to be cut",
+                    type=float)
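+#-------------------------------------------------------------------------------
+# Note on --maxcorr (an illustrative sketch, not part of the pipeline): the cap
+# rescales the correlation matrix while keeping the marginal variances fixed.
+# The 2x2 covariance below is hypothetical:
+#
+#     import numpy as np
+#     maxcorr = 0.15
+#     covmat = np.array([[1.0, 0.8], [0.8, 4.0]])
+#     sig = np.sqrt(np.diag(covmat))
+#     corr = covmat / np.outer(sig, sig)      # correlation matrix (off-diag = 0.4)
+#     m = np.abs(corr - np.eye(2)).max()      # largest off-diagonal correlation
+#     if m > maxcorr:
+#         corr /= m / maxcorr                 # shrink all correlations uniformly
+#         np.fill_diagonal(corr, 1.0)
+#         covmat = corr * np.outer(sig, sig)  # diagonal unchanged; off-diag capped
+#-------------------------------------------------------------------------------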
+parser.add_argument("--zhd", + dest="zhd", + help="Emulator will emulator from z = 0 to z = zhd with n = nzhd points", + type=float) +parser.add_argument("--nzhd", + dest="nzhd", + help="Emulator will emulator from z = 0 to z = zhd with n = nzhd points", + type=int) +parser.add_argument("--zmax", + dest="zmax", + help="Emulator will emulator from z = zhd to z = zmax with n = nzmax points", + type=float) +parser.add_argument("--nzmax", + dest="nzmax", + help="Emulator will emulator from z = zhd to z = zmax with n = nzmax points", + type=int) +args, unknown = parser.parse_known_args() +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +# Free Functions +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +@contextmanager +def capture_native_output(): + """ + Redirect OS-level file descriptors to capture Fortran/C output. + Unlike contextlib.redirect_stderr, this catches writes from any language + (Fortran, C, etc.) that go directly to fd 1 (stdout) or fd 2 (stderr). + Author: From Claude AI. + """ + stdout_fd = sys.stdout.fileno() # fd 1 — where stdout currently points + stderr_fd = sys.stderr.fileno() # fd 2 — where stderr currently points + stdout_dup = os.dup(stdout_fd) # bookmark original stdout destination + stderr_dup = os.dup(stderr_fd) # bookmark original stderr destination + tmp = tempfile.TemporaryFile(mode='w+') + try: + os.dup2(tmp.fileno(), stdout_fd) # fd 1 now writes to tmp (not terminal) + os.dup2(tmp.fileno(), stderr_fd) # fd 2 now writes to tmp (not terminal) + yield tmp + finally: # this block is always executed regardless of exception generation + os.dup2(stdout_dup, stdout_fd) # restore fd 1 → terminal + os.dup2(stderr_dup, stderr_fd) # restore fd 2 → terminal + os.close(stdout_dup) # release the bookmarks + os.close(stderr_dup) + tmp.close() +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +# Class Definition +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +class baosn_aux_likelihood(Likelihood): + zhd: float = 3.0 + nzhd: int = 600 + zmax: float = 1200.0 + nzmax: int = 200 + def initialize(self): + if args.zhd is not None: self.zhd = abs(args.zhd) + if args.nzhd is not None: self.nzhd = int(abs(args.nzhd)) + if args.zmax is not None: self.zmax = abs(args.zmax) + if args.nzmax is not None: self.nzmax = int(abs(args.nzmax)) + self.nztotal = self.nzhd + self.nzmax -class SimpleBAODVLikelihood(Likelihood): - # Example data can also be passed via YAML or hardcoded here - def initialize(self): - # Define data inside the class (or pass from outside if needed) - z1=np.linspace(0,3,600, endpoint=False) - z2=np.linspace(3,1200,200) - self.z_data = np.concatenate((z1,z2),axis=0) # example redshifts + self.z1 = np.linspace(0.0, self.zhd, self.nzhd, endpoint = False) + self.z2 = np.linspace(self.zhd, self.zmax, self.nzmax, endpoint = True) + if (len(self.z1) + len(self.z2)) != self.nztotal: + raise ValueError("len(z1) + len(z2) != self.nztotal (internal logic error)") + self.data = np.concatenate((self.z1, self.z2), axis = 0) + + def get_requirements(self): + return { + "angular_diameter_distance": {"z": self.data}, + "Hubble": {"z": 
self.data}
+        }
+
+    def logp(self, **params_values):
+        return -0.5
+#-------------------------------------------------------------------------------
+#-------------------------------------------------------------------------------
+# Class Definition
+#-------------------------------------------------------------------------------
+#-------------------------------------------------------------------------------
+class dataset:
+    #-----------------------------------------------------------------------------
+    # init
+    #-----------------------------------------------------------------------------
+    def __init__(self):
+        self.setup = False
+        self.__setup_flags()
 
-    def get_requirements(self):
-        # Tell Cobaya which theory quantities you need at these redshifts
-        return {
-            "angular_diameter_distance": {"z": self.z_data},
-            "Hubble": {"z": self.z_data}
-
-        }
+        comm = MPI.COMM_WORLD
+        rank = comm.Get_rank()
+        if rank == 0:
+            self.__run_mcmc()
+        if not args.chain == 1:
+            self.__generate_datavectors()
 
-    def logp(self, **params_values):
-        # Get required theory quantities
-        return -0.5
+    def __setup_flags(self):
+        #---------------------------------------------------------------------------
+        # Basic definitions
+        #---------------------------------------------------------------------------
+        root_env = os.environ.get("ROOTDIR")
+        if not root_env:
+            raise RuntimeError("ROOTDIR environment variable is not set")
+        root = root_env.rstrip("/")
+        root = f"{root}/{args.root.rstrip('/')}"
+        fileroot = f"{root}/{args.fileroot.rstrip('/')}"
+        Path(f"{root}/chains").mkdir(parents=True, exist_ok=True)
+
+        self.append = 0 if args.append is None else args.append
+        self.bounds = None
+        self.bounds_adj = (
+            args.boundary if args.boundary is not None and 0 < args.boundary < 1 else 1
+        )
+        self.covmat = None
+        self.dtype = np.float32
+        self.dvsf = None
+        self.derived = None
+        self.dvs_is_memmap = False
+        self.freqchk = 5000 if args.freqchk is None else args.freqchk
+        if self.freqchk < 1000:
+            raise ValueError("--freqchk must be >= 1000")  # avoid checkpointing too often
+        self.failed = None  # track which models failed to compute dv
+        self.failf = None
+        self.fiducial = None
+        self.inv_covmat = None
+        self.loadchk = 0 if args.loadchk is None else args.loadchk
+        self.loadedfromchk = False  # check if loaded from checkpoint successfully
+        self.loadedsamples = False  # check if samples loaded successfully
+        self.maxcorr = 0.15 if args.maxcorr is None else args.maxcorr
+        if not (0.01 < self.maxcorr <= 1):
+            raise ValueError("--maxcorr must be in (0.01, 1]")
+        self.names = None
+        self.model = None
+        self.nparams = 10000 if args.nparams is None else args.nparams
+        if self.nparams < 200:
+            raise ValueError("--nparams must be >= 200")
+        self.paramsf = None
+        self.probe = None
+        self.sampled_params = None
+        self.samples = None
+        self.temp = 128 if args.temp is None else args.temp
+        if self.temp < 1:
+            raise ValueError("--temp must be >= 1")
+        self.unif = 0 if args.unif is None else args.unif
+        self.yaml = f"{fileroot}/test.yaml" if args.yaml is None else f"{fileroot}/{args.yaml}"
+        if not os.path.isfile(f"{self.yaml}"):
+            raise FileNotFoundError(f"YAML file not found: {self.yaml}")
+        #---------------------------------------------------------------------------
+        # Load yaml
+        #---------------------------------------------------------------------------
+        with open(self.yaml, 'r') as stream:
+            info = yaml.safe_load(stream)
+
+        if info is None:
+            raise ValueError(f"YAML file is empty or invalid: {self.yaml}")
+
+        if not isinstance(info, dict):
+            
raise ValueError(f"Cobaya YAML did not parse to a dict: {self.yaml}") + + missing = [k for k in ['params', 'likelihood', 'train_args'] if k not in info] + if missing: + raise KeyError(f"Cobaya YAML missing required blocks {missing}: {self.yaml}") -parser.add_argument("--N", - dest="N", - help="Number of points requested", - type=int, - nargs='?', - const=1, - default=100) + train_args = info["train_args"] + required_keys = ['probe', 'ord'] + if not self.unif == 1: + required_keys += ['fiducial', 'params_covmat_file'] -parser.add_argument("--mode", - dest="mode", - help="mode of points generated", - type=str, - nargs='?', - const=1, - default='train') -parser.add_argument("--data_path", - dest="data_path", - help="Directory for saving the data files", - type=str, - nargs='?', - const=1, - default='/data/') -parser.add_argument("--datavectors_file", - dest="datavectors_file", - help="Name for data vector files (no .npy included)", - type=str, - nargs='?', - const=1, - default='cos_uni') -parser.add_argument("--parameters_file", - dest="parameters_file", - help="Name for Parameter files (.npy included)", - type=str, - nargs='?', - const=1, - default='cos_uni_input.npy') -args, unknown = parser.parse_known_args() + missing = [k for k in required_keys if k not in train_args] + if missing: + raise KeyError(f"Cobaya YAML missing required keys {missing}: {self.yaml}") + + #--------------------------------------------------------------------------- + # Load Cobaya model (needed for computing likelihood), cov matrix... + #--------------------------------------------------------------------------- + if "baosn_aux_likelihood" not in sys.modules: + sys.modules["baosn_aux_likelihood"] = sys.modules[__name__] + + try: + self.model = get_model(info) + except Exception as e: + raise RuntimeError(f"get_model failed for {self.yaml}: {e}") from e + + self.zarray = self.model.likelihood['dummy'].data.copy() + self.zhd = self.model.likelihood['dummy'].zhd + self.nzhd = self.model.likelihood['dummy'].nzhd + self.zmax = self.model.likelihood['dummy'].zmax + self.nzmax = self.model.likelihood['dummy'].nzmax + self.nztotal = self.nzhd + self.nzmax + if len(self.zarray) != self.nztotal: + raise ValueError("len(self.zarray) != self.nztotal (internal logic error)") + + self.probe = "baosn" -####add yaml here, and make all input paratemers passing in -yaml_string=r""" + self.sampled_params = train_args['ord'] # preferred ordering of params -likelihood: - dummy: - class: SimpleBAODVLikelihood + self.derived = train_args['derived'] if 'derived' in train_args else [] -params: + if not self.unif == 1: + fid = train_args["fiducial"] # load fiducial data vector + + # load cov param matrix -------------------------------------------------- + raw_covmat_file = train_args["params_covmat_file"] + with open(f"{fileroot}/{raw_covmat_file}") as f: + raw_covmat_params_names = np.array(f.readline().split()[1:]) + raw_covmat = np.loadtxt(f) + + #------------------------------------------------------------------------- + # Reorder fiducial, bounds and covmat to follow ['train_args']['ord'] + #------------------------------------------------------------------------- + # Reorder fiducial ------------------------------------------------------- + self.fiducial = np.array([fid[p] for p in self.sampled_params], + copy=True, dtype=self.dtype) + + # Reorder covmat --------------------------------------------------------- + pidx = {p : i for i, p in enumerate(raw_covmat_params_names)} + try: + idx = np.array([pidx[p] for p in 
self.sampled_params], + copy=True, + dtype=int) + except KeyError as e: + raise ValueError(f"{e.args[0]!r} not found in cov header") from None + covmat = raw_covmat[np.ix_(idx, idx)] + + # Reorder bounds ----------------------------------------------------------- + self.names = list(self.model.parameterization.sampled_params().keys()) + idx = self.reorder_idx_from_yaml_to_ord() + + # Here T (temp) stretch the hard bounds on parameters with Gaussian prior -- + tmp = np.array(self.model.prior.bounds(confidence=1.0), + copy=True, + dtype=self.dtype)[idx,:] + self.bounds = np.array(self.model.prior.bounds(confidence=0.9999994), + copy=True, + dtype=self.dtype)[idx,:] + for i in range(len(tmp)): + if math.isinf(tmp[i,0]) or math.isinf(tmp[i,1]): + width = (self.bounds[i, 1] - self.bounds[i, 0]) + if math.isinf(tmp[i,0]): + self.bounds[i,0] -= self.temp*width/5.0 + if math.isinf(tmp[i,1]): + self.bounds[i,1] += self.temp*width/5.0 + + # near the bds: emulator accuracy degrades: (val/test) must reduce bds ----- + if self.bounds_adj < 1: + margin = (1-self.bounds_adj) * 0.5*(self.bounds[:, 1]-self.bounds[:, 0]) + self.bounds[:, 0] += margin + self.bounds[:, 1] -= margin + + # adjust covmat- ----------------------------------------------------------- + if not self.unif == 1: + #------------------------------------------------------------------------- + # Reduce correlation on the covariance matrix to max = args.maxcorr + #------------------------------------------------------------------------- + sig = np.sqrt(np.diag(covmat)) + n = len(sig) + outer = np.outer(sig, sig) + corr = covmat / outer + m = np.abs(corr - np.eye(n)).max() + if m > self.maxcorr: + corr /= max(1.0, m / self.maxcorr) if m > 0 else 1.0 + np.fill_diagonal(corr, 1.0) + covmat = corr * outer + + #------------------------------------------------------------------------- + # Compute covmat inverse + #------------------------------------------------------------------------- + C = 0.5 * (covmat + covmat.T) # enforce symmetry + jitt = 0.0 + for _ in range(10): + try: + L = np.linalg.cholesky(C + jitt*np.eye(C.shape[0])) + break + except np.linalg.LinAlgError: + scale = np.mean(np.diag(C)) # scale jitt to matrix sz start tiny -> grow + jitt = (1e-12 * scale if jitt == 0 else jitt*10) + else: + raise np.linalg.LinAlgError("could not stabilized cov to SPD w/ jitter") + I = np.eye(C.shape[0]) + self.covmat = C + jitt*np.eye(C.shape[0]) + self.inv_covmat = np.linalg.solve(L.T, np.linalg.solve(L, I)) + + #--------------------------------------------------------------------------- + # Define output files + #--------------------------------------------------------------------------- + datavsfile = Path(args.datavsfile).stem + paramfile = Path(args.paramfile).stem + failfile = Path(args.failfile).stem + if not self.unif == 1: + self.dvsf = f"{root}/chains/{datavsfile}_{self.probe}_{self.temp}" + self.paramsf = f"{root}/chains/{paramfile}_{self.probe}_{self.temp}" + self.failf = f"{root}/chains/{failfile}_{self.probe}_{self.temp}" + else: + self.dvsf = f"{root}/chains/{datavsfile}_{self.probe}_unifs" + self.paramsf = f"{root}/chains/{paramfile}_{self.probe}_unifs" + self.failf = f"{root}/chains/{failfile}_{self.probe}_unifs" + + #--------------------------------------------------------------------------- + # Setup Done + #--------------------------------------------------------------------------- + self.setup = True + + #----------------------------------------------------------------------------- + # reorder indexes to match YAML original 
ordering
+    #-----------------------------------------------------------------------------
+    def reorder_idx_from_yaml_to_ord(self):
+        pidx = {p : i for i, p in enumerate(self.names)}
+        return np.array([pidx[p] for p in self.sampled_params],
+                        copy=True,
+                        dtype=int)
+
+    def reorder_idx_from_ord_to_yaml(self):
+        pidx = {p : i for i, p in enumerate(self.sampled_params)}
+        return np.array([pidx[p] for p in self.names],
+                        copy=True,
+                        dtype=int)
+
+    #-----------------------------------------------------------------------------
+    # save/load checkpoint
+    #-----------------------------------------------------------------------------
+    def __load_chk(self):
+        rtnvar = False
+        if self.loadchk == 1:
+            loadchk = all([os.path.isfile(x) for x in [f"{self.dvsf}.npy",
+                                                       f"{self.failf}.txt",
+                                                       f"{self.paramsf}.covmat",
+                                                       f"{self.paramsf}.ranges",
+                                                       f"{self.paramsf}.1.txt"]])
+            if loadchk:
+                # load sample file begins ----------------------------------------------
+                # columns 0/1 are weights, lnp; the last column is chi2
+                self.samples = np.atleast_2d(np.loadtxt(f"{self.paramsf}.1.txt",
+                                                        dtype=self.dtype))[:,2:-1]
+                if self.samples.ndim != 2:
+                    raise ValueError(f"samples must be 2D, got {self.samples.shape}")
+                # load sample file ends ------------------------------------------------
+
+                # load fail file begins ------------------------------------------------
+                self.failed = np.atleast_1d(np.loadtxt(f"{self.failf}.txt",
+                                                       dtype=np.uint8))
+                self.failed = np.asarray(self.failed).astype(bool)
+                if self.failed.ndim != 1:
+                    raise ValueError(f"failed must be 1D, got {self.failed.shape}")
+
+                if self.samples.shape[0] != self.failed.shape[0]:
+                    raise ValueError("Incompatible samples/failed chk files")
+                # load fail file ends --------------------------------------------------
+
+                # load datavectors begins ----------------------------------------------
+                arr = np.load(f"{self.dvsf}.npy",
+                              mmap_mode = "r",
+                              allow_pickle = False)
+                RAMneed = (arr.nbytes +
+                           self.samples.nbytes +
+                           self.failed.nbytes)
+                RAMavail = psutil.virtual_memory().available
+                if RAMneed < 0.75 * RAMavail:
+                    self.datavectors = np.load(f"{self.dvsf}.npy", allow_pickle = False)
+                    self.dvs_is_memmap = False
+                else:
+                    print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. "
+                          f"There is {RAMavail/1e9:.2f} GB of RAM available. 
" + f"We will read dvs from HD (slow)") + self.datavectors = np.load(f"{self.dvsf}.npy", + mmap_mode = "r+", + allow_pickle = False) + self.dvs_is_memmap = True + del arr + # load datavectors ends ------------------------------------------------ + + if self.datavectors.ndim != 3: + raise ValueError(f"datavectors must be 3D, got {self.datavectors.shape}") + if self.datavectors.shape[0] != self.samples.shape[0]: + raise ValueError(f"Incompatible samples/datavector chk files") + print("Loaded models from chk") + if self.append == 0: + self.loadedsamples = True + self.loadedfromchk = True + rtnvar = True + return rtnvar - omegabh2: - prior: - min: 0.0 - max: 0.04 - ref: - dist: norm - loc: 0.022383 - scale: 0.005 - proposal: 0.005 - latex: \Omega_\mathrm{b} h^2 - omegach2: - prior: - min: 0.0 - max: 0.5 - ref: - dist: norm - loc: 0.12011 - scale: 0.03 - proposal: 0.03 - latex: \Omega_\mathrm{c} h^2 - H0: - prior: - min: 20 - max: 120 - ref: - dist: norm - loc: 67 - scale: 2 - proposal: 0.001 - latex: H_0 - tau: - value: 0.06 - latex: \tau_\mathrm{reio} - - logA: - value: 3.04 - latex: \log(10^{10} A_\mathrm{s}) - drop: true - ns: - value: 0.95 - latex: n_\mathrm{s} - As: - value: 'lambda logA: 1e-10*np.exp(logA)' - latex: A_\mathrm{s} - - mnu: - value: 0.06 - thetastar: - derived: true - latex: \Theta_\star - rdrag: - derived: True - latex: r_\mathrm{drag} - -theory: - camb: - path: ./external_modules/code/CAMB - extra_args: - #dark_energy_model: ppf - lmax: 1000 - - - - - -""" - - -####add main function. - - -#=================================================================================================== -# datavectors - -def generate_parameters(N, u_bound, l_bound, mode, parameters_file, save=True): - D = len(u_bound) - - if mode=='train': + def __save_chk(self): + # save data vector file ---------------------------------------------------- + if self.dvs_is_memmap == True: + self.datavectors.flush() # checkpoint dv in-place + else: + # save (flush) dvs to tmp file (safer) ----------------------------------- + np.save(f"{self.dvsf}.tmp.npy", self.datavectors) + # save data vector file (from tmp) --------------------------------------- + os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") + # save fail file ----------------------------------------------------------- + # save (flush) dvs to tmp file (safer) ------------------------------------- + np.savetxt(f"{self.failf}.tmp.txt", self.failed.astype(np.uint8), fmt="%d") + # save data vector file (from tmp) ----------------------------------------- + os.replace(f"{self.failf}.tmp.txt", f"{self.failf}.txt") + + #----------------------------------------------------------------------------- + # likelihood + #----------------------------------------------------------------------------- + def __param_logprior(self, x): + # because we shrink the prior, we need to do this check + if np.all((x >= self.bounds[:, 0]) & (x <= self.bounds[:, 1])): + return 0.0 + else: + return -np.inf + + def __param_logpost(self,x): + y = x - self.fiducial + logprior = self.model.prior.logp(x[self.reorder_idx_from_ord_to_yaml()]) + if math.isinf(logprior): + return -np.inf + elif math.isinf(self.__param_logprior(x)): + # this is important when --boundary command line option is < 1 + return -np.inf + else: + logp = (-0.5*(y @ self.inv_covmat @ y) + logprior)/self.temp + return logp + + #----------------------------------------------------------------------------- + # run mcmc + #----------------------------------------------------------------------------- + def 
__run_mcmc(self): + try: + loadedfromchk = self.__load_chk() + except Exception as e: + sys.stderr.write(f"[load_chk] failed: {e}\n") + traceback.print_exc(file=sys.stderr) + loadedfromchk = False + + if (loadedfromchk == False) or (loadedfromchk == True and self.append == 1): + ndim = len(self.sampled_params) + names = list(self.sampled_params) + + if not self.unif == 1: + # high number of samples: make sure we get unique samples + nparam = 40*self.nparams if self.bounds_adj < 1 else 20*self.nparams + nparams = max(nparam, 5000000) + nwalkers = int(10*ndim) + nsteps = int(max(7500, nparams/nwalkers)) # (for safety we assume tau>100) + burnin = int(0.1*nsteps) # 10% burn-in - N_LHS = int(0.05*N) - sampler = qmc.LatinHypercube(d=D) - sample = sampler.random(n=N_LHS) - sample_scaled = qmc.scale(sample, l_bound, u_bound) - - N_uni = N-N_LHS - data = np.random.uniform(low=l_bound, high=u_bound, size=(N_uni, D)) - samples = np.concatenate((sample_scaled, data), axis=0) + sampler = emcee.EnsembleSampler(nwalkers = nwalkers, + ndim = ndim, + moves=[(emcee.moves.DEMove(), 0.9), + (emcee.moves.DESnookerMove(), 0.1)], + log_prob_fn = self.__param_logpost) + sampler.run_mcmc(initial_state = self.fiducial[np.newaxis] + + 0.5*np.sqrt(np.diag(self.covmat))* + np.random.normal(size=(nwalkers,ndim)), + nsteps=nsteps, + progress=False) + xf = sampler.get_chain(flat=True, discard=burnin, thin=1) + xf, keep = np.unique(xf, axis=0, return_index=True) + lnp = sampler.get_log_prob(flat=True, discard=burnin, thin=1)[keep, None] + if len(xf) < self.nparams: + print(f"Warning: only {len(xf)} unique rows, requested {self.nparams}") + else: + indices = np.random.choice(np.arange(len(xf)), size=self.nparams, replace=False) + xf = xf[indices,:] + lnp = lnp[indices,:] + nparams = len(xf) + else: + nparams = self.nparams + bds = self.bounds.copy() + # extra safety so logprior is not -infty -------------------- + bds[:,0] = np.where(bds[:,0] > 0, 1.0001*self.bounds[:,0],0.9999*self.bounds[:,0]) + bds[:,1] = np.where(bds[:,1] > 0, 0.9999*self.bounds[:,1],1.0001*self.bounds[:,1]) + xf = np.random.uniform(low = bds[:,0], + high = bds[:,1], + size = (nparams,ndim)) + lnp = np.ones((nparams,1), dtype=self.dtype) + # Double check that prior is not -infty -------------------------------- + for i, x in enumerate(xf): + idx = self.reorder_idx_from_ord_to_yaml() + logprior = self.model.prior.logp(x[idx]) + if math.isinf(logprior): + raise ValueError(f"Sample {i} has -inf prior. 
(should not happen)" + f"Values: {dict(zip(self.sampled_params, x))}") + w = np.ones((nparams,1), dtype=self.dtype) + chi2 = -2*lnp + + if not loadedfromchk: + # Output some debug messaging ------------------------------------------ + if not self.unif == 1: + try: + tau = np.array(sampler.get_autocorr_time(quiet=True, has_walkers=True), + copy=True, + dtype=self.dtype).max() + print(f"Partial Result: tau = {tau}\n" + f"nwalkers={nwalkers}\n" + f"nsteps (per walker) = {nsteps}\n" + f"nsteps/tau = {nsteps/tau} (min should be ~50)\n" + f"nparams (after thin)={nparams}\n") + except Exception as e: + print(f"Partial Result: tau = N/A (emcee threw an exception)\n" + f"nwalkers={nwalkers}\n" + f"nsteps (per walker) = {nsteps}\n" + f"nparams (after thin)={nparams}\n") + tau = 1 # make sure main MPI worker does not crash over trivial check + + # save a range files --------------------------------------------------- + bds = self.bounds.copy() + hd = ["weights","lnp"] + names + rows = [(str(n),float(l),float(h)) for n,l,h in zip(names,bds[:,0],bds[:,1])] + with open(f"{self.paramsf}.ranges", "w") as f: + f.write(f"# {' '.join(hd)}\n") + f.writelines(f"{n} {l:.5e} {h:.5e}\n" for n, l, h in rows) + + # save chain begins ---------------------------------------------------- + fname = f"{self.paramsf}.1.txt"; + if not self.unif == 1: + hd=f"nwalkers={nwalkers}\n" + else: + hd=f"Uniform Sampling\n" + np.savetxt(fname, + np.concatenate([w, lnp, xf, chi2], axis=1), + fmt="%.9e", + header=hd + ' '.join(["weights", "lnp"] + names + ["chi2*"]), + comments="# ") + + # copy samples to self.samples ---------------------------------------- + self.samples = np.array(xf, copy=True, dtype=self.dtype) + + # save paramname files ------------------------------------------------- + param_info = self.model.info()['params'] + latex = [param_info[x]['latex'] for x in names] + paramnames = copy.deepcopy(names) + paramnames.append("chi2*") + latex.append("\\chi^2") + np.savetxt(f"{self.paramsf}.paramnames", + np.column_stack((paramnames,latex)), + fmt="%s") + + # save a cov matrix ------------------------------------------------------ + with contextlib.redirect_stdout(io.StringIO()): # so getdist dont write in terminal + np.savetxt(f"{self.paramsf}.covmat", + np.array(loadMCSamples(f"{self.paramsf}", + settings={'ignore_rows': u'0.'}).cov(pars=names), + copy=True, + dtype=self.dtype), + fmt="%.9e", + header=' '.join(names), + comments="# ") + + # delete arrays (save RAM) --------------------------------------------- + del w # save RAM memory + del xf # save RAM memory + del lnp # save RAM memory + del chi2 # save RAM memory + gc.collect() # save RAM memory + else: + # ---------------------------------------------------------------------- + # ---------------------------------------------------------------------- + # This option = loadedfromchk == True and self.append == 1 + # ---------------------------------------------------------------------- + # ---------------------------------------------------------------------- + # append chain file begins --------------------------------------------- + fname = f"{self.paramsf}.1.txt"; + with open(fname, "a") as f: # append mode + hd = ' '.join(["weights","lnp"] + names + ["chi2*"]) + np.savetxt(f, + np.concatenate([w, lnp, xf, chi2], axis=1), + header = hd if (os.path.getsize(fname) == 0) else "", + fmt = "%.9e") + del w # save RAM memory + del xf # save RAM memory + del lnp # save RAM memory + del chi2 # save RAM memory + gc.collect() # save RAM memory + + self.samples = 
np.atleast_2d(np.loadtxt(fname, dtype=self.dtype))[:,2:-1] + if self.samples.ndim != 2: + raise ValueError(f"samples must be 2D, got {self.samples.shape}") + # append chain file ends ----------------------------------------------- + + # append fail file begins ---------------------------------------------- + fname = f"{self.failf}.txt"; + failed = np.ones((nparams, 1), dtype=np.uint8) # start w/ all failed + with open(fname, "a") as f: # append mode + np.savetxt(f, failed.astype(np.uint8), fmt="%d") + + self.failed = np.atleast_1d(np.loadtxt(fname, dtype=np.uint8)) + self.failed = np.asarray(self.failed).astype(bool) + if self.failed.ndim != 1: + raise ValueError(f"failed must be 1D, got {self.failed.shape}") + + if self.samples.shape[0] != self.failed.shape[0]: + raise ValueError(f"Incompatible samples/failed chk files") + # append fail file begins ---------------------------------------------- + + # append dvs (with zeros) begins --------------------------------------- + nrows = self.datavectors.shape[0] + ncols = self.datavectors.shape[1] + nstride = 3 # 0: angular_diameter_distance data vector, + # 1: Hubble data vector, + # 2: derived parameters + RAMneed = ( self.samples.nbytes + + self.failed.nbytes + + self.datavectors.nbytes + + (nrows + nparams)*ncols*nstride*self.datavectors.dtype.itemsize) + RAMavail = psutil.virtual_memory().available + if RAMneed < 0.75 * RAMavail: + # setup new datavector numpy array ----------------------------------- + self.datavectors = np.vstack((self.datavectors, + np.zeros((nparams, ncols, nstride), dtype=self.dtype))) + # save (flush) dvs to tmp file (safer) ------------------------------- + np.save(f"{self.dvsf}.tmp.npy", self.datavectors) + # save data vector file (from tmp) ----------------------------------- + os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") + self.dvs_is_memmap = False + else: + print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " + f"There is {RAMavail/1e9:.2f} GB of RAM available. 
" + f"We will read dvs from HD (slow)") + # setup new datavector numpy array ----------------------------------- + datavectors = open_memmap(f"{self.dvsf}.tmp.npy", + mode = "w+", + shape = (nrows + nparams, ncols, nstride), + dtype = self.datavectors.dtype) + for s in range(0, nrows, 2500): # read dvs in chunks: avoid RAM spikes + e = min(nrows, s + 2500) + datavectors[s:e] = self.datavectors[s:e] + for s in range(nrows, nrows + nparams, 2500): + e = min(nrows + nparams, s + 2500) + datavectors[s:e] = 0 + # save (flush) data vector (in-place) -------------------------------- + datavectors.flush() + del datavectors + # save data vector file (from tmp) ----------------------------------- + os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") + # finally, load the new dv numpy array from file --------------------- + self.datavectors = np.load(f"{self.dvsf}.npy", + mmap_mode = "r+", + allow_pickle = False) + self.dvs_is_memmap = True + # append dvs ends ------------------------------------------------------ + + # check final dimensions ----------------------------------------------- + if self.datavectors.shape[0] != self.samples.shape[0]: + raise ValueError(f"Incompatible samples/datavector chk files") + + # update a parameter cov matrix ---------------------------------------- + with contextlib.redirect_stdout(io.StringIO()): # so getdist dont write in terminal + np.savetxt(f"{self.paramsf}.covmat", + np.array(loadMCSamples(f"{self.paramsf}", + settings={'ignore_rows': u'0.'}).cov(pars=names), + copy=True, + dtype=self.dtype), + fmt="%.9e", + header=' '.join(names), + comments="# ") + # set self.loadedfromchk ----------------------------------------------- + self.loadedfromchk = True + # set self.loadedsamples --------------------------------------------------- + self.loadedsamples = True + + #----------------------------------------------------------------------------- + # datavectors + #----------------------------------------------------------------------------- + def __allocate_data_vector(self, nrows, ncols, nstride): + RAMneed = ( self.samples.nbytes + + self.failed.nbytes + + nrows*ncols*nstride*np.dtype(self.dtype).itemsize ) + RAMavail = psutil.virtual_memory().available + if RAMneed < 0.75 * RAMavail: + self.datavectors = np.zeros((nrows, ncols, nstride), dtype=self.dtype) + self.dvs_is_memmap = False else: - samples = np.random.uniform(low=l_bound, high=u_bound, size=(N, D)) - - if save: - np.save(parameters_file, samples) - print('(Input Parameters) Saved!') - return samples -mode = args.mode -N = args.N -PATH = os.environ.get("ROOTDIR") + '/' + args.data_path -parameters_file = PATH + args.parameters_file - -if __name__ == '__main__': - f = yaml_load(yaml_string) - sys.modules["SimpleBAODVLikelihood"] = sys.modules[__name__] - model = get_model(f) + print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " + f"There is {RAMavail/1e9:.2f} GB of RAM available. 
" + f"We will read dvs from HD (slow)") + self.datavectors = open_memmap(f"{self.dvsf}.npy", + mode = "w+", + shape = (nrows, ncols, nstride), + dtype = self.dtype) + self.datavectors[::] = 0.0 + self.datavectors.flush() + self.dvs_is_memmap = True + + def _compute_dvs_from_sample(self, sample): + # Define fortran errors we want to capture --------------------------------- + camb_error_keywords = {"ERROR", "error", "Did not converge"} + + # Compute data vector (within using cobaya API) ---------------------------- + idx = self.reorder_idx_from_ord_to_yaml() + param = dict(self.model.parameterization.to_input( + sampled_params_values=dict(zip(self.names, sample[idx]))) + ) + self.model.provider.set_current_input_params(param) + + # Check prior before attempting computation -------------------------------- + if math.isinf(self.model.prior.logp(sample[idx])): + raise RuntimeError(f"Prior is -inf (this should not happen). " + f"Values: {dict(zip(self.sampled_params, sample))}") + + # Compute data vector (within using cobaya API) ---------------------------- + nrows = self.nztotal + ncols = 3 + out = np.zeros((nrows, ncols), dtype=self.dtype) + + captured = 0 # variable that will hold terminal output + with capture_native_output() as tmp: + for (x, _), z in zip(self.model._component_order.items(), + self.model._params_of_dependencies): + x.check_cache_and_compute( + params_values_dict = dict({p: param[p] for p in x.input_params}), + want_derived = self.derived, + dependency_params = list(param.keys()), + cached = True + ) + tmp.seek(0) + captured = tmp.read() # copy terminal output ----------------------------- - prior_params = list(model.parameterization.sampled_params()) - sampling_dim = len(prior_params) - datavectors_file_path = PATH + args.datavectors_file + # check for CAMB errors in the terminal output ----------------------------- + if any(kw in captured for kw in camb_error_keywords): + raise RuntimeError(f"CAMB Fortran error: {captured.strip()}") + + # get results from Theory block (already computed) ------------------------- + for (x, _), z in zip(self.model._component_order.items(), + self.model._params_of_dependencies): + if (hasattr(x,'get_angular_diameter_distance') and + callable(getattr(x, 'get_angular_diameter_distance')) and + hasattr(x,'get_Hubble') and + callable(getattr(x, 'get_Hubble')) + ): + + tmp1 = x.get_angular_diameter_distance(self.zarray)*(1+self.zarray)**2 + tmp2 = x.get_Hubble(self.zarray) + if (len(tmp1) != self.nztotal): + raise ValueError("len(angular_diameter_distance) != self.nztotal") + if (len(tmp2) != self.nztotal): + raise ValueError("len(Hubble) != self.nztotal") + out[:,0] = tmp1.copy() + out[:,1] = tmp2.copy() + if hasattr(x, 'get_param') and callable(getattr(x, 'get_param')): + for i, p in enumerate(self.derived): + try: + out[i,2] = x.get_param(p) + except Exception: + pass + return out + + def __generate_datavectors(self): + if not self.setup: + raise RuntimeError(f"Initial Setup not successful") + TTAG = 1 # Task tag + STAG = 0 # Stop tag + RTAG = 2 # Result tag + DTAG = 3 # Done (not crashed) tag + TASK_TIMEOUT = 1800 + STOP_TIMEOUT = 300.0 comm = MPI.COMM_WORLD rank = comm.Get_rank() - num_ranks = comm.Get_size() - - print('rank',rank,'is at barrier') - - z = model.likelihood['dummy'].z_data - len_z = len(z) - num_output = 2 - SN_DIR = datavectors_file_path + '_baosn.npy' - u_bound = model.prior.bounds()[:,1] - l_bound = model.prior.bounds()[:,0] - if rank == 0: - samples = generate_parameters(N, u_bound, l_bound, mode, parameters_file) - 
total_num_dvs = len(samples) - - param_info = samples[0:total_num_dvs:num_ranks]#reading for 0th rank input - for i in range(1,num_ranks):#sending other ranks' data - comm.send( - samples[i:total_num_dvs:num_ranks], - dest = i, - tag = 1 - ) - - else: - - param_info = comm.recv(source = 0, tag = 1) + size = comm.Get_size() + nworkers = size - 1 + + if size == 1: + if not self.loadedsamples: + raise RuntimeError(f"Model Samples not loaded/computed") - - num_datavector = len(param_info) + nparams = len(self.samples) - BAOSN = np.zeros( - (num_datavector, len_z, num_output), dtype = "float32" - ) + if not self.loadedfromchk: + # Allocate failed array begins ----------------------------------------- + self.failed = np.ones(nparams, dtype = np.uint8) # start w/ all failed + self.failed = np.asarray(self.failed).astype(bool) + + # Allocate data vectors begins ----------------------------------------- + nrows = nparams + ncols = self.nztotal + nstride = 3 # 0: angular_diameter_distance data vector, + # 1: Hubble data vector, + # 2: derived parameters + self.__allocate_data_vector(nrows=nrows, ncols=ncols, nstride=nstride) + # Allocate data vectors end -------------------------------------------- + + idx = np.arange(0, nparams) # indexes to compute data vectors + else: + idx = np.where(self.failed == True)[0] # indexes to compute data vectors - for i in range(num_datavector): - input_params = model.parameterization.to_input(param_info[i]) + for i in idx: try: - model.loglike(input_params) - theory = list(model.theory.values())[1] - H = theory.get_Hubble(z) - Dl = theory.get_angular_diameter_distance(z)*(1+z)**2 - - except: - print('fail') - else: - BAOSN[i,:,0] = H - BAOSN[i,:,1] = Dl - + dvs = self._compute_dvs_from_sample(self.samples[i]) + self.failed[i] = False + except Exception as e: # set datavector to zero and continue + self.failed[i] = True + self.datavectors[i,:,:] = 0.0 + sys.stderr.write(f"[Rank 0] Worker failed at idx={i}\n") + sys.stderr.write(f"[Rank 0] Exception type: {type(e).__name__}\n") + sys.stderr.write(f"[Rank 0] Exception message: {e}\n") + sys.stderr.write(f"[Rank 0] Traceback: {traceback.format_exc(limit=8)}\n") + sys.stderr.flush() + continue + self.datavectors[i,:,:] = dvs[:,:] + if i % self.freqchk == 0 and i > 0: + print(f"Model number: {i+1} (total: {nparams}) - checkpoint", flush=True) + self.__save_chk() + self.__save_chk() + else: + if rank == 0: + if not self.loadedsamples: + sys.stderr.write(f"Model Samples not loaded/computed\n") + sys.stderr.flush() + comm.Abort(1) + status = MPI.Status() + block = self.freqchk + next_block = 1 + too_frequent = True + nparams = len(self.samples) + completed = np.zeros(nparams, dtype=bool) - if rank == 0: - result_baosn = np.zeros((total_num_dvs, len_z, num_output), dtype="float32") - result_baosn[0:total_num_dvs:num_ranks] = BAOSN + if not self.loadedfromchk: + self.failed = np.ones(nparams, dtype=np.uint8) # start w/ all failed + self.failed = np.asarray(self.failed).astype(bool) + + # Allocate data vectors begins --------------------------------------- + nrows = nparams + ncols = self.nztotal + nstride = 3 # 0: angular_diameter_distance data vector, + # 1: Hubble data vector, + # 2: derived parameters + self.__allocate_data_vector(nrows=nrows, ncols=ncols, nstride=nstride) + # Allocate data vectors end ------------------------------------------ - for i in range(1,num_ranks): - result_baosn[i:total_num_dvs:num_ranks] = comm.recv(source = i, tag = 10) + idx0 = np.arange(0, nparams) # indexes to compute data vectors + else: + 
completed = ~self.failed + idx0 = np.where(self.failed == True)[0] # indexes to compute data vectors + + tasks = deque(idx0.tolist()) + nactive = min(nworkers, len(tasks)) + active = {} # Dict: key = worker (src), value: (idx, t_start) + + # Start MPI workers ---------------------------------------------------- + for w in range(1, nactive+1): + j = tasks.popleft() + comm.send((j, self.samples[j]), dest = w, tag = TTAG) + active[w] = (j, MPI.Wtime()) - np.save(SN_DIR, result_baosn) + # Send all tasks to active MPI workers --------------------------------- + count = 0 + while tasks: + # comm.Iprobe = non-blocking operation used to check for an incoming + # message without actually receiving it + # Why? protect the script against crashes (like CAMB/Class crash) + if comm.Iprobe(source = MPI.ANY_SOURCE, tag = RTAG, status = status): + kind, idx, payload = comm.recv(source = MPI.ANY_SOURCE, + tag = RTAG, + status = status) + count += 1 + src = status.Get_source() + if src in active: + del active[src] - else: - comm.send(BAOSN, dest = 0, tag = 10) + if kind == "err": # set datavector to zero and continue + self.datavectors[idx,:,:] = 0.0 + self.failed[idx] = True + sys.stderr.write(f"[Rank 0] Worker {src} failed at idx={idx}\n" + f"[Rank 0] Traceback: {payload}\n") + sys.stderr.flush() + else: + self.datavectors[idx,:,:] = payload[:,:] + self.failed[idx] = False + completed[idx] = True + if not self.loadedfromchk: + if count%block == 0: + too_frequent = False + if not too_frequent: + start = (next_block - 1) * block + end = min(nparams, next_block * block) + if completed[start:end].all(): + self.__save_chk() + too_frequent = True + next_block += 1 + else: + if count%block == 0: + self.__save_chk() + + j = tasks.popleft() + comm.send((j, self.samples[j]), + dest = src, + tag = TTAG) + active[src] = (j, MPI.Wtime()) + else: + doabort = False + for w, (idx, t0) in list(active.items()): + if (MPI.Wtime()-t0) > TASK_TIMEOUT: # no task runtime > TIMEOUT + sys.stderr.write(f"[Rank 0] Worker {w} at idx={idx} timed out (MPI RTAG)") + sys.stderr.flush() + doabort = True + if doabort: + for w, (idx, t0) in list(active.items()): # mark all running tasks as failed + self.datavectors[idx,:,:] = 0.0 + self.failed[idx] = True + completed[idx] = True + self.__save_chk() # save before crashing + comm.Abort(1) + time.sleep(.1) # avoid 100% CPU usage + # end of while loop + + # drain last tasks from active MPI workers ----------------------------- + while active: + # comm.Iprobe = non-blocking operation used to check for an incoming + # message without actually receiving it + # Why? 
protect the script against crashes (like CAMB/Class crash) + if comm.Iprobe(source = MPI.ANY_SOURCE, tag = RTAG, status = status): + kind, idx, payload = comm.recv(source = MPI.ANY_SOURCE, + tag = RTAG, + status = status) # drain results + src = status.Get_source() + if kind == "err": + self.datavectors[idx,:,:] = 0.0 + self.failed[idx] = True + sys.stderr.write(f"[Rank 0] Worker {src} failed at idx={idx}\n" + f"(MPI) Msg: {payload}\n") + sys.stderr.flush() + else: + self.datavectors[idx,:,:] = payload[:,:] + self.failed[idx] = False + completed[idx] = True + if src in active: # Remove worker from active list + del active[src] + else: + doabort = False + for w, (idx, t0) in list(active.items()): + if (MPI.Wtime()-t0) > TASK_TIMEOUT: # no task runtime > TIMEOUT + sys.stderr.write(f"[Rank 0] Worker {w} at idx={idx} timed out (MPI RTAG)") + sys.stderr.flush() + doabort = True + if doabort: + for w, (idx, t0) in list(active.items()): # mark all running tasks as failed + self.datavectors[idx,:,:] = 0.0 + self.failed[idx] = True + completed[idx] = True + self.__save_chk() # save before crashing + comm.Abort(1) + time.sleep(.1) # avoid 100% CPU usage + # end active workers + + # stop workers --------------------------------------------------------- + self.__save_chk() # save before sending stop sign + active = {} # reinitialize active (extra safety) + for w in range(1, nworkers + 1): # stop workers + comm.send((0, None), dest=w, tag=STAG) + active[w] = (0, MPI.Wtime()) + while active: + # comm.Iprobe = non-blocking operation used to check for an incoming + # message without actually receiving it + # Why? protect the script against crashes (like CAMB/Class crash) + if comm.Iprobe(source=MPI.ANY_SOURCE, tag=DTAG, status=status): + _ = comm.recv(source=MPI.ANY_SOURCE, tag=DTAG, status=status) + src = status.Get_source() + if src in active: + del active[src] + else: + for w, (_, t0) in list(active.items()): + if (MPI.Wtime()-t0) > STOP_TIMEOUT: # no task runtime > TIMEOUT + sys.stderr.write(f"[Rank 0] Worker {w} timed out (MPI DTAG)") + sys.stderr.flush() + comm.Abort(1) + time.sleep(.1) # avoid 100% CPU usage + # end stop workers + + else: + + status = MPI.Status() + while (True): + idx, sample = comm.recv(source = 0, + tag = MPI.ANY_TAG, + status = status) # try block on main b/c if + # rank zero throws an exception + # before send, MPI hangs + if (status.Get_tag() == STAG): + comm.send(("worker done", rank), dest = 0, tag = DTAG) + break + try: + dvs = self._compute_dvs_from_sample(sample) + comm.send(("ok", idx, dvs), dest = 0, tag = RTAG) + except Exception as e: + sys.stderr.write(f"[Rank {rank}] Exception type: {type(e).__name__}\n") + sys.stderr.write(f"[Rank {rank}] Exception message: {e}\n") + comm.send(("err", idx, traceback.format_exc(limit=8)), + dest = 0, + tag = RTAG) + continue + return +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +# main +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- -#mpirun -n 5 --oversubscribe --mca pml ^ucx --mca btl vader,tcp,self \ -# --bind-to core --map-by core --report-bindings --mca mpi_yield_when_idle 1 \ -# python datageneratorbaosn.py \ -# --data_path './trainingdata/' \ -# --datavectors_file 'dvfilename' \ -# --parameters_file 'paramfilename.npy' \ -# --N 100 \ -# --mode 'train' \ +if __name__ == "__main__": + comm = 
MPI.COMM_WORLD + rank = comm.Get_rank() + try: + generator = dataset() + except Exception: + traceback.print_exc() + comm.Abort(1) # other ranks don’t hang in recv/barrier + MPI.Finalize() + exit(0) +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- +#------------------------------------------------------------------------------- diff --git a/emultraining/dataset_generator_baosn_copy.py b/emultraining/dataset_generator_baosn_copy.py new file mode 100644 index 0000000..ba0fdb4 --- /dev/null +++ b/emultraining/dataset_generator_baosn_copy.py @@ -0,0 +1,268 @@ +import numpy as np +import cobaya +from cobaya.yaml import yaml_load +from cobaya.model import get_model +import sys +import os +import platform +import yaml +from mpi4py import MPI +from scipy.stats import qmc +import copy +import functools, iminuit, copy, argparse, random, time +import emcee, itertools +from cobaya.likelihood import Likelihood +from schwimmbad import MPIPool + + +parser = argparse.ArgumentParser(prog='cos_uniform') + + +class SimpleBAODVLikelihood(Likelihood): + # Example data can also be passed via YAML or hardcoded here + def initialize(self): + # Define data inside the class (or pass from outside if needed) + z1=np.linspace(0,3,600, endpoint=False) + z2=np.linspace(3,1200,200) + self.z_data = np.concatenate((z1,z2),axis=0) # example redshifts + + def get_requirements(self): + # Tell Cobaya which theory quantities you need at these redshifts + return { + "angular_diameter_distance": {"z": self.z_data}, + "Hubble": {"z": self.z_data} + + } + + def logp(self, **params_values): + # Get required theory quantities + return -0.5 + +parser.add_argument("--N", + dest="N", + help="Number of points requested", + type=int, + nargs='?', + const=1, + default=100) + +parser.add_argument("--mode", + dest="mode", + help="mode of points generated", + type=str, + nargs='?', + const=1, + default='train') +parser.add_argument("--data_path", + dest="data_path", + help="Directory for saving the data files", + type=str, + nargs='?', + const=1, + default='/data/') +parser.add_argument("--datavectors_file", + dest="datavectors_file", + help="Name for data vector files (no .npy included)", + type=str, + nargs='?', + const=1, + default='cos_uni') +parser.add_argument("--parameters_file", + dest="parameters_file", + help="Name for Parameter files (.npy included)", + type=str, + nargs='?', + const=1, + default='cos_uni_input.npy') +args, unknown = parser.parse_known_args() + +####add yaml here, and make all input paratemers passing in +yaml_string=r""" + +likelihood: + dummy: + class: SimpleBAODVLikelihood + +params: + + omegabh2: + prior: + min: 0.0 + max: 0.04 + ref: + dist: norm + loc: 0.022383 + scale: 0.005 + proposal: 0.005 + latex: \Omega_\mathrm{b} h^2 + omegach2: + prior: + min: 0.0 + max: 0.5 + ref: + dist: norm + loc: 0.12011 + scale: 0.03 + proposal: 0.03 + latex: \Omega_\mathrm{c} h^2 + H0: + prior: + min: 20 + max: 120 + ref: + dist: norm + loc: 67 + scale: 2 + proposal: 0.001 + latex: H_0 + tau: + value: 0.06 + latex: \tau_\mathrm{reio} + + logA: + value: 3.04 + latex: \log(10^{10} A_\mathrm{s}) + drop: true + ns: + value: 0.95 + latex: n_\mathrm{s} + As: + value: 'lambda 
logA: 1e-10*np.exp(logA)' + latex: A_\mathrm{s} + + mnu: + value: 0.06 + thetastar: + derived: true + latex: \Theta_\star + rdrag: + derived: True + latex: r_\mathrm{drag} + +theory: + camb: + path: ./external_modules/code/CAMB + extra_args: + #dark_energy_model: ppf + lmax: 1000 + + + + + +""" + + +####add main function. + + +#=================================================================================================== +# datavectors + +def generate_parameters(N, u_bound, l_bound, mode, parameters_file, save=True): + D = len(u_bound) + + if mode=='train': + + N_LHS = int(0.05*N) + sampler = qmc.LatinHypercube(d=D) + sample = sampler.random(n=N_LHS) + sample_scaled = qmc.scale(sample, l_bound, u_bound) + + N_uni = N-N_LHS + data = np.random.uniform(low=l_bound, high=u_bound, size=(N_uni, D)) + samples = np.concatenate((sample_scaled, data), axis=0) + else: + samples = np.random.uniform(low=l_bound, high=u_bound, size=(N, D)) + + if save: + np.save(parameters_file, samples) + print('(Input Parameters) Saved!') + return samples +mode = args.mode +N = args.N +PATH = os.environ.get("ROOTDIR") + '/' + args.data_path +parameters_file = PATH + args.parameters_file + +if __name__ == '__main__': + f = yaml_load(yaml_string) + sys.modules["SimpleBAODVLikelihood"] = sys.modules[__name__] + model = get_model(f) + + prior_params = list(model.parameterization.sampled_params()) + sampling_dim = len(prior_params) + datavectors_file_path = PATH + args.datavectors_file + comm = MPI.COMM_WORLD + rank = comm.Get_rank() + num_ranks = comm.Get_size() + + print('rank',rank,'is at barrier') + + z = model.likelihood['dummy'].z_data + len_z = len(z) + num_output = 2 + SN_DIR = datavectors_file_path + '_baosn.npy' + u_bound = model.prior.bounds()[:,1] + l_bound = model.prior.bounds()[:,0] + if rank == 0: + samples = generate_parameters(N, u_bound, l_bound, mode, parameters_file) + total_num_dvs = len(samples) + + param_info = samples[0:total_num_dvs:num_ranks]#reading for 0th rank input + for i in range(1,num_ranks):#sending other ranks' data + comm.send( + samples[i:total_num_dvs:num_ranks], + dest = i, + tag = 1 + ) + + else: + + param_info = comm.recv(source = 0, tag = 1) + + + num_datavector = len(param_info) + + BAOSN = np.zeros( + (num_datavector, len_z, num_output), dtype = "float32" + ) + + for i in range(num_datavector): + input_params = model.parameterization.to_input(param_info[i]) + try: + model.loglike(input_params) + theory = list(model.theory.values())[1] + H = theory.get_Hubble(z) + Dl = theory.get_angular_diameter_distance(z)*(1+z)**2 + + except: + print('fail') + else: + BAOSN[i,:,0] = H + BAOSN[i,:,1] = Dl + + + if rank == 0: + result_baosn = np.zeros((total_num_dvs, len_z, num_output), dtype="float32") + result_baosn[0:total_num_dvs:num_ranks] = BAOSN + + for i in range(1,num_ranks): + result_baosn[i:total_num_dvs:num_ranks] = comm.recv(source = i, tag = 10) + + np.save(SN_DIR, result_baosn) + + else: + comm.send(BAOSN, dest = 0, tag = 10) + + + + +#mpirun -n 5 --oversubscribe --mca pml ^ucx --mca btl vader,tcp,self \ +# --bind-to core --map-by core --report-bindings --mca mpi_yield_when_idle 1 \ +# python datageneratorbaosn.py \ +# --data_path './trainingdata/' \ +# --datavectors_file 'dvfilename' \ +# --parameters_file 'paramfilename.npy' \ +# --N 100 \ +# --mode 'train' \ + diff --git a/emultraining/dataset_generator_cmb.py b/emultraining/dataset_generator_cmb.py index 2e7e65a..23c8fd5 100644 --- a/emultraining/dataset_generator_cmb.py +++ b/emultraining/dataset_generator_cmb.py @@ -1,7 
diff --git a/emultraining/dataset_generator_cmb.py b/emultraining/dataset_generator_cmb.py index 2e7e65a..23c8fd5 100644 --- a/emultraining/dataset_generator_cmb.py +++ b/emultraining/dataset_generator_cmb.py @@ -1,7 +1,6 @@ import numpy as np import emcee, argparse, os, sys, yaml, time, traceback import psutil, gc, math, copy, tempfile -from cobaya.yaml import yaml_load from cobaya.model import get_model from mpi4py import MPI from pathlib import Path @@ -266,7 +265,7 @@ def __setup_flags(self): raise KeyError(f"Cobaya YAML missing required blocks {missing}: {self.yaml}") train_args = info["train_args"] - required_keys = ['probe', 'ord', 'lrange', 'derived'] + required_keys = ['probe', 'ord', 'lrange'] if not self.unif == 1: required_keys += ['fiducial', 'params_covmat_file'] @@ -288,9 +287,10 @@ def __setup_flags(self): self.sampled_params = train_args['ord'] # preferred ordering of params - self.derived = train_args['derived'] + self.derived = train_args['derived'] if 'derived' in train_args else [] self.lrange = np.array(train_args['lrange'], dtype=int) + if not self.unif == 1: fid = train_args["fiducial"] # load fiducial data vector @@ -422,12 +422,15 @@ def __load_chk(self): f"{self.paramsf}.ranges", f"{self.paramsf}.1.txt"]]) if loadchk: + # load sample file begins ---------------------------------------------- # columns 0/1 are weights, lnp. Last column is chi2 self.samples = np.atleast_2d(np.loadtxt(f"{self.paramsf}.1.txt", dtype=self.dtype))[:,2:-1] if self.samples.ndim != 2: raise ValueError(f"samples must be 2D, got {self.samples.shape}") - + # load sample file ends ------------------------------------------------ + + # load fail file begins ------------------------------------------------ self.failed = np.atleast_1d(np.loadtxt(f"{self.failf}.txt", dtype=np.uint8)) self.failed = np.asarray(self.failed).astype(bool) @@ -436,23 +439,26 @@ def __load_chk(self): if self.samples.shape[0] != self.failed.shape[0]: raise ValueError(f"Incompatible samples/failed chk files") + # load fail file ends -------------------------------------------------- # load datavectors begins ---------------------------------------------- arr = np.load(f"{self.dvsf}.npy", - mmap_mode="r", - allow_pickle=False) - RAMneed = arr.nbytes + self.samples.nbytes + self.failed.nbytes + mmap_mode = "r", + allow_pickle = False) + RAMneed = (arr.nbytes + + self.samples.nbytes + + self.failed.nbytes) RAMavail = psutil.virtual_memory().available if RAMneed < 0.75 * RAMavail: - self.datavectors = np.load(f"{self.dvsf}.npy", allow_pickle=False) + self.datavectors = np.load(f"{self.dvsf}.npy", allow_pickle = False) self.dvs_is_memmap = False else: print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " f"There is {RAMavail/1e9:.2f} GB of RAM available. " f"We will read dvs from HD (slow)") self.datavectors = np.load(f"{self.dvsf}.npy", - mmap_mode="r+", - allow_pickle=False) + mmap_mode = "r+", + allow_pickle = False) self.dvs_is_memmap = True del arr # load datavectors ends ------------------------------------------------ @@ -461,21 +467,26 @@ def __load_chk(self): raise ValueError(f"datavectors must be 3D, got {self.datavectors.shape}") if self.datavectors.shape[0] != self.samples.shape[0]: raise ValueError(f"Incompatible samples/datavector chk files") - if loadchk: - print("Loaded models from chk") - if self.append == 0: - self.loadedsamples = True - self.loadedfromchk = True + print("Loaded models from chk") + if self.append == 0: + self.loadedsamples = True + self.loadedfromchk = True rtnvar = True return rtnvar def __save_chk(self): + # save data vector file ---------------------------------------------------- if self.dvs_is_memmap == True: self.datavectors.flush() # checkpoint dv in-place else: + # save (flush) dvs to tmp file (safer) ----------------------------------- np.save(f"{self.dvsf}.tmp.npy", self.datavectors) + # save data vector file (from tmp) --------------------------------------- os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") + # save fail file ----------------------------------------------------------- + # save (flush) fail flags to tmp file (safer) ------------------------------ np.savetxt(f"{self.failf}.tmp.txt", self.failed.astype(np.uint8), fmt="%d") + # save fail file (from tmp) ------------------------------------------------ os.replace(f"{self.failf}.tmp.txt", f"{self.failf}.txt") #----------------------------------------------------------------------------- @@ -517,7 +528,8 @@ def __run_mcmc(self): if not self.unif == 1: # high number of samples: make sure we get unique samples - nparams = 40*self.nparams if self.bounds_adj < 1 else 20*self.nparams + nparam = 40*self.nparams if self.bounds_adj < 1 else 20*self.nparams + nparams = max(nparam, 5000000) nwalkers = int(10*ndim) nsteps = int(max(7500, nparams/nwalkers)) # (for safety we assume tau>100) burnin = int(0.1*nsteps) # 10% burn-in @@ -538,8 +550,9 @@ def __run_mcmc(self): if len(xf) < self.nparams: print(f"Warning: only {len(xf)} unique rows, requested {self.nparams}") else: - xf = xf[:self.nparams,:] - lnp = lnp[:self.nparams,:] + indices = np.random.choice(np.arange(len(xf)), size=self.nparams, replace=False) + xf = xf[indices,:] + lnp = lnp[indices,:] nparams = len(xf) else: nparams = self.nparams @@ -631,6 +644,11 @@ def __run_mcmc(self): del chi2 # save RAM memory gc.collect() # save RAM memory else: + # ---------------------------------------------------------------------- + # ---------------------------------------------------------------------- + # This branch handles loadedfromchk == True and self.append == 1 + # ---------------------------------------------------------------------- + # ---------------------------------------------------------------------- # append chain file begins --------------------------------------------- fname = f"{self.paramsf}.1.txt"; with open(fname, "a") as f: # append mode @@ -645,10 +663,10 @@ def __run_mcmc(self): del chi2 # save RAM memory gc.collect() # save RAM memory - self.samples = np.atleast_2d(np.loadtxt(fname, dtype=self.dtype))[:,2:-1] if self.samples.ndim != 2: raise ValueError(f"samples must be 2D, got {self.samples.shape}") + # append chain file ends ----------------------------------------------- # append fail file begins ---------------------------------------------- fname = f"{self.failf}.txt"; @@ -663,44 +681,52 @@ def __run_mcmc(self): if self.samples.shape[0] != self.failed.shape[0]: raise ValueError(f"Incompatible samples/failed chk files") + # append fail file ends ------------------------------------------------ - # Expand dvs begins ---------------------------------------------------- + # append dvs (with zeros) begins --------------------------------------- nrows = self.datavectors.shape[0] ncols = self.datavectors.shape[1] nstride = self.datavectors.shape[2] - RAMneed = ( self.samples.nbytes + self.failed.nbytes + + RAMneed = ( self.samples.nbytes + + self.failed.nbytes + self.datavectors.nbytes + (nrows + nparams)*ncols*nstride*self.datavectors.dtype.itemsize) RAMavail = psutil.virtual_memory().available + if RAMneed < 0.75 * RAMavail: + # setup new datavector numpy array ----------------------------------- self.datavectors = np.vstack((self.datavectors, - np.zeros((nparams,ncols,nstride), - dtype=self.dtype) - )) + np.zeros((nparams, ncols, nstride), dtype=self.dtype))) + # save (flush) dvs to tmp file (safer) ------------------------------- np.save(f"{self.dvsf}.tmp.npy", self.datavectors) + # save data vector file (from tmp) ----------------------------------- os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") self.dvs_is_memmap = False else: print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " f"There is {RAMavail/1e9:.2f} GB of RAM available. " f"We will read dvs from HD (slow)") + # setup new datavector numpy array ----------------------------------- datavectors = open_memmap(f"{self.dvsf}.tmp.npy", - mode="w+", - shape=(nrows + nparams, ncols, nstride), - dtype=self.datavectors.dtype) - for s in range(0, nrows, 2500): # chunks = avoid RAM spikes) + mode = "w+", + shape = (nrows + nparams, ncols, nstride), + dtype = self.datavectors.dtype) + for s in range(0, nrows, 2500): # read dvs in chunks: avoid RAM spikes e = min(nrows, s + 2500) datavectors[s:e] = self.datavectors[s:e] for s in range(nrows, nrows + nparams, 2500): e = min(nrows + nparams, s + 2500) datavectors[s:e] = 0 - datavectors.flush() + # save (flush) data vector (in-place) -------------------------------- + datavectors.flush() del datavectors + # save data vector file (from tmp) ----------------------------------- os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") + # finally, load the new dv numpy array from file --------------------- self.datavectors = np.load(f"{self.dvsf}.npy", - mmap_mode="r+", - allow_pickle=False) + mmap_mode = "r+", + allow_pickle = False) self.dvs_is_memmap = True # Expand dvs ends ------------------------------------------------------ @@ -718,17 +744,34 @@ def __run_mcmc(self): fmt="%.9e", header=' '.join(names), comments="# ") - - # set self.loadedfromchk ---------------------------------------------- + # set self.loadedfromchk ----------------------------------------------- self.loadedfromchk = True - - # set self.loadedsamples --------------------------------------------------- self.loadedsamples = True #----------------------------------------------------------------------------- # datavectors #-----------------------------------------------------------------------------
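The helper introduced in the hunk below centralizes the allocation logic that used to be duplicated in the serial and MPI branches: if samples, fail flags, and data vectors fit in under 75% of the RAM psutil reports as available, a plain in-memory array is used; otherwise the array is backed by an .npy memmap on disk. A standalone sketch of that decision, with a hypothetical dvsf file stem and without the class bookkeeping:

import numpy as np
import psutil
from numpy.lib.format import open_memmap

def allocate_data_vector(nrows, ncols, dvsf="dvs", dtype="float32"):
    RAMneed = nrows * ncols * np.dtype(dtype).itemsize
    RAMavail = psutil.virtual_memory().available
    if RAMneed < 0.75 * RAMavail:
        # plenty of RAM: keep the whole array in memory (dvs_is_memmap = False)
        return np.zeros((nrows, ncols), dtype=dtype), False
    # tight on RAM: back the array with an .npy file on disk (slower but bounded)
    dvs = open_memmap(f"{dvsf}.npy", mode="w+", shape=(nrows, ncols), dtype=dtype)
    dvs[:] = 0.0   # zero-fill so "not yet computed" rows are well defined
    dvs.flush()
    return dvs, True  # second value mirrors self.dvs_is_memmap

dvs, dvs_is_memmap = allocate_data_vector(nrows=1000, ncols=2500)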
+ def __allocate_data_vector(self, nrows, ncols, nstride): + RAMneed = ( self.samples.nbytes + + self.failed.nbytes + + nrows*ncols*nstride*np.dtype(self.dtype).itemsize ) + RAMavail = psutil.virtual_memory().available + if RAMneed < 0.75 * RAMavail: + self.datavectors = np.zeros((nrows, ncols, nstride), dtype=self.dtype) + self.dvs_is_memmap = False + else: + print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " + f"There is {RAMavail/1e9:.2f} GB of RAM available. " + f"We will read dvs from HD (slow)") + self.datavectors = open_memmap(f"{self.dvsf}.npy", + mode = "w+", + shape = (nrows, ncols, nstride), + dtype = self.dtype) + self.datavectors[::] = 0.0 + self.datavectors.flush() + self.dvs_is_memmap = True + def _compute_dvs_from_sample(self, sample): # Define fortran errors we want to capture --------------------------------- camb_error_keywords = {"ERROR", "error", "Did not converge"} @@ -750,20 +793,24 @@ def _compute_dvs_from_sample(self, sample): ncols = 5 out = np.zeros((nrows, ncols), dtype=self.dtype) - captured = 0 + captured = "" # will hold captured terminal output with capture_native_output() as tmp: for (x, _), z in zip(self.model._component_order.items(), self.model._params_of_dependencies): x.check_cache_and_compute( - params_values_dict=dict({p: param[p] for p in x.input_params}), - want_derived=self.derived, - dependency_params=list(param.keys()), - cached=True + params_values_dict = dict({p: param[p] for p in x.input_params}), + want_derived = self.derived, + dependency_params = list(param.keys()), + cached = True ) tmp.seek(0) - captured = tmp.read() + captured = tmp.read() # copy terminal output ----------------------------- + + # check for CAMB errors in the terminal output ----------------------------- if any(kw in captured for kw in camb_error_keywords): raise RuntimeError(f"CAMB Fortran error: {captured.strip()}") + + # get results from Theory block (already computed) ------------------------- for (x, _), z in zip(self.model._component_order.items(), self.model._params_of_dependencies): if (self.probe == "cmblensed" and @@ -817,34 +864,20 @@ def __generate_datavectors(self): nparams = len(self.samples) if not self.loadedfromchk: + # Allocate failed array begins ----------------------------------------- self.failed = np.ones(nparams, dtype=np.uint8) # start w/ all failed self.failed = np.asarray(self.failed).astype(bool) - # Allocate dvs begins -------------------------------------------------- + + # Allocate data vectors begins ----------------------------------------- nrows = nparams ncols = (self.lrange[1] - self.lrange[0]) + 1 nstride = 5 # TT, TE, EE, PHIPHI, EXTRA (waste a lot of RAM but simple) + self.__allocate_data_vector(nrows=nrows, ncols=ncols, nstride=nstride) + # Allocate data vectors end -------------------------------------------- - RAMneed = ( self.samples.nbytes + self.failed.nbytes + - nrows*ncols*nstride*np.dtype(self.dtype).itemsize ) - RAMavail = psutil.virtual_memory().available - if RAMneed < 0.75 * RAMavail: - self.datavectors = np.zeros((nrows, ncols, nstride), dtype=self.dtype) - self.dvs_is_memmap = False - else: - print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " - f"There is {RAMavail/1e9:.2f} GB of RAM available. " - f"We will read dvs from HD (slow)") - self.datavectors = open_memmap(f"{self.dvsf}.npy", - mode="w+", - shape=(nrows, ncols, nstride), - dtype=self.dtype) - self.datavectors[::] = 0.0 - self.datavectors.flush() - self.dvs_is_memmap = True - # Allocate dvs end ----------------------------------------------------- - idx = np.arange(0, nparams) + idx = np.arange(0, nparams) # indexes to compute data vectors else: - idx = np.where(self.failed == True)[0] + idx = np.where(self.failed == True)[0] # indexes to compute data vectors for i in idx: try: @@ -878,35 +911,21 @@ def __generate_datavectors(self): completed = np.zeros(nparams, dtype=bool) if not self.loadedfromchk: + # Allocate failed array begins --------------------------------------- self.failed = np.ones(nparams, dtype=np.uint8) # start w/ all failed self.failed = np.asarray(self.failed).astype(bool) - # Allocate dvs begins ------------------------------------------------ + + # Allocate data vectors begins --------------------------------------- nrows = nparams ncols = (self.lrange[1] - self.lrange[0]) + 1 nstride = 5 # TT, TE, EE, PHIPHI, EXTRA (waste a lot of RAM but simple) - - RAMneed = ( self.samples.nbytes + self.failed.nbytes + - nrows*ncols*nstride*np.dtype(self.dtype).itemsize ) - RAMavail = psutil.virtual_memory().available - if RAMneed < 0.75 * RAMavail: - self.datavectors = np.zeros((nrows, ncols, nstride), dtype=self.dtype) - self.dvs_is_memmap = False - else: - print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " - f"There is {RAMavail/1e9:.2f} GB of RAM available. " - f"We will read dvs from HD (slow)") - self.datavectors = open_memmap(f"{self.dvsf}.npy", - mode="w+", - shape=(nrows, ncols, nstride), - dtype=self.dtype) - self.datavectors[::] = 0.0 - self.datavectors.flush() - self.dvs_is_memmap = True - # Allocate dvs end --------------------------------------------------- - idx0 = np.arange(0, nparams) + self.__allocate_data_vector(nrows=nrows, ncols=ncols, nstride=nstride) + # Allocate data vectors end ------------------------------------------ + + idx0 = np.arange(0, nparams) # indexes to compute data vectors else: completed = ~self.failed - idx0 = np.where(self.failed == True)[0] + idx0 = np.where(self.failed == True)[0] # indexes to compute data vectors tasks = deque(idx0.tolist()) nactive = min(nworkers, len(tasks)) @@ -1090,4 +1109,4 @@ #------------------------------------------------------------------------------- #------------------------------------------------------------------------------- #------------------------------------------------------------------------------- -#------------------------------------------------------------------------------- \ No newline at end of file +#------------------------------------------------------------------------------- diff --git a/emultraining/dataset_generator_lensing.py b/emultraining/dataset_generator_lensing.py index b3aec08..f8e08e1 100644 --- a/emultraining/dataset_generator_lensing.py +++ b/emultraining/dataset_generator_lensing.py @@ -1,7 +1,6 @@ import numpy as np import emcee, argparse, os, sys, yaml, time, traceback import psutil, gc, math, copy, tempfile -from cobaya.yaml import yaml_load from cobaya.model import get_model from mpi4py import MPI from pathlib import Path @@ -418,12 +417,15 @@ def __load_chk(self): f"{self.paramsf}.ranges", f"{self.paramsf}.1.txt"]]) if loadchk: + # load sample file begins ---------------------------------------------- # columns 0/1 are weights, lnp. Last column is chi2 self.samples = np.atleast_2d(np.loadtxt(f"{self.paramsf}.1.txt", dtype=self.dtype))[:,2:-1] if self.samples.ndim != 2: raise ValueError(f"samples must be 2D, got {self.samples.shape}") - + # load sample file ends ------------------------------------------------ + + # load fail file begins ------------------------------------------------ self.failed = np.atleast_1d(np.loadtxt(f"{self.failf}.txt", dtype=np.uint8)) self.failed = np.asarray(self.failed).astype(bool) @@ -432,23 +434,26 @@ def __load_chk(self): if self.samples.shape[0] != self.failed.shape[0]: raise ValueError(f"Incompatible samples/failed chk files") + # load fail file ends -------------------------------------------------- # load datavectors begins ---------------------------------------------- arr = np.load(f"{self.dvsf}.npy", - mmap_mode="r", - allow_pickle=False) - RAMneed = arr.nbytes + self.samples.nbytes + self.failed.nbytes + mmap_mode = "r", + allow_pickle = False) + RAMneed = (arr.nbytes + + self.samples.nbytes + + self.failed.nbytes) RAMavail = psutil.virtual_memory().available if RAMneed < 0.75 * RAMavail: - self.datavectors = np.load(f"{self.dvsf}.npy", allow_pickle=False) + self.datavectors = np.load(f"{self.dvsf}.npy", allow_pickle = False) self.dvs_is_memmap = False else: print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " f"There is {RAMavail/1e9:.2f} GB of RAM available. " f"We will read dvs from HD (slow)") self.datavectors = np.load(f"{self.dvsf}.npy", - mmap_mode="r+", - allow_pickle=False) + mmap_mode = "r+", + allow_pickle = False) self.dvs_is_memmap = True del arr # load datavectors ends ------------------------------------------------ @@ -466,12 +471,18 @@ def __load_chk(self): return rtnvar def __save_chk(self): + # save data vector file ---------------------------------------------------- if self.dvs_is_memmap == True: self.datavectors.flush() # checkpoint dv in-place else: + # save (flush) dvs to tmp file (safer) ----------------------------------- np.save(f"{self.dvsf}.tmp.npy", self.datavectors) + # save data vector file (from tmp) --------------------------------------- os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") + # save fail file ----------------------------------------------------------- + # save (flush) fail flags to tmp file (safer) ------------------------------ np.savetxt(f"{self.failf}.tmp.txt", self.failed.astype(np.uint8), fmt="%d") + # save fail file (from tmp) ------------------------------------------------ os.replace(f"{self.failf}.tmp.txt", f"{self.failf}.txt") #----------------------------------------------------------------------------- @@ -513,7 +524,8 @@ def __run_mcmc(self): if not self.unif == 1: # high number of samples: make sure we get unique samples - nparams = 40*self.nparams if self.bounds_adj < 1 else 20*self.nparams + nparam = 40*self.nparams if self.bounds_adj < 1 else 20*self.nparams + nparams = max(nparam, 5000000) nwalkers = int(10*ndim) nsteps = int(max(7500, nparams/nwalkers)) # (for safety we assume tau>100) burnin = int(0.1*nsteps) # 10% burn-in @@ -534,8 +546,9 @@ def __run_mcmc(self): if len(xf) < self.nparams: print(f"Warning: only {len(xf)} unique rows, requested {self.nparams}") else: - xf = xf[:self.nparams,:] - lnp = lnp[:self.nparams,:] + indices = np.random.choice(np.arange(len(xf)), size=self.nparams, replace=False) + xf = xf[indices,:] + lnp = lnp[indices,:] nparams = len(xf) else: nparams = self.nparams @@ -627,6 +640,11 @@ def __run_mcmc(self): del chi2 # save RAM memory gc.collect() # save RAM memory
else: + # ---------------------------------------------------------------------- + # ---------------------------------------------------------------------- + # This branch handles loadedfromchk == True and self.append == 1 + # ---------------------------------------------------------------------- + # ---------------------------------------------------------------------- # append chain file begins --------------------------------------------- fname = f"{self.paramsf}.1.txt"; with open(fname, "a") as f: # append mode @@ -641,10 +659,10 @@ def __run_mcmc(self): del chi2 # save RAM memory gc.collect() # save RAM memory - self.samples = np.atleast_2d(np.loadtxt(fname, dtype=self.dtype))[:,2:-1] if self.samples.ndim != 2: raise ValueError(f"samples must be 2D, got {self.samples.shape}") + # append chain file ends ----------------------------------------------- # append fail file begins ---------------------------------------------- fname = f"{self.failf}.txt"; @@ -659,43 +677,51 @@ if self.samples.shape[0] != self.failed.shape[0]: raise ValueError(f"Incompatible samples/failed chk files") + # append fail file ends ------------------------------------------------ - # Expand dvs begins ---------------------------------------------------- + # append dvs (with zeros) begins --------------------------------------- nrows = self.datavectors.shape[0] ncols = self.datavectors.shape[1] - RAMneed = ( self.samples.nbytes + self.failed.nbytes + + RAMneed = ( self.samples.nbytes + + self.failed.nbytes + self.datavectors.nbytes + (nrows + nparams)*ncols*self.datavectors.dtype.itemsize) RAMavail = psutil.virtual_memory().available + if RAMneed < 0.75 * RAMavail: + # setup new datavector numpy array ----------------------------------- self.datavectors = np.vstack((self.datavectors, - np.zeros((nparams,ncols), - dtype=self.dtype) - )) + np.zeros((nparams, ncols), dtype=self.dtype))) + # save (flush) dvs to tmp file (safer) ------------------------------- np.save(f"{self.dvsf}.tmp.npy", self.datavectors) + # save data vector file (from tmp) ----------------------------------- os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") self.dvs_is_memmap = False else: print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " f"There is {RAMavail/1e9:.2f} GB of RAM available. 
" f"We will read dvs from HD (slow)") + # setup new datavector numpy array ----------------------------------- datavectors = open_memmap(f"{self.dvsf}.tmp.npy", - mode="w+", - shape=(nrows + nparams, ncols), - dtype=self.datavectors.dtype) - for s in range(0, nrows, 2500): # chunks = avoid RAM spikes) + mode = "w+", + shape = (nrows + nparams, ncols), + dtype = self.datavectors.dtype) + for s in range(0, nrows, 2500): # read dvs in chunks: avoid RAM spikes e = min(nrows, s + 2500) datavectors[s:e] = self.datavectors[s:e] for s in range(nrows, nrows + nparams, 2500): e = min(nrows + nparams, s + 2500) datavectors[s:e] = 0 + # save (flush) data vector (in-place) -------------------------------- datavectors.flush() del datavectors + # save data vector file (from tmp) ----------------------------------- os.replace(f"{self.dvsf}.tmp.npy", f"{self.dvsf}.npy") + # finally, load the new dv numpy array from file --------------------- self.datavectors = np.load(f"{self.dvsf}.npy", - mmap_mode="r+", - allow_pickle=False) + mmap_mode = "r+", + allow_pickle = False) self.dvs_is_memmap = True # Expand dvs ends ------------------------------------------------------ @@ -713,17 +739,34 @@ def __run_mcmc(self): fmt="%.9e", header=' '.join(names), comments="# ") - - # set self.loadedfromchk ---------------------------------------------- + # set self.loadedfromchk ----------------------------------------------- self.loadedfromchk = True - - # set self.loadedsamples --------------------------------------------------- self.loadedsamples = True #----------------------------------------------------------------------------- # datavectors #----------------------------------------------------------------------------- + def __allocate_data_vector(self, nrows, ncols): + RAMneed = ( self.samples.nbytes + + self.failed.nbytes + + nrows*ncols*np.dtype(self.dtype).itemsize) + RAMavail = psutil.virtual_memory().available + if RAMneed < 0.75 * RAMavail: + self.datavectors = np.zeros((nrows, ncols), dtype=self.dtype) + self.dvs_is_memmap = False + else: + print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " + f"There is {RAMavail/1e9:.2f} GB of RAM available. 
" + f"We will read dvs from HD (slow)") + self.datavectors = open_memmap(f"{self.dvsf}.npy", + mode = "w+", + shape = (nrows, ncols), + dtype = self.dtype) + self.datavectors[:] = 0.0 + self.datavectors.flush() + self.dvs_is_memmap = True + def _compute_dvs_from_sample(self, sample): # Define fortran errors we want to capture --------------------------------- camb_error_keywords = {"ERROR", "error", "Did not converge"} @@ -743,7 +786,7 @@ def _compute_dvs_from_sample(self, sample): # Compute data vector (within using cobaya API) ---------------------------- likelihood = self.model.likelihood[list(self.model.likelihood.keys())[0]] - captured = 0 + captured = 0 # variable that will hold terminal output with capture_native_output() as tmp: for (x, _), z in zip(self.model._component_order.items(), self.model._params_of_dependencies): @@ -754,12 +797,15 @@ def _compute_dvs_from_sample(self, sample): cached=True ) tmp.seek(0) - captured = tmp.read() + captured = tmp.read() # copy terminal output ----------------------------- + + # check for CAMB errors in the terminal output ----------------------------- if any(kw in captured for kw in camb_error_keywords): raise RuntimeError(f"CAMB Fortran error: {captured.strip()}") + return np.array(likelihood.get_datavector(**param), - copy=True, - dtype=self.dtype) + copy = True, + dtype = self.dtype) def __generate_datavectors(self): if not self.setup: @@ -782,9 +828,11 @@ def __generate_datavectors(self): nparams = len(self.samples) if not self.loadedfromchk: + # Allocate failed array begins ----------------------------------------- self.failed = np.ones(nparams, dtype=np.uint8) # start w/ all failed self.failed = np.asarray(self.failed).astype(bool) - # Allocate dvs begins -------------------------------------------------- + + # Allocate data vectors begins ----------------------------------------- try: # First run: get data vector size dvs = self._compute_dvs_from_sample(self.samples[0]) except Exception: @@ -792,30 +840,15 @@ def __generate_datavectors(self): f"Cannot determine datavector length.") nrows = nparams ncols = len(dvs) - - RAMneed = ( self.samples.nbytes + self.failed.nbytes + - nrows*ncols*dvs.dtype.itemsize) - RAMavail = psutil.virtual_memory().available - if RAMneed < 0.75 * RAMavail: - self.datavectors = np.zeros((nrows, ncols), dtype=self.dtype) - self.dvs_is_memmap = False - else: - print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " - f"There is {RAMavail/1e9:.2f} GB of RAM available. 
" - f"We will read dvs from HD (slow)") - self.datavectors = open_memmap(f"{self.dvsf}.npy", - mode="w+", - shape=(nrows, ncols), - dtype=self.dtype) - self.datavectors[:] = 0.0 - self.datavectors.flush() - self.dvs_is_memmap = True - # Allocate dvs end ----------------------------------------------------- - self.datavectors[0] = dvs - self.failed[0] = False - idx = np.arange(1, nparams) + self.__allocate_data_vector(nrows=nrows, ncols=ncols) + # Allocate data vectors end -------------------------------------------- + + self.datavectors[0] = dvs # first data vector was already computed + self.failed[0] = False # first data vector was already computed + + idx = np.arange(1, nparams) # indexes to compute data vectors else: - idx = np.where(self.failed == True)[0] + idx = np.where(self.failed == True)[0] # indexes to compute data vectors for i in idx: try: @@ -850,9 +883,11 @@ def __generate_datavectors(self): completed = np.zeros(nparams, dtype=bool) if not self.loadedfromchk: + # Allocate failed array begins --------------------------------------- self.failed = np.ones(nparams, dtype=np.uint8) # start w/ all failed self.failed = np.asarray(self.failed).astype(bool) - # Allocate dvs begins ------------------------------------------------ + + # Allocate data vectors begins --------------------------------------- try: # First run: get data vector size dvs = self._compute_dvs_from_sample(self.samples[0]) except Exception: @@ -863,32 +898,16 @@ def __generate_datavectors(self): comm.Abort(1) nrows = nparams ncols = len(dvs) - - RAMneed = ( self.samples.nbytes + self.failed.nbytes + - nrows*ncols*dvs.dtype.itemsize) - RAMavail = psutil.virtual_memory().available - if RAMneed < 0.75 * RAMavail: - self.datavectors = np.zeros((nrows, ncols), dtype=self.dtype) - self.dvs_is_memmap = False - else: - print(f"Warning: samples & dvs need {RAMneed/1e9:.2f} GB of RAM. " - f"There is {RAMavail/1e9:.2f} GB of RAM available. " - f"We will read dvs from HD (slow)") - self.datavectors = open_memmap(f"{self.dvsf}.npy", - mode="w+", - shape=(nrows, ncols), - dtype=self.dtype) - self.datavectors[:] = 0.0 - self.datavectors.flush() - self.dvs_is_memmap = True - # Allocate dvs end --------------------------------------------------- - self.datavectors[0] = dvs - self.failed[0] = False - completed[0] = True - idx0 = np.arange(1, nparams) + self.__allocate_data_vector(nrows=nrows, ncols=ncols) + # Allocate data vectors end ------------------------------------------ + + self.datavectors[0] = dvs # first data vector was already computed + self.failed[0] = False # first data vector was already computed + completed[0] = True # first data vector was already computed + idx0 = np.arange(1, nparams) # indexes to compute data vectors else: completed = ~self.failed - idx0 = np.where(self.failed == True)[0] + idx0 = np.where(self.failed == True)[0] # indexes to compute data vectors tasks = deque(idx0.tolist()) nactive = min(nworkers, len(tasks)) @@ -1072,4 +1091,4 @@ def __generate_datavectors(self): #------------------------------------------------------------------------------- #------------------------------------------------------------------------------- #------------------------------------------------------------------------------- -#------------------------------------------------------------------------------- \ No newline at end of file +#-------------------------------------------------------------------------------