Implement control for implicit parallelism using --max_cpu_cores argument

2026-01-18 00:06:33 +08:00
parent cfe7f88162
commit 1d682c130d
1 changed files with 16 additions and 0 deletions
--- a/evaluate_next_event.py
+++ b/evaluate_next_event.py
@@ -186,6 +186,22 @@ def _compute_next_event_auc_clean_control(
 def main() -> None:
    args = parse_args()
    # Best-effort control of implicit parallelism to avoid CPU oversubscription.
    # Note: environment variables are ideally set before importing NumPy/PyTorch,
    # but setting them early in main can still affect subprocesses or lazy readers.
    if int(args.max_cpu_cores) > 0:
        n_threads = int(args.max_cpu_cores)
        torch.set_num_threads(n_threads)
        for k in (
            "OMP_NUM_THREADS",
            "MKL_NUM_THREADS",
            "OPENBLAS_NUM_THREADS",
            "VECLIB_MAXIMUM_THREADS",
            "NUMEXPR_NUM_THREADS",
        ):
            os.environ[k] = str(n_threads)
        print(f"Restricting implicit parallelism to {n_threads} threads.")
    seed_everything(args.seed)
    show_progress = (not args.no_tqdm)