From 20ae6921d37f8efa53ce71db73330f712502a079 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Tue, 6 Jan 2026 00:46:33 +0100
Subject: [PATCH 01/11] Add hucira tool (run_one_enrichment_test only)

---
 pertpy/tools/__init__.py |   2 +
 pertpy/tools/_hucira.py  | 374 +++++++++++++++++++++++++++++++++++++++
 2 files changed, 376 insertions(+)
 create mode 100644 pertpy/tools/_hucira.py

diff --git a/pertpy/tools/__init__.py b/pertpy/tools/__init__.py
index 06a44cd7..5105cf46 100644
--- a/pertpy/tools/__init__.py
+++ b/pertpy/tools/__init__.py
@@ -7,6 +7,7 @@
 from pertpy.tools._distances._distance_tests import DistanceTest
 from pertpy.tools._distances._distances import Distance
 from pertpy.tools._enrichment import Enrichment
+from pertpy.tools._hucira import hucira
 from pertpy.tools._milo import Milo
 from pertpy.tools._mixscape import Mixscape
 from pertpy.tools._perturbation_space._clustering import ClusteringSpace
@@ -68,6 +69,7 @@ def __dir__():
     "DistanceTest",
     "Distance",
     "Enrichment",
+    "hucira",
     "Milo",
     "Mixscape",
     "ClusteringSpace",
diff --git a/pertpy/tools/_hucira.py b/pertpy/tools/_hucira.py
new file mode 100644
index 00000000..78b2a62a
--- /dev/null
+++ b/pertpy/tools/_hucira.py
@@ -0,0 +1,374 @@
+from typing import Literal
+
+import blitzgsea
+import gseapy as gp
+import numpy as np
+import pandas as pd
+from anndata import AnnData
+
+
+def _vprint(msg, verbose):
+    if verbose:  # stay silent unless the caller asked for progress messages
+        print(msg)
+
+
+class hucira:
+    def _get_genesets(
+        self,
+        adata: AnnData,
+        df: pd.DataFrame,
+        celltype_signature: str,
+        direction: Literal["upregulated", "downregulated", "both"] | None = None,
+        threshold_pval: float | None = None,
+        threshold_lfc: float | None = None,
+    ) -> tuple[dict[str, list[str]], pd.DataFrame]:
+        """Get shared gene sets between query adata and the Human Cytokine Dictionary, CIP signatures, or custom gene signatures of a chosen cell type.
+
+        Parameters
+        ----------
+        - adata: AnnData object with gene expression data; only adata.var_names is used here.
+        - df: Either hcd, CIP signature, or a custom dataframe containing columns ["gene", "query_program", "celltype"].
+        - celltype_signature: celltype naming convention needs to match df.celltype
+        - direction: Relevant for hcd, but not for CIP or custom gene program. Any other value raises ValueError for hcd input.
+        - threshold_pval: Relevant for hcd (upper bound on adj_p_value), but not for CIP or custom gene program
+        - threshold_lfc: Relevant for hcd (log fold change cutoff; for "downregulated" its magnitude is used), but not for CIP or custom gene program
+
+        Returns:
+        -------
+        - gene_set_dict: dictionary with cytokine/CIP/program as key and the genes shared with adata.var_names as values
+        - gene_set_df: df containing information on gene overlap between query data and gene program for chosen cell type
+        """
+        required_for_hcd = ["log_fc", "adj_p_value", "cytokine"]
+        required_for_CIP = ["gene", "CIP", "celltype"]
+
+        # Construct signature gene set if input is human cytokine dictionary
+        if set(required_for_hcd).issubset(df.columns):
+            print(f"Computing gene sets of Human Cytokine Dictionary for {celltype_signature}.")
+            select = (df.adj_p_value <= threshold_pval) & (df.celltype == celltype_signature)
+            if direction == "upregulated":
+                select = select & (df.log_fc >= threshold_lfc)
+            elif direction == "downregulated":
+                # threshold_lfc is treated as a magnitude here: downregulated genes have log_fc <= -|threshold_lfc|
+                select = select & (df.log_fc <= -abs(threshold_lfc))
+            elif direction == "both":
+                select = select & (df.log_fc.abs() >= threshold_lfc)
+            else:
+                raise ValueError(f"Invalid direction: {direction}.")
+            df = df.loc[select]
+
+            gene_set_dict = {}
+            gene_set_df = pd.DataFrame()
+            for cytokine_i, cytokine in enumerate(df.cytokine.unique()):
+                gene_set = df.loc[df.cytokine == cytokine].gene.values
+                gene_set_shared = np.intersect1d(gene_set, adata.var_names)
+                gene_set_df.loc[cytokine_i, "cytokine"] = cytokine
+                gene_set_df.loc[cytokine_i, "num_genes_signature"] = len(gene_set)
+                gene_set_df.loc[cytokine_i, "num_shared_genes_signature"] = len(gene_set_shared)
+                gene_set_df.loc[cytokine_i, "frac_shared_genes_signature"] = len(gene_set_shared) / len(gene_set)
+                gene_set_dict[cytokine] = gene_set_shared
+
+        # Construct signature gene set if input is CIP signatures
+        elif set(required_for_CIP).issubset(df.columns):
+            print(f"Computing gene sets of Cytokine-induced gene programs for {celltype_signature}.")
+            select = df.celltype == celltype_signature
+            df = df.loc[select]
+            gene_set_dict = {}
+            gene_set_df = pd.DataFrame()
+            for CIP_i, CIP in enumerate(df.CIP.unique()):
+                gene_set = df.loc[df.CIP == CIP].gene.values
+                gene_set_shared = np.intersect1d(gene_set, adata.var_names)
+                gene_set_df.loc[CIP_i, "CIP"] = CIP
+                gene_set_df.loc[CIP_i, "num_genes_signature"] = len(gene_set)
+                gene_set_df.loc[CIP_i, "num_shared_genes_signature"] = len(gene_set_shared)
+                gene_set_df.loc[CIP_i, "frac_shared_genes_signature"] = len(gene_set_shared) / len(gene_set)
+                gene_set_dict[CIP] = gene_set_shared
+
+        # Construct signature gene set for custom gene programs
+        elif "query_program" in df.columns:
+            print(f"Computing gene sets of user-defined gene programs for {celltype_signature}.")
+            select = df.celltype == celltype_signature
+            df = df.loc[select]
+            gene_set_dict = {}
+            gene_set_df = pd.DataFrame()
+            for query_program_i, query_program in enumerate(df.query_program.unique()):
+                gene_set = df.loc[df.query_program == query_program].gene.values
+                gene_set_shared = np.intersect1d(gene_set, adata.var_names)
+                gene_set_df.loc[query_program_i, "query_program"] = query_program
+                gene_set_df.loc[query_program_i, "num_genes_signature"] = len(gene_set)
+                gene_set_df.loc[query_program_i, "num_shared_genes_signature"] = len(gene_set_shared)
+                gene_set_df.loc[query_program_i, "frac_shared_genes_signature"] = len(gene_set_shared) / len(gene_set)
+                gene_set_dict[query_program] = gene_set_shared
+
+        else:
+            raise ValueError(
+                "invalid input for df parameter. You can use either the Human Cytokine Dictionary with load_human_cytokine_dict(), or our CIP signatures with load_CIP_signatures(). If you want to compute enrichment of custom gene sets, df must have columns: ['gene', 'query_program', 'celltype']."
+            )
+        return gene_set_dict, gene_set_df
+
+    def _compute_mu_and_sigma(self, adata: AnnData, contrast_column: str, condition: str) -> dict:
+        """Return per-gene mean ("mu"), sample std ("sigma", ddof=1) and cell count ("num_cells") for one condition."""
+        group = adata[adata.obs[contrast_column] == condition]
+        X = group.X.toarray() if hasattr(group.X, "toarray") else group.X
+        mu = np.mean(X, axis=0)
+        sigma = np.std(X, axis=0, ddof=1)
+        return {"mu": mu, "sigma": sigma, "num_cells": group.shape[0]}
+
+    def _compute_s2n(
+        self,
+        adata: AnnData,
+        contrast_column: str,
+        condition_1: str,
+        condition_2: str,
+        precomputed_stats: dict | None = None,
+    ) -> tuple[pd.DataFrame, pd.DataFrame]:
+        """Compute the signal-to-noise ratio (S2N) for each gene between two conditions in an AnnData object.
+
+        Parameters
+        ----------
+        - adata: AnnData object with gene expression data.
+        - contrast_column: Key in `adata.obs` indicating the condition labels (e.g. "disease_state").
+        - condition_1, condition_2: Names of the first and second condition (e.g., "flare" and "healthy").
+        - precomputed_stats: Optional dict keyed by condition with entries "mu", "sigma" and "num_cells"; if given, these are used instead of recomputing from adata.X.
+
+        Returns:
+        -------
+        - (stats, num_cells): DataFrame of S2N values indexed by adata.var_names with one column "<condition_1>_vs_<condition_2>", and a one-row DataFrame with columns num_cells_1 / num_cells_2.
+        """
+        if precomputed_stats is None:
+            # Select cells for each condition
+            group1 = adata[adata.obs[contrast_column] == condition_1]
+            group2 = adata[adata.obs[contrast_column] == condition_2]
+
+            # number of cells per condition
+            num_cells_1 = group1.shape[0]
+            num_cells_2 = group2.shape[0]
+
+            # Get expression matrices
+            X1 = group1.X.toarray() if hasattr(group1.X, "toarray") else group1.X
+            X2 = group2.X.toarray() if hasattr(group2.X, "toarray") else group2.X
+
+            # Compute mean and std per gene
+            mu1 = np.mean(X1, axis=0)
+            mu2 = np.mean(X2, axis=0)
+            sigma1 = np.std(X1, axis=0, ddof=1)
+            sigma2 = np.std(X2, axis=0, ddof=1)
+
+        else:
+            _vprint("Using precomputed stats", True)
+            num_cells_1 = precomputed_stats[condition_1]["num_cells"]
+            num_cells_2 = precomputed_stats[condition_2]["num_cells"]
+            mu1 = precomputed_stats[condition_1]["mu"]
+            mu2 = precomputed_stats[condition_2]["mu"]
+            sigma1 = precomputed_stats[condition_1]["sigma"]
+            sigma2 = precomputed_stats[condition_2]["sigma"]
+
+        # Compute S2N
+        s2n = (mu1 - mu2) / (sigma1 + sigma2 + 1e-8)  # epsilon to avoid division by zero
+
+        num_cells = pd.DataFrame(
+            index=[f"{condition_1}_vs_{condition_2}"],
+            columns=["num_cells_1", "num_cells_2"],
+            data=[[num_cells_1, num_cells_2]],
+        )
+        stats = pd.DataFrame(s2n, index=adata.var_names, columns=[f"{condition_1}_vs_{condition_2}"])
+
+        return stats, num_cells
+
+    def _compute_ranking_statistic(
+        self, adata: AnnData, contrast_column: str, contrasts_combo: list[tuple[str, str]]
+    ) -> tuple[pd.DataFrame, pd.DataFrame]:
+        rnk_stats, num_cells = [], []  # one entry per contrast, concatenated at the end
+        precomputed_stats = {}  # condition -> {"mu", "sigma", "num_cells"}
+
+        conditions = []
+        for condition in contrasts_combo:
+            conditions.extend([condition[0], condition[1]])
+        conditions = np.unique(conditions)  # each condition's stats are computed once, even if it occurs in several contrasts
+
+        for condition in conditions:
+            precomputed_stats[condition] = self._compute_mu_and_sigma(
+                adata, contrast_column=contrast_column, condition=condition
+            )
+
+        for condition in contrasts_combo:  # here `condition` is a (condition_1, condition_2) pair
+            _rnk_stats, _num_cells = self._compute_s2n(
+                adata,
+                contrast_column=contrast_column,
+                condition_1=condition[0],
+                condition_2=condition[1],
+                precomputed_stats=precomputed_stats,
+            )
+            rnk_stats.append(_rnk_stats)
+            num_cells.append(_num_cells)
+        return pd.concat(rnk_stats, axis=1), pd.concat(num_cells, axis=0)  # genes x contrasts, contrasts x cell counts
+
+    def run_one_enrichment_test(
+        self,
+        adata: AnnData,
+        df: pd.DataFrame,
+        celltype_combo: tuple[str, str] = ("B cell", "B_cell"),
+        celltype_column: str = "cell_type",
+        contrasts_combo: tuple[str, str] | list[tuple[str, str]] | None = None,
+        contrast_column: str = "disease_state",
+        direction: Literal["upregulated", "downregulated", "both"] = "upregulated",
+        # Filtering parameters for gene set construction
+        threshold_lfc: float = 1.0,
+        threshold_expression: float = 0.0,
+        threshold_pval: float = 0.01,
+        # GSEA parameters
+        min_size: int = 10,
+        max_size: int = 1000,
+        permutation_num: int = 1000,
+        weight: float = 1.0,
+        seed: int = 2025,
+        verbose: bool = False,
+        threads: int = 6,
+    ) -> pd.DataFrame | None:
+        """Computes cytokine enrichment activity in one celltype using GSEA scoring.
+
+        1. "Looks up" query cell type in human cytokine dictionary and retrieves associated up-/downregulated genes per cytokine as reference.
+        2. Creates ranking of query data genes contrasting condition1 vs condition2. A continuum from genes most associated with condition1 (top) to genes most associated with condition2 (bottom)
+        3. Computes enrichment of each cytokine by matching their associated gene set in the ranked list.
+
+        Parameters
+        ----------
+        - adata
+            The query adata object.
+        - df
+            Human Cytokine Dictionary
+        - celltype_combo
+            A tuple with the celltype name of query adata in first position and respective celltype name of df in second position. Simulates "lookup of query in dictionary".
+        - celltype_column
+            Column name of adata.obs object that stores the cell types.
+        - contrasts_combo
+            Tuple that stores two biological conditions that are compared to each other in enrichment. E.g., which cytokines are enriched in healthy samples vs disease samples? Can be a list of tuples, function automatically loops through them. Any other type (including the default None) raises TypeError.
+        - contrast_column
+            Column name of adata.obs object that stores the biological condition of samples.
+        - direction
+            "upregulated", "downregulated", or "both" are valid input. Up-/downregulation w.r.t condition1 (condition1 is the first of the two elements in each contrasts tuple).
+        - threshold_pval
+            Constructs the gene set: Filters for genes in human df with an adj. p-val lower than threshold_pval.
+        - threshold_lfc
+            Constructs the gene set: Filters for genes in human df that are up/downregulated with a lfc higher than threshold_lfc.
+        - threshold_expression
+            Filters out genes with mean gene expression across all cells lower than threshold_expression.
+        - min_size, max_size
+            Bounds on gene set size, forwarded to blitzgsea.
+        - permutation_num
+            Number of permutations, forwarded to blitzgsea.
+        - seed
+            Random seed, forwarded to blitzgsea.
+        - weight, threads
+            Stored in the output table only; they are not passed to blitzgsea.
+        - verbose
+            If True, print progress messages.
+
+        Returns:
+        -------
+        - results
+            A DataFrame with all computed enrichment scores and statistical parameters. Not filtered by significance or robustness yet. None if the query cell type is not present in adata.
+        """
+        if isinstance(contrasts_combo, tuple):
+            contrasts_combo = [contrasts_combo]
+        elif not isinstance(contrasts_combo, list):
+            raise TypeError("contrasts_combo must be a (condition_1, condition_2) tuple or a list of such tuples.")
+
+        celltype_adata = celltype_combo[0]
+        celltype_signature = celltype_combo[1]
+
+        # allows potential loop of celltype combos to continue
+        if celltype_adata not in adata.obs[celltype_column].unique():
+            print(
+                f"'{celltype_adata}' is not present in celltype_column ({celltype_column}) of query adata. Skipping enrichment test of this celltype.\n"
+            )
+            return None
+
+        # filter for cell type
+        _vprint("Filter for cell type:", verbose)
+        adata = adata[adata.obs[celltype_column] == celltype_adata]
+        _vprint("Filter for cell type: done.", verbose)
+
+        # filter based on gene expression
+        _vprint("Filter for gene expression:", verbose)
+        adata = adata[:, adata.X.mean(axis=0) >= threshold_expression]
+        _vprint("Filter for gene expression: done.", verbose)
+
+        # get genesets
+        _vprint("Get gene sets:", verbose)
+        gene_set_dict, gene_set_df = self._get_genesets(
+            adata=adata,
+            df=df,
+            celltype_signature=celltype_signature,
+            direction=direction,
+            threshold_pval=threshold_pval,
+            threshold_lfc=threshold_lfc,
+        )
+
+        _vprint("Get gene sets: done.", verbose)
+
+        # compute ranking stat
+        _vprint("Get ranking stats:", verbose)
+        rnk_stats, num_cells_per_condition = self._compute_ranking_statistic(
+            adata, contrast_column=contrast_column, contrasts_combo=contrasts_combo
+        )
+        _vprint("Get ranking stats: done.", verbose)
+        results = []
+
+        for contrast_name in rnk_stats.columns:
+            print(contrast_name)
+            # format stat so that it can be processed by blitzgsea. E.g., needs col "0": genenames, and "1": scores
+            rnk = (
+                rnk_stats.loc[:, contrast_name]
+                .replace([np.inf, -np.inf], np.nan)
+                .dropna()
+                .sort_values(ascending=False)
+                .to_frame()
+                .reset_index()
+                .rename(columns={"index": "0", contrast_name: "1"})
+            )
+
+            # run enrichment with blitzgsea (replaces the earlier gseapy prerank call; the output format differs slightly).
+            # Forward the GSEA hyperparameters so that the values stored in the results table below
+            # are the ones that were actually used.
+            _res = blitzgsea.gsea(
+                rnk, gene_set_dict, permutations=permutation_num, min_size=min_size, max_size=max_size, seed=seed
+            )
+
+            _res.loc[:, "Term"] = _res.index
+            _res.loc[:, "contrast"] = contrast_name
+            _res.loc[:, "num_cells_1"] = num_cells_per_condition.loc[contrast_name, "num_cells_1"]
+            _res.loc[:, "num_cells_2"] = num_cells_per_condition.loc[contrast_name, "num_cells_2"]
+            _res.loc[:, "percent_duplicate_ranking_stats"] = (rnk["1"].duplicated(keep="first").sum() / rnk.shape[0]) * 100
+            results.append(_res)
+            _vprint(f"{contrast_name}: done.", verbose)
+
+        # combine results and save hyperparams
+        results = pd.concat(results, axis=0, ignore_index=True)
+        results.loc[:, "celltype_adata"] = celltype_adata
+        results.loc[:, "celltype_signature"] = celltype_signature
+        results.loc[:, "celltype_combo"] = f"{celltype_adata} ({celltype_signature})"
+        results.loc[:, "direction"] = direction
+        results.loc[:, "threshold_pval"] = threshold_pval
+        results.loc[:, "threshold_lfc"] = threshold_lfc
+        results.loc[:, "threshold_expression"] = threshold_expression
+        results.loc[:, "min_size"] = min_size
+        results.loc[:, "max_size"] = max_size
+        results.loc[:, "permutation_num"] = permutation_num
+        results.loc[:, "weight"] = weight
+        results.loc[:, "seed"] = seed
+        results.loc[:, "threads"] = threads
+
+        required_for_hcd = ["log_fc", "adj_p_value", "cytokine"]
+        if set(required_for_hcd).issubset(df.columns):
+            results.rename({"Term": "cytokine"}, inplace=True, axis=1)
+            results = pd.merge(results, gene_set_df, on="cytokine")
+        elif "CIP" in df.columns:
+            results.rename({"Term": "CIP"}, inplace=True, axis=1)
+            results = pd.merge(results, gene_set_df, on="CIP")
+            results.direction = "upregulated"
+        elif "query_program" in df.columns:
+            results.rename({"Term": "query_program"}, inplace=True, axis=1)
+            results = pd.merge(results, gene_set_df, on="query_program")
+            results.direction = "custom input"
+
+        return results

From 768d0f9df500c2bd4a26ed7c92e8b0441819385b Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Tue, 6 Jan 2026 19:02:50 +0100
Subject: [PATCH 02/11] added robustness_test.py from huCIRA package

---
 pertpy/tools/__init__.py |   2 +-
 pertpy/tools/_hucira.py  | 307 ++++++++++++++++++++++++++++++++++++++-
 2 files changed, 307 insertions(+), 2 deletions(-)

diff --git a/pertpy/tools/__init__.py b/pertpy/tools/__init__.py
index 5105cf46..2d765ea8 100644
--- a/pertpy/tools/__init__.py
+++ b/pertpy/tools/__init__.py
@@ -7,7 +7,7 @@
 from pertpy.tools._distances._distance_tests import DistanceTest
 from pertpy.tools._distances._distances import Distance
 from pertpy.tools._enrichment import Enrichment
-from pertpy.tools._hucira import hucira
+from pertpy.tools._hucira import Hucira
 from pertpy.tools._milo import Milo
 from pertpy.tools._mixscape import Mixscape
 from pertpy.tools._perturbation_space._clustering import ClusteringSpace
diff --git a/pertpy/tools/_hucira.py b/pertpy/tools/_hucira.py
index 78b2a62a..74e5f6d7 100644
--- a/pertpy/tools/_hucira.py
+++ b/pertpy/tools/_hucira.py
@@ -1,10 +1,15 @@
+import re
+import warnings
+from pathlib import Path
 from typing import Literal
 
 import blitzgsea
 import gseapy as gp
 import numpy as np
 import pandas as pd
+import scanpy as sc
 from anndata import AnnData
+from tqdm.auto import tqdm
 
 
 def _vprint(msg, verbose):
@@ -12,7 +17,83 @@ def _vprint(msg, verbose):
         print(msg)
 
 
-class hucira:
+class Hucira:
+    def load_human_cytokine_dict(self, save_dir="", force_download=False, exclude_well_biased_genes=True):
+        """Download and load our Human Cytokine Dictionary from Parse Biosciences.
+
+        https://www.parsebiosciences.com/datasets/10-million-human-pbmcs-in-a-single-experiment/.
+
+        Parameters
+        ----------
+        save_dir : str or pathlib.Path
+            Directory where the file will be saved. An empty string means the current working directory.
+        force_download : bool
+            Allows user to force a fresh download
+        exclude_well_biased_genes : bool
+            If True, exclude genes that are well biased according to our analysis
+            in the original publication.
+
+        Returns:
+        -------
+        cytokine_dict : pandas.DataFrame
+            Human Cytokine Dictionary as a DataFrame.
+        """
+        url = "https://cdn.parsebiosciences.com/gigalab/10m/DEGs.csv"
+        # save_dir may be a str or a Path; normalise it so .mkdir() and "/" below work for both.
+        save_dir = Path(save_dir) if save_dir != "" else Path.cwd()
+        save_dir.mkdir(parents=True, exist_ok=True)
+        local_path = save_dir / "human_cytokine_dict.csv"
+
+        if force_download or not local_path.exists():
+            print("Downloading Human Cytokine Dictionary from Parse Biosciences...")
+            cytokine_dict = pd.read_csv(url, index_col=0)
+            cytokine_dict = cytokine_dict.reset_index(drop=True)
+            cytokine_dict.to_csv(local_path)
+        else:
+            print(f"Loading from: {local_path}")
+            cytokine_dict = pd.read_csv(local_path, index_col=0)
+            cytokine_dict = cytokine_dict.reset_index(drop=True)
+
+        if exclude_well_biased_genes:
+            cytokine_dict = cytokine_dict.loc[~cytokine_dict.well_biased]
+
+        return cytokine_dict
+
+    def load_cytokine_info(self, save_dir="", force_download=False):
+        """Download and load Cytokine information sheet: includes information about sender and receptor genes (for cell-cell communication plot).
+
+        Parameters
+        ----------
+        save_dir : str or pathlib.Path
+            Directory where the file will be saved. An empty string means the current working directory.
+        force_download : bool
+            Allows user to force a fresh download
+
+        Returns:
+        -------
+        cytokine_info : pandas.DataFrame
+        """
+        url = (
+            "https://raw.githubusercontent.com/theislab/huCIRA/"
+            "main/src/hucira/data/"
+            "20250125_cytokine_info_with_functional_classification_LV.xlsx"
+        )
+
+        # save_dir may be a str or a Path; normalise it so .mkdir() and "/" below work for both.
+        save_dir = Path(save_dir) if save_dir != "" else Path.cwd()
+        save_dir.mkdir(parents=True, exist_ok=True)
+        local_path = save_dir / "cytokine_info.xlsx"
+
+        if force_download or not local_path.exists():
+            print("Downloading Cytokine Information sheet...")
+            cytokine_info = pd.read_excel(url, sheet_name="all_cytokines", engine="openpyxl")
+            cytokine_info.to_excel(local_path, sheet_name="all_cytokines", index=False)  # no index column, so a cached reload has the same columns
+        else:
+            print(f"Loading from: {local_path}")
+            cytokine_info = pd.read_excel(local_path)
+
+        return cytokine_info
+
     def _get_genesets(
         self,
         adata: AnnData,
@@ -372,3 +453,227 @@ def run_one_enrichment_test(
             results.direction = "custom input"
 
         return results
+
+    def _check_robustness_fractions(
+        self,
+        df_pivot,
+        threshold_qval=0.1,  # adjusted p value
+        threshold_valid=0.1,  # fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
+        threshold_below_alpha=0.75,  # fraction of results that need to be significant
+    ):
+        n_total = np.prod(df_pivot.shape)  # number of cells in the pivot table
+        n_valid = n_total - df_pivot.isna().sum().sum()  # non-NaN entries
+        n_below_alpha = (
+            (df_pivot < threshold_qval).sum().sum()
+        )  # number of results below pval threshold, i.e., number of significant results
+        frac_valid_results = n_valid / n_total
+        frac_pval_below_alpha = n_below_alpha / n_valid  # fraction of significant results relative to valid results. NOTE(review): n_valid is 0 for an all-NaN pivot — confirm that case is acceptable
+        is_robust = (frac_pval_below_alpha > threshold_below_alpha) & (frac_valid_results > threshold_valid)  # both conditions must hold (strict >)
+        return frac_valid_results, frac_pval_below_alpha, is_robust
+
+    def check_robustness(
+        self,
+        all_results,
+        threshold_qval=0.1,
+        threshold_valid=0.1,
+        threshold_below_alpha=0.9,
+    ):
+        """Filters for robust and significant results (<threshold_qval/alpha) out of original enrichments (run_enrichment_test() output).
+
+        Returns only the enrichments that are stable across many different tests and that are statistically significant.
+
+
+        Parameters
+        ----------
+        - all_results
+            The DataFrame output from run_enrichment_test().
+        - threshold_qval
+            Threshold that checks significance of results (leniently). Result is considered significant if its q-val is below this threshold.
+        - threshold_valid
+            The fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
+        - threshold_below_alpha
+            The fraction of results that need to be significant
+
+
+        Returns:
+        -------
+        - robust_results
+            DataFrame with robust and significant enrichments (includes min and max of nes)
+
+        """
+        all_thresholds_expression = all_results.threshold_expression.sort_values(ascending=False).unique()
+        all_thresholds_lfc = sorted(all_results.threshold_lfc.unique())
+
+        df = pd.DataFrame(index=all_thresholds_expression, columns=all_thresholds_lfc)  # empty (all-NaN) grid of every threshold combination
+        df.index.rename("threshold_expression", inplace=True)
+        df.columns.rename("threshold_lfc", inplace=True)
+
+        robust_results = []
+
+        # Get gene_program name of your enrichment analysis.
+        if "cytokine" in all_results.columns:
+            gene_program = "cytokine"
+        elif "CIP" in all_results.columns:
+            gene_program = "CIP"
+        elif "query_program" in all_results.columns:
+            gene_program = "query_program"
+        else:
+            raise ValueError("Missing column that is defining gene programs in 'all_results'.")
+            return  # NOTE(review): unreachable after the raise above
+
+        for contrast in tqdm(all_results.contrast.unique()):
+            for celltype_combo in all_results.celltype_combo.unique():
+                results_ct = all_results.loc[
+                    (all_results.celltype_combo == celltype_combo) & (all_results.contrast == contrast)
+                ]
+                for program in results_ct[gene_program].unique():
+                    results_ct_cy = results_ct.loc[results_ct[gene_program] == program]
+                    df_pivot = results_ct_cy.pivot(index="threshold_expression", columns="threshold_lfc", values="fdr")
+                    with warnings.catch_warnings():
+                        warnings.simplefilter(action="ignore", category=FutureWarning)
+                        df_combined = pd.concat([df, df_pivot])
+                    df_merged = df_combined.combine_first(df_pivot)
+                    df_merged = df_merged.loc[~df_merged.index.duplicated()]
+                    df_pivot = df_merged.loc[all_thresholds_expression, all_thresholds_lfc].astype(float)  # fdr on the full threshold grid; combinations without a result stay NaN
+                    frac_valid_results, frac_pval_below_alpha, is_robust = self._check_robustness_fractions(
+                        df_pivot,
+                        threshold_qval=threshold_qval,
+                        threshold_valid=threshold_valid,
+                        threshold_below_alpha=threshold_below_alpha,
+                    )
+
+                    if is_robust:
+                        robust_results.append(
+                            (
+                                celltype_combo,
+                                contrast,
+                                program,
+                                frac_valid_results,
+                                frac_pval_below_alpha,
+                                is_robust,
+                                results_ct_cy.nes.min(),
+                                results_ct_cy.nes.max(),
+                                threshold_qval,
+                                threshold_below_alpha,
+                            )
+                        )
+
+        robust_results = pd.DataFrame(robust_results).rename(  # positional tuple fields -> named columns
+            {
+                0: "celltype_combo",
+                1: "contrast",
+                2: gene_program,
+                3: "frac_valid",
+                4: "frac_significant",
+                5: "is_robust",
+                6: "NES_min",
+                7: "NES_max",
+                8: "qval_threshold",
+                9: "threshold_frac_below_alpha",
+            },
+            axis=1,
+        )
+        return robust_results
+
+    def get_robust_significant_results(self, results, alphas=None, threshold_valid=0.1, threshold_below_alpha=0.9):
+        """Function Wrapper: Filters for robust and significant results across several alpha/q-val from original enrichments (run_enrichment_test() output).
+
+        Returns only the enrichments that are statistically significant (q-val), and stable across many different tests (per contrast).
+        Calls check_robustness for different qval thresholds to explore more stringent significance thresholds. Use for visualization of results (e.g. in a heatmap). If using thresholds [0.1, 0.05, 0.01] for significant testing, returns significance notations as well (*, **, ***)
+
+        Parameters
+        ----------
+        - results
+            The DataFrame output from run_enrichment_test().
+        - alphas
+            List of thresholds (q-val) to check significance of results. Result is considered significant if its q-val is below this threshold.
+        - threshold_valid
+            The fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
+        - threshold_below_alpha
+            The fraction of results that need to be significant
+
+        Returns:
+        -------
+        - robust_results_dict
+            Dictionary mapping contrasts to lists of the enrichment score results (pivot_df), their significance annotations (annot_df), and significance thresholds (robust_sub).
+            robust_results_dict = {contrast1: [pivot_df1, annot_df1, robust_sub1],
+                                   contrast2: [pivot_df2, annot_df2, robust_sub2]}
+            None is returned (after printing a notice) if no enrichment is robust at any of the alphas.
+        """
+        # default significant values (matching significance stars)
+        if alphas is None:
+            alphas = [0.1, 0.05, 0.01]
+
+        # Get gene_program name of your enrichment analysis.
+        if "cytokine" in results.columns:
+            gene_program = "cytokine"
+        elif "CIP" in results.columns:
+            gene_program = "CIP"
+        elif "query_program" in results.columns:
+            gene_program = "query_program"
+        else:
+            raise ValueError("Missing column that is defining gene programs in 'results'.")
+
+        results_robust = [
+            self.check_robustness(
+                results,
+                threshold_qval=alpha,
+                threshold_valid=threshold_valid,
+                threshold_below_alpha=threshold_below_alpha,
+            )
+            for alpha in alphas
+        ]
+
+        results_robust = pd.concat(results_robust)
+
+        # if none of the results in the df pass the filter, exit out and don't return anything.
+        if results_robust.empty:
+            print("No robust results to process. Exiting function.")
+            return
+
+        results_robust = (
+            results_robust.groupby(["contrast", "celltype_combo", gene_program])["qval_threshold"]
+            .min()
+            .to_frame()
+            .reset_index()
+        )
+
+        results_mean = (
+            results.assign(nes=pd.to_numeric(results.nes, errors="coerce"))  # ensure numeric; the score column is lower-case "nes"
+            .fillna({"nes": 0})  # only fill NES
+            .groupby(["contrast", "celltype_combo", gene_program])["nes"]
+            .mean()
+            .to_frame()
+            .reset_index()
+        )
+
+        # Create separate robust results dict for every contrast pair.
+        robust_results_dict = {}
+        for contrast in results.contrast.unique():
+            subset = results_mean[results_mean.contrast == contrast]
+            pivot_df = subset.pivot(index=gene_program, columns="celltype_combo", values="nes")
+
+            # create empty annotation df
+            annot_df = pivot_df.copy().astype(object)
+            annot_df[:] = ""
+
+            # fill annotations based on results_robust
+            robust_sub = results_robust[results_robust.contrast == contrast]
+            for program in annot_df.index:
+                for celltype in annot_df.columns:
+                    qval = robust_sub.loc[
+                        (robust_sub[gene_program] == program) & (robust_sub.celltype_combo == celltype),
+                        "qval_threshold",
+                    ]
+                    if len(qval) != 0:
+                        qval = qval.values[0]
+                        if qval == 0.1:
+                            annot_df.loc[program, celltype] = "*"
+                        elif qval == 0.05:
+                            annot_df.loc[program, celltype] = "**"
+                        elif qval == 0.01:
+                            annot_df.loc[program, celltype] = "***"
+
+            robust_results_dict[contrast] = [pivot_df, annot_df, robust_sub]
+
+        return robust_results_dict

From afafba301f0eb50016591cf50e9355651b205ba0 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Sun, 11 Jan 2026 14:47:24 +0100
Subject: [PATCH 03/11] Modified dict loading and added pl tools and sender
 receiver tl.

---
 pertpy/data/__init__.py  |   2 +
 pertpy/data/_datasets.py |  35 ++
 pertpy/tools/_hucira.py  | 706 ++++++++++++++++++++++++++++++++++++---
 3 files changed, 691 insertions(+), 52 deletions(-)

diff --git a/pertpy/data/__init__.py b/pertpy/data/__init__.py
index d8ccfec5..9a23f0a7 100644
--- a/pertpy/data/__init__.py
+++ b/pertpy/data/__init__.py
@@ -25,6 +25,7 @@
     gehring_2019,
     haber_2017_regions,
     hagai_2018,
+    human_cytokine_dict,
     kang_2018,
     mcfarland_2020,
     norman_2019,
@@ -84,6 +85,7 @@
     "gehring_2019",
     "haber_2017_regions",
     "hagai_2018",
+    "human_cytokine_dict",
     "kang_2018",
     "mcfarland_2020",
     "norman_2019",
diff --git a/pertpy/data/_datasets.py b/pertpy/data/_datasets.py
index 97115e28..2b548aa5 100644
--- a/pertpy/data/_datasets.py
+++ b/pertpy/data/_datasets.py
@@ -1,5 +1,6 @@
 from pathlib import Path
 
+import pandas as pd
 import scanpy as sc
 from anndata import AnnData
 from mudata import MuData
@@ -1598,3 +1599,37 @@ def hagai_2018() -> AnnData:  # pragma: no cover
     adata = sc.read_h5ad(output_file_path)
 
     return adata
+
+
+def human_cytokine_dict(exclude_well_biased_genes: bool = True) -> pd.DataFrame:
+    r"""Human Cytokine Dictionary curated from PBMC allows you to infer differential cytokine activity.
+
+    The Human Cytokine Dictionary was created from single-cell RNA-seq of 9,697,974 human peripheral blood mononuclear cells (PBMC) from 12 donors stimulated in vitro with 87 different cytokines. The object is a dataframe representing cytokine activity as differentially expressed genes after cytokine perturbation.
+
+    Args:
+        exclude_well_biased_genes: If True, rows whose ``well_biased`` column is True are dropped.
+
+    References:
+        Oesinghaus, Lukas and Becker, S{\"o}ren and Vornholz, Larsen et al. (full citation to be added)
+
+    Returns:
+        Pandas DataFrame read from the cached CSV, without the cytokines "TGF-beta1", "IL-18" and "C3a".
+    """
+    output_file_name = "human_cytokine_dict.csv"
+    output_file_path = settings.datasetdir / output_file_name
+    if not Path(output_file_path).exists():
+        _download(
+            url="https://cdn.parsebiosciences.com/gigalab/10m/DEGs.csv",
+            output_file_name=output_file_name,
+            output_path=settings.datasetdir,
+            is_zip=False,
+        )
+
+    cytokine_dict = pd.read_csv(output_file_path, index_col=0)
+    revision_cytokines = ["TGF-beta1", "IL-18", "C3a"]
+    cytokine_dict = cytokine_dict[~cytokine_dict["cytokine"].isin(revision_cytokines)]
+    cytokine_dict = cytokine_dict.reset_index(drop=True)
+
+    if exclude_well_biased_genes:
+        cytokine_dict = cytokine_dict.loc[~cytokine_dict.well_biased]
+    return cytokine_dict
diff --git a/pertpy/tools/_hucira.py b/pertpy/tools/_hucira.py
index 74e5f6d7..ba03e6c9 100644
--- a/pertpy/tools/_hucira.py
+++ b/pertpy/tools/_hucira.py
@@ -1,3 +1,4 @@
+import os
 import re
 import warnings
 from pathlib import Path
@@ -5,10 +6,15 @@
 
 import blitzgsea
 import gseapy as gp
+import matplotlib.lines as mlines
+import matplotlib.pyplot as plt
 import numpy as np
 import pandas as pd
 import scanpy as sc
+import seaborn as sns
 from anndata import AnnData
+from bokeh.palettes import all_palettes
+from pycirclize import Circos
 from tqdm.auto import tqdm
 
 
@@ -18,47 +24,6 @@ def _vprint(msg, verbose):
 
 
 class Hucira:
-    def load_human_cytokine_dict(self, save_dir="", force_download=False, exclude_well_biased_genes=True):
-        """Download and load our Human Cytokine Dictionary from Parse Biosciences.
-
-        https://www.parsebiosciences.com/datasets/10-million-human-pbmcs-in-a-single-experiment/.
-
-        Parameters
-        ----------
-        save_dir : str
-            Directory where the file will be saved.
-        force_download : bool
-            Allows user to force a fresh download
-        exclude_well_biased_genes : bool
-            If True, exclude genes that are well biased according to our analysis
-            in the original publication.
-
-        Returns:
-        -------
-        cytokine_dict : pandas.DataFrame
-            Human Cytokine Dictionary adata object.
-        """
-        url = "https://cdn.parsebiosciences.com/gigalab/10m/DEGs.csv"
-        if save_dir == "":
-            save_dir = Path.cwd()
-        save_dir.mkdir(parents=True, exist_ok=True)
-        local_path = save_dir / "human_cytokine_dict.csv"
-
-        if force_download or not Path.exists(local_path):
-            print("Downloading Human Cytokine Dictionary from Parse Biosciences...")
-            cytokine_dict = pd.read_csv(url, index_col=0)
-            cytokine_dict = cytokine_dict.reset_index(drop=True)
-            cytokine_dict.to_csv(local_path)
-        else:
-            print(f"Loading from: {local_path}")
-            cytokine_dict = pd.read_csv(local_path, index_col=0)
-            cytokine_dict = cytokine_dict.reset_index(drop=True)
-
-        if exclude_well_biased_genes:
-            cytokine_dict = cytokine_dict.loc[~cytokine_dict.well_biased]
-
-        return cytokine_dict
-
     def load_cytokine_info(self, save_dir="", force_download=False):
         """Download and load Cytokine information sheet: includes information about sender and receptor genes (for cell-cell communication plot).
 
@@ -375,6 +340,10 @@ def run_one_enrichment_test(
             threshold_lfc=threshold_lfc,
         )
 
+        gene_set_dict = {
+            key: gene_set for key, gene_set in gene_set_dict.items() if min_size < len(gene_set) < max_size
+        }
+
         _vprint("Get gene sets: done.", verbose)
 
         # compute ranking stat
@@ -413,7 +382,8 @@ def run_one_enrichment_test(
                 threads=threads,
             )
             """
-            _res = blitzgsea.gsea(rnk, gene_set_dict)
+
+            _res = blitzgsea.gsea(rnk, gene_set_dict, permutations=permutation_num)
 
             _res.loc[:, "Term"] = _res.index
             _res.loc[:, "contrast"] = contrast_name
@@ -456,10 +426,10 @@ def run_one_enrichment_test(
 
     def _check_robustness_fractions(
         self,
-        df_pivot,
-        threshold_qval=0.1,  # adjusted p value
-        threshold_valid=0.1,  # fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
-        threshold_below_alpha=0.75,  # fraction of results that need to be significant
+        df_pivot: pd.DataFrame,
+        threshold_qval: float = 0.1,  # adjusted p value
+        threshold_valid: float = 0.1,  # fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
+        threshold_below_alpha: float = 0.75,  # fraction of results that need to be significant
     ):
         n_total = np.prod(df_pivot.shape)
         n_valid = n_total - df_pivot.isna().sum().sum()
@@ -473,10 +443,10 @@ def _check_robustness_fractions(
 
     def check_robustness(
         self,
-        all_results,
-        threshold_qval=0.1,
-        threshold_valid=0.1,
-        threshold_below_alpha=0.9,
+        all_results: pd.DataFrame,
+        threshold_qval: float = 0.1,
+        threshold_valid: float = 0.1,
+        threshold_below_alpha: float = 0.9,
     ):
         """Filters for robust and significant results (<threshold_qval/alpha) out of original enrichments (run_enrichment_test() output).
 
@@ -575,7 +545,13 @@ def check_robustness(
         )
         return robust_results
 
-    def get_robust_significant_results(self, results, alphas=None, threshold_valid=0.1, threshold_below_alpha=0.9):
+    def get_robust_significant_results(
+        self,
+        results: pd.DataFrame,
+        alphas: list[float] | None = None,
+        threshold_valid: float = 0.1,
+        threshold_below_alpha: float = 0.9,
+    ):
         """Function Wrapper: Filters for robust and signifcant results across several alpha/q-val from original enrichments (run_enrichment_test() output).
 
         Returns only the enrichments that are statistically significant (q-val), and stable across many different tests (per contrast).
@@ -639,7 +615,7 @@ def get_robust_significant_results(self, results, alphas=None, threshold_valid=0
         )
 
         results_mean = (
-            results.assign(NES=pd.to_numeric(results.NES, errors="coerce"))  # ensure numeric
+            results.assign(nes=pd.to_numeric(results.nes, errors="coerce"))  # ensure numeric
             .fillna({"nes": 0})  # only fill NES
             .groupby(["contrast", "celltype_combo", gene_program])["nes"]
             .mean()
@@ -677,3 +653,629 @@ def get_robust_significant_results(self, results, alphas=None, threshold_valid=0
             robust_results_dict[contrast] = [pivot_df, annot_df, robust_sub]
 
         return robust_results_dict
+
+    def _get_senders(
+        self,
+        adata: AnnData,
+        cytokine_info: pd.DataFrame,
+        cytokine: str = "IL-32-beta",
+        show: bool = False,
+        column_cell_type: str = "cell_type",
+    ) -> pd.DataFrame | None:
+        """Rank the producing gene(s) of one cytokine across cell types and summarize their expression.
+
+        Parameters
+        ----------
+        adata : AnnData
+            Query data; only the producing genes found in `adata.var_names` are used.
+        cytokine_info : pd.DataFrame
+            Table with a `name` column and a `gene` column listing the producing genes separated by ", ".
+        cytokine : str, default "IL-32-beta"
+            Cytokine whose producing genes are analysed.
+        show : bool, default False
+            Currently unused.
+        column_cell_type : str, default "cell_type"
+            Column of `adata.obs` used to group the cells.
+
+        Returns:
+        -------
+        pd.DataFrame or None
+            One row per cell type, or None if no producing gene is listed for `cytokine` or found in `adata`.
+        """
+        gene_entries = cytokine_info.loc[cytokine_info.name == cytokine, "gene"]
+        if gene_entries.isna().all():  # also covers a cytokine that is absent from cytokine_info
+            print(f"No producing gene found in cytokine_info for cytokine: {cytokine}")
+            return None
+        genes = np.unique(re.split(", ", gene_entries.values[0]))
+        mask = np.isin(genes, adata.var_names)
+        if not mask.any():
+            print(f"None of the cytokine producing genes ({genes}) were found in dataset for cytokine {cytokine}.")
+            return None
+        if not mask.all():
+            print(
+                f"The following cytokine producing genes were not found in the dataset and are excluded: {genes[~mask]}"
+            )
+            genes = genes[mask]
+        adata = adata[:, genes]
+
+        # Ranks gene(s) of query sender cytokine across immune cell types.
+        adata_out = sc.tl.rank_genes_groups(
+            adata,
+            groupby=column_cell_type,
+            copy=True,
+            use_raw=False,
+            method="wilcoxon",
+        )
+        result = adata_out.uns["rank_genes_groups"]
+
+        # Long table: one row per (cell type, gene) with the rank_genes_groups statistics.
+        stat_cols = ["logfoldchanges", "pvals", "pvals_adj"]
+        rank_genes_df = pd.concat(
+            [
+                pd.DataFrame({"gene": result["names"][g], **{c: result[c][g] for c in stat_cols}, column_cell_type: g})
+                for g in result["names"].dtype.names
+            ],
+            axis=0,
+        )
+        grouped = rank_genes_df.set_index(column_cell_type).groupby(column_cell_type)
+
+        # Per cell type keep the statistics of the limiting gene (smallest log fold change among the genes).
+        limiting_rows = []
+        for celltype in grouped.groups:
+            celltype_df = grouped.get_group(celltype)
+            limiting_gene_idx = np.argmin(celltype_df["logfoldchanges"].values)
+            limiting_row = celltype_df.iloc[limiting_gene_idx][stat_cols].to_frame().T
+            limiting_row["gene"] = ", ".join(celltype_df["gene"])
+            limiting_row.index = [celltype]
+            limiting_rows.append(limiting_row)
+        grouped_rank_genes_df_all = pd.concat(limiting_rows, axis=0).rename(
+            columns={"logfoldchanges": "min_logfoldchanges", "pvals": "min_pvals", "pvals_adj": "min_pvals_adj"}
+        )
+
+        # Expression values and expressed-or-not flags per cell, labelled with each cell's type.
+        X_df = adata.to_df()
+        frac_df = X_df > 0
+        X_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
+        frac_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
+        # take minimum average gene expression across all genes required for this sender
+        results_mean = X_df.groupby(column_cell_type, observed=False).mean().min(axis=1).to_frame("mean_X")
+        # take minimum expression fraction across all genes required for this sender
+        results_frac = frac_df.groupby(column_cell_type, observed=False).mean().min(axis=1).to_frame("frac_X")
+        # Final df with information about active sender cytokines.
+        results = pd.concat([grouped_rank_genes_df_all, results_mean, results_frac], axis=1)
+        results["mean_X>0"] = results["mean_X"].where(results["mean_X"] > 0, None)
+        results.loc[:, "cytokine"] = cytokine
+        return results
+
+    def _get_receivers(
+        self, adata: AnnData, cytokine_info: pd.DataFrame, cytokine: str, column_cell_type: str = "cell_type"
+    ) -> pd.DataFrame | None:
+        """Summarize receptor expression per cell type for one cytokine; None if no receptor genes are usable."""
+        # get the "receptor gene" entry of the cytokine_info row(s) whose name matches this cytokine
+        _receptor_genes = cytokine_info.loc[cytokine_info.name == cytokine, "receptor gene"]
+        if _receptor_genes.isna().all():
+            print(f"No receptor gene found in cytokine_info for cytokine: {cytokine}")
+            return None
+        assert len(_receptor_genes) == 1, _receptor_genes
+        _receptor_genes = _receptor_genes.values[0]
+        # there can be multiple receptors, separated by "; "
+        candidates = re.split("; ", _receptor_genes)
+        results_mean, results_frac = [], []
+        # each receptor may require the expression of multiple genes, separated by ", "
+        for candidate in candidates:
+            genes = np.array(re.split(", ", candidate))
+            mask = np.isin(genes, adata.var_names)
+            if not mask.any():
+                print(f"None of the cytokine receptor genes ({genes}) were found in dataset for cytokine {cytokine}.")
+                continue
+            if not mask.all():
+                print(
+                    f"The following cytokine receptor genes were not found in the dataset and are excluded: {genes[~mask]}"
+                )
+                genes = genes[mask]
+            X_df = adata[:, genes].to_df()
+            frac_df = X_df > 0
+            X_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
+            frac_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
+            # take minimum average gene expression across all genes required for this receptor
+            results_mean.append(X_df.groupby(column_cell_type, observed=False).mean().min(axis=1).to_frame())
+            # take minimum expression fraction across all genes required for this receptor
+            results_frac.append(frac_df.groupby(column_cell_type, observed=False).mean().min(axis=1).to_frame())
+        if len(results_mean) == 0:
+            return None
+        # combine the candidate receptors by taking the per-cell-type maximum of each statistic
+        results_mean = pd.concat(results_mean, axis=1).max(axis=1).to_frame().rename({0: "mean_X"}, axis=1)
+        results_frac = pd.concat(results_frac, axis=1).max(axis=1).to_frame().rename({0: "frac_X"}, axis=1)
+        results = pd.concat([results_mean, results_frac], axis=1)
+        results.loc[:, "cytokine"] = cytokine
+        return results
+
+    def get_one_senders_and_receivers(
+        self,
+        adata: AnnData,
+        cytokine_info: pd.DataFrame,
+        cytokine: str,
+        celltype_colname: str = "cell_type",
+        sender_pvalue_threshold: float = 0.1,
+        receiver_mean_X_threshold: float = 0,
+        sender_lfc_threshold: float = 0,
+    ) -> tuple[pd.DataFrame, pd.DataFrame]:
+        """Compute sender and receiver statistics for a single cytokine and apply the threshold filters.
+
+        Best for exploration purposes of a singular cytokine.
+
+        Parameters
+        ----------
+        adata : AnnData
+            Query adata object of analysis
+        cytokine_info : pd.DataFrame
+            Cytokine information table; its `name` column is matched against `cytokine`.
+        cytokine : str
+            Name of the cytokine to look up in `cytokine_info`.
+        celltype_colname : str, default "cell_type"
+            Column of `adata.obs` holding the cell type labels.
+        sender_pvalue_threshold : float, default 0.1
+            Sender rows are kept only if `min_pvals` is strictly below this value.
+        receiver_mean_X_threshold : float, default 0
+            Receiver rows are kept only if `mean_X` is strictly above this value.
+        sender_lfc_threshold : float, default 0
+            Sender rows are kept only if `min_logfoldchanges` is strictly above this value.
+
+        Returns:
+        -------
+        df_senders : pd.DataFrame or None
+            Filtered sender statistics per cell type; None is passed through if `_get_senders` returned None.
+        df_receivers : pd.DataFrame or None
+            Filtered receiver statistics per cell type; None is passed through if `_get_receivers` returned None.
+        """
+        # Both helpers are called with the same keyword arguments.
+        shared_kwargs = {"adata": adata, "cytokine_info": cytokine_info, "cytokine": cytokine}
+        df_senders = self._get_senders(column_cell_type=celltype_colname, **shared_kwargs)
+        df_receivers = self._get_receivers(column_cell_type=celltype_colname, **shared_kwargs)
+        if df_senders is not None:
+            significant = df_senders.min_pvals < sender_pvalue_threshold
+            upregulated = df_senders.min_logfoldchanges > sender_lfc_threshold
+            df_senders = df_senders.loc[significant & upregulated]
+        if df_receivers is not None:
+            df_receivers = df_receivers.loc[df_receivers.mean_X > receiver_mean_X_threshold]
+        return df_senders, df_receivers
+
+    def get_all_senders_and_receivers(
+        self,
+        adata: AnnData,
+        cytokine_info: pd.DataFrame,
+        cytokine_list: list | None = None,
+        celltype_colname: str = "cell_type",
+        sender_pvalue_threshold: float = 0.1,
+        receiver_mean_X_threshold: float = 0,
+    ) -> tuple[pd.DataFrame, pd.DataFrame]:
+        """Collect cytokine sender and receiver statistics for a list of cytokines.
+
+        Calls `get_one_senders_and_receivers` per cytokine and stacks the results, e.g. as input for
+        `plot_communication`. A cytokine is kept only if both its sender and receiver tables are available.
+
+        Parameters
+        ----------
+        adata : AnnData
+            Query adata object of analysis
+        cytokine_info : pd.DataFrame
+            Cytokine information table, forwarded to `get_one_senders_and_receivers`.
+        cytokine_list : list
+            Cytokine names to process. Required despite the None default.
+        celltype_colname : str, default "cell_type"
+            Column of `adata.obs` holding the cell type labels.
+        sender_pvalue_threshold : float, default 0.1
+            Forwarded to `get_one_senders_and_receivers`.
+        receiver_mean_X_threshold : float, default 0
+            Forwarded to `get_one_senders_and_receivers`.
+
+        Returns:
+        -------
+        df_src : pd.DataFrame
+            All cytokine signal senders, with the cell type copied into a `celltype` column.
+        df_tgt : pd.DataFrame
+            All cytokine signal receivers, with the cell type copied into a `celltype` column.
+
+        Raises:
+        ------
+        ValueError
+            If `cytokine_list` is None, or if no cytokine yields both sender and receiver results.
+        """
+        if cytokine_list is None:
+            raise ValueError("cytokine_list must be a list of cytokine names, got None.")
+        senders, receivers = [], []
+        for cytokine in cytokine_list:
+            df_senders, df_receivers = self.get_one_senders_and_receivers(
+                adata=adata,
+                cytokine_info=cytokine_info,
+                cytokine=cytokine,
+                celltype_colname=celltype_colname,
+                sender_pvalue_threshold=sender_pvalue_threshold,
+                receiver_mean_X_threshold=receiver_mean_X_threshold,
+            )
+            if cytokine == "IL-32-beta":
+                # no known receptor genes - list every cell type as receiver with non-informative (inf) values.
+                all_celltypes = sorted(adata.obs[celltype_colname].unique())
+                df_receivers = pd.DataFrame(np.inf, index=all_celltypes, columns=["mean_X", "frac_X"])
+                df_receivers.loc[:, "cytokine"] = cytokine
+            if df_senders is not None and df_receivers is not None:
+                senders.append(df_senders.assign(celltype=df_senders.index))
+                receivers.append(df_receivers.assign(celltype=df_receivers.index))
+        if not senders:
+            raise ValueError("No cytokine in cytokine_list yielded both sender and receiver results.")
+        return pd.concat(senders), pd.concat(receivers)
+
+    ######## PLOTTING: #########
+
+    def _format_cytokine_names(self, x):
+        """Replace spelled-out Greek letters in cytokine name(s) with LaTeX math symbols; recurses into list-likes."""
+        if isinstance(x, (list, np.ndarray, pd.Index)):
+            return [self._format_cytokine_names(item) for item in x]
+        # Accept objects exposing get_text() as well as plain strings.
+        label = x.get_text() if hasattr(x, "get_text") else x
+        # Replacement order matters for equivalence with sequential str.replace calls.
+        for greek in ("beta", "alpha", "gamma", "lambda", "omega"):
+            label = label.replace(greek, f"$\\{greek}$")
+        return label
+
+    def plot_significant_results(
+        self,
+        results_pivot: pd.DataFrame,
+        df_annot: pd.DataFrame,
+        robust_results_dict: dict[str, list[pd.DataFrame]] | None = None,
+        selected_celltypes: list[str] | None = None,
+        selected_cytokines: list[str] | None = None,
+        fontsize: float = 6.0,
+        save_fig: bool = False,
+        fig_path: str = "",
+        fig_width: float = 10.0,
+        fig_height: float = 12.0,
+        title: str = "Contrast1_vs_Contrast2",
+    ):
+        """Plot robust enrichment results as annotated heatmaps, for a dict of contrasts or for a single contrast.
+
+        Parameters
+        ----------
+        results_pivot : pd.DataFrame
+            Enrichment scores of one contrast. Only used if `robust_results_dict` is None or empty.
+        df_annot : pd.DataFrame
+            Significance annotations shaped like `results_pivot`. Only used if `robust_results_dict` is None or empty.
+        robust_results_dict : dict, optional
+            Maps each contrast to a `[pivot, annotation, robust results]` triple, as returned by
+            get_robust_significant_results(). If given and non-empty it takes precedence over `results_pivot`
+            and `df_annot`, and all contrasts are drawn side by side in one figure.
+        selected_celltypes : list of str, optional
+            Cell types (columns) to show. Must be present in the results, otherwise the lookup fails.
+        selected_cytokines : list of str, optional
+            Cytokines (rows) to show. Must be present in the results, otherwise the lookup fails.
+        fontsize : float, default 6.0
+            Font size of annotations and tick labels.
+        save_fig : bool, default False
+            If True, the figure is written as SVG into `fig_path`, which is created if necessary.
+        fig_path : str, default ""
+            Output directory used when `save_fig` is True.
+        fig_width, fig_height : float, default 10.0 and 12.0
+            Size of one heatmap panel. The multi-contrast figure is `fig_width` times the number of contrasts wide.
+        title : str, default "Contrast1_vs_Contrast2"
+            Title of the single-contrast heatmap. Multi-contrast panels are titled with their contrast name.
+
+        Returns:
+        -------
+        Nothing. Plotting function only.
+        """
+        # Case 1: robust_results_dict is provided. This precedes the other arguments. Plots all contrasts together.
+        if robust_results_dict is not None and len(robust_results_dict) > 0:
+            n = len(robust_results_dict)
+            # One panel per contrast; every heatmap is drawn into its own axis of this single figure.
+            fig, axes = plt.subplots(1, n, squeeze=False, figsize=(fig_width * n, fig_height))
+
+            for ax, (contrast, (pivot, annot, _)) in zip(axes[0], robust_results_dict.items(), strict=True):
+                # Apply filtering if requested
+                if selected_celltypes:
+                    pivot = pivot.loc[:, selected_celltypes]
+                    annot = annot.loc[:, selected_celltypes]
+                if selected_cytokines:
+                    pivot = pivot.loc[selected_cytokines]
+                    annot = annot.loc[selected_cytokines]
+
+                sns.heatmap(
+                    pivot,
+                    square=True,
+                    annot=annot,
+                    cmap="RdBu_r",
+                    center=0,
+                    annot_kws={"fontsize": fontsize, "family": "sans-serif"},
+                    fmt="",
+                    linewidths=0.5,
+                    linecolor="white",
+                    cbar=True,
+                    cbar_kws={"shrink": 0.5, "fraction": 0.04, "pad": 0.02},
+                    ax=ax,
+                )
+
+                ax.set_title(contrast, fontsize=10)
+                ax.set_xlabel("")
+                ax.set_ylabel("")
+                ax.set_facecolor("lightgray")
+                ax.tick_params(axis="both", which="both", length=0)
+
+                # Axis labels
+                ax.set_xticks(0.5 + np.arange(pivot.shape[1]))
+                ax.set_xticklabels(pivot.columns, fontsize=fontsize, rotation=90, ha="center")
+                ax.set_yticks(0.5 + np.arange(pivot.shape[0]))
+                ax.set_yticklabels(self._format_cytokine_names(pivot.index), fontsize=fontsize, rotation=0, ha="right")
+
+            fig.tight_layout()
+            if save_fig:
+                fig_file = Path(fig_path) / "all_contrasts_significant_results.svg"
+                # Ensure the directory exists
+                fig_file.parent.mkdir(parents=True, exist_ok=True)
+                fig.savefig(fig_file, bbox_inches="tight", pad_inches=0, dpi=500)
+            plt.show()
+            return
+
+        # Case 2: single robust_result is provided, only the one chosen contrast comparison is plotted.
+        if isinstance(results_pivot, pd.DataFrame) and isinstance(df_annot, pd.DataFrame):
+            if selected_celltypes:
+                results_pivot = results_pivot.loc[:, selected_celltypes]
+                df_annot = df_annot.loc[:, selected_celltypes]
+            if selected_cytokines:
+                results_pivot = results_pivot.loc[selected_cytokines]
+                df_annot = df_annot.loc[selected_cytokines]
+
+            fig, ax = plt.subplots(figsize=(fig_width, fig_height))
+            sns.heatmap(
+                results_pivot,
+                square=True,
+                annot=df_annot,
+                cmap="RdBu_r",
+                center=0,
+                annot_kws={"fontsize": fontsize, "family": "sans-serif"},
+                fmt="",
+                linewidths=0.5,
+                linecolor="white",
+                cbar=True,
+                cbar_kws={"shrink": 0.5, "fraction": 0.04, "pad": 0.02},
+                ax=ax,
+            )
+            ax.set_title(title, fontsize=10)
+            ax.set_xlabel("")
+            ax.set_ylabel("")
+            ax.set_facecolor("lightgray")
+            ax.tick_params(axis="both", which="both", length=0)
+
+            # Axis labels
+            ax.set_xticks(0.5 + np.arange(results_pivot.shape[1]))
+            ax.set_xticklabels(results_pivot.columns, fontsize=fontsize, rotation=90, ha="center")
+            ax.set_yticks(0.5 + np.arange(results_pivot.shape[0]))
+            ax.set_yticklabels(
+                self._format_cytokine_names(results_pivot.index), fontsize=fontsize, rotation=0, ha="right"
+            )
+
+            if save_fig:
+                # Save before plt.show(): once the figure has been shown, plt.savefig may write an empty canvas.
+                fig_file = Path(fig_path) / "significant_results.svg"
+                fig_file.parent.mkdir(parents=True, exist_ok=True)
+                fig.savefig(fig_file, bbox_inches="tight", pad_inches=0, dpi=500)
+            plt.show()
+            return
+
+        print("Nothing was plotted. Check input data!")
+        return
+
+    def plot_communication(
+        self,
+        df_src: pd.DataFrame,
+        df_tgt: pd.DataFrame,
+        frac_expressing_cells_sender: float | None = 0.05,
+        frac_expressing_cells_receiver: float | None = 0.05,
+        mean_cytokine_gene_expression_sender: float | None = None,
+        mean_cytokine_gene_expression_receiver: float | None = None,
+        df_enrichment: pd.DataFrame | None = None,
+        all_celltypes: list | None = None,
+        cytokine2color: dict | None = None,
+        celltype2color: dict | None = None,
+        figsize: tuple[float, float] = (5, 5),
+        show_legend: bool = True,
+        save_path: str | None = None,
+        lw: float = 1.0,
+        fontsize: int = 6,
+        loc: str = "upper left",
+        bbox_to_anchor: tuple[float, float] = (1, 1),
+    ):
+        """Generates a Circos plot to visualize cell-cell communication based on cytokine producers and receivers.
+
+        The function filters the input dataframes based on thresholds for fraction of expressing cells
+        and mean cytokine gene expression, then creates a circular layout with cell type partitions
+        and draws directed links representing cytokine communication between producers and receivers.
+
+        Parameters
+        ----------
+        df_src : pd.DataFrame
+            DataFrame containing producer cell type and cytokine expression statistics,
+            typically from `_get_expression_stats`. Must have 'celltype', 'cytokine',
+            'mean_cytokine_gene_expression', and 'frac_expressing_cells' columns.
+        df_tgt : pd.DataFrame
+            DataFrame containing receiver cell type and cytokine expression statistics,
+            typically from `_get_expression_stats`. Must have 'celltype', 'cytokine',
+            'mean_cytokine_gene_expression', and 'frac_expressing_cells' columns.
+        frac_expressing_cells_sender : float | None, default 0.05
+            Minimum fraction of cells expressing a cytokine gene for a producer cell type.
+            If None, no filtering is applied.
+        frac_expressing_cells_receiver : float | None, default 0.05
+            Minimum fraction of cells expressing a cytokine gene for a receiver cell type.
+            If None, no filtering is applied.
+        mean_cytokine_gene_expression_sender : float | None, default None
+            Minimum mean expression of a cytokine gene for a producer cell type. If None, no filtering is applied.
+        mean_cytokine_gene_expression_receiver : float | None, default None
+            Minimum mean expression of a cytokine gene for a receiver cell type. If None, no filtering is applied.
+        df_enrichment : pd.DataFrame | None, optional
+            Optional dataframe with enrichment information. Default is None.
+        all_celltypes : list | None, optional
+            List of all cell types. If None, inferred from df_src and df_tgt.
+        cytokine2color : dict | None, optional
+            Optional mapping from cytokine names to colors.
+        celltype2color : dict | None, optional
+            Optional mapping from cell type names to colors.
+        figsize : tuple[float, float], default (5, 5)
+            Figure size for the plot.
+        show_legend : bool, default True
+            Whether to show the legend.
+        save_path : str | None, optional
+            Path to save the figure. If None, figure is not saved.
+        lw : float, default 1.0
+            Line width for links.
+        fontsize : int, default 6
+            Font size for labels.
+        loc : str, default "upper left"
+            Legend location.
+        bbox_to_anchor : tuple[float, float], default (1, 1)
+            Bounding box anchor for the legend.
+
+        """
+        if frac_expressing_cells_sender is not None:
+            df_src = df_src.loc[df_src.frac_X > frac_expressing_cells_sender]
+        if frac_expressing_cells_receiver is not None:
+            df_tgt = df_tgt.loc[df_tgt.frac_X > frac_expressing_cells_receiver]
+        if mean_cytokine_gene_expression_sender is not None:
+            df_src = df_src.loc[df_src.mean_X > mean_cytokine_gene_expression_sender]
+        if frac_expressing_cells_receiver is not None:
+            df_tgt = df_tgt.loc[df_tgt.mean_X > mean_cytokine_gene_expression_receiver]
+
+        if all_celltypes is None:
+            all_celltypes = sorted(np.union1d(df_src.celltype.unique(), df_tgt.celltype.unique()))
+        # celltype_colors = all_palettes["Set3"][len(all_celltypes)]
+        if celltype2color is None:
+            n = len(all_celltypes)
+
+            # Get first 20 colors from Category20
+            palette_20 = all_palettes["Category20"][20]
+            # Get 20 colors from Category20b
+            palette_20b = all_palettes["Category20b"][20]
+
+            # Combine palettes
+            combined_palette = palette_20 + palette_20b
+
+            if n > 40:
+                raise ValueError(f"Too many cell types ({n}) for available palettes (max 40).")
+
+            # Assign colors to cell types
+            celltype_colors = combined_palette[:n]
+            celltype2color = dict(zip(all_celltypes, celltype_colors, strict=True))
+
+        all_cytokines = np.union1d(df_src.cytokine.unique(), df_tgt.cytokine.unique())
+        cytokine2idx = {cytokine: k for k, cytokine in enumerate(all_cytokines)}
+        # cytokine_colors = all_palettes["Category20"][len(all_cytokines)]
+        # cytokine2color = dict(zip(all_cytokines, cytokine_colors, strict=True))
+
+        unique_cytokines = df_src.cytokine.unique()
+        if df_enrichment is not None:
+            significant_cytokines = df_enrichment.cytokine.unique()
+            unique_cytokines = np.intersect1d(unique_cytokines, significant_cytokines)
+
+        if cytokine2color is None:
+            cytokine_colors = all_palettes["Colorblind"][max(3, len(unique_cytokines))]
+            cytokine_colors = cytokine_colors[: len(unique_cytokines)]  # in case there are less than 3 unique cytokines
+            # cytokine_colors = all_palettes["Set3"][max(3, len(unique_cytokines))]
+            cytokine2color = dict(zip(unique_cytokines, cytokine_colors, strict=True))
+
+        # draw outer circle / cell type partitions
+        sectors = dict(zip(all_celltypes, (2 * len(all_cytokines) + 3) * np.ones(len(all_celltypes)), strict=True))
+
+        circos = Circos(sectors, space=3)
+        for sector in circos.sectors:
+            start, stop = sector.deg_lim
+            center = (start + stop) / 2
+            track = sector.add_track((92, 100))
+
+            if 160 >= center >= 20:
+                ha = "left"
+            elif 340 >= center >= 200:
+                ha = "right"
+            else:
+                ha = "center"
+
+            va = "bottom" if center < 90 or center > 270 else "top"
+
+            track.axis(facecolor=celltype2color[sector.name])
+            # track.text(shorten_cell_type_names(sector.name), color="black", size=6, r=110, rotation="horizontal", adjust_rotation=False, family="sans-serif", ha=ha)
+            track.text(
+                sector.name,
+                color="black",
+                size=fontsize,
+                r=110,
+                rotation="horizontal",
+                adjust_rotation=False,
+                family="sans-serif",
+                ha=ha,
+                va=va,
+            )
+
+        # draw links
+        legend_cytokine2color = {}
+        for _row_idx, row in df_src.iterrows():
+            src_celltype = row.celltype
+            cytokine_idx = cytokine2idx[row.cytokine]
+            tgt_celltypes = df_tgt.loc[df_tgt.cytokine == row.cytokine].celltype.unique()
+
+            for tgt_celltype in tgt_celltypes:
+                is_enriched = True  # default --> plot if enriched or whenever no enrichment info is provided
+
+                if df_enrichment is not None:
+                    df_enrichment.loc[:, "celltype"] = df_enrichment.celltype_combo.apply(lambda x: x.split(" (")[0])
+                    select = (df_enrichment.celltype == tgt_celltype) & (df_enrichment.cytokine == row.cytokine)
+                    is_enriched = df_enrichment.loc[select].shape[0] > 0
+
+                if is_enriched:
+                    linestyle = None
+                    _score = df_tgt.loc[
+                        (df_tgt.cytokine == row.cytokine) & (df_tgt.celltype == tgt_celltype), "mean_X"
+                    ].values
+                    assert len(_score) == 1
+                    if not np.isfinite(_score[0]):
+                        linestyle = "--"
+
+                    circos.link_line(
+                        (src_celltype, 1 + cytokine_idx),  # src node
+                        (tgt_celltype, 2 + len(all_cytokines) + cytokine_idx),  # tgt node
+                        direction=1,
+                        color=cytokine2color[row.cytokine],
+                        # color=celltype2color[src_celltype],
+                        lw=lw,
+                        arrow_height=8.0,
+                        arrow_width=8.0,
+                        linestyle=linestyle,
+                    )
+                    if row.cytokine not in legend_cytokine2color:
+                        legend_cytokine2color[row.cytokine] = cytokine2color[row.cytokine]
+
+        circos.plotfig(figsize=figsize)
+        plt.gca()
+
+        legend_handles = []
+        legend_labels = []
+        for cytokine, color in legend_cytokine2color.items():
+            legend_handles.append(mlines.Line2D([], [], color=color, lw=1.5))
+            legend_labels.append(cytokine)
+        if show_legend:
+            plt.legend(
+                handles=legend_handles,
+                labels=legend_labels,
+                title="Cytokines",
+                loc=loc,
+                bbox_to_anchor=bbox_to_anchor,
+                prop={"family": "sans-serif", "size": 6},
+                title_fontsize=6,
+            )
+        plt.tight_layout()
+        if save_path:
+            plt.savefig(
+                save_path,
+                bbox_inches="tight",
+                pad_inches=0,
+                transparent=True,
+                dpi=400,
+            )
+        plt.show()
+
+        return legend_handles, legend_labels

From 3193fdd8c104e29748cf45ee771fda22dcd05435 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Sun, 11 Jan 2026 22:25:22 +0100
Subject: [PATCH 04/11] added function wrapper run_all_enrichment_test()

---
 pertpy/tools/_hucira.py | 124 ++++++++++++++++++++++++++++++++++++----
 1 file changed, 114 insertions(+), 10 deletions(-)

diff --git a/pertpy/tools/_hucira.py b/pertpy/tools/_hucira.py
index ba03e6c9..aae49980 100644
--- a/pertpy/tools/_hucira.py
+++ b/pertpy/tools/_hucira.py
@@ -382,16 +382,20 @@ def run_one_enrichment_test(
                 threads=threads,
             )
             """
-
-            _res = blitzgsea.gsea(rnk, gene_set_dict, permutations=permutation_num)
-
-            _res.loc[:, "Term"] = _res.index
-            _res.loc[:, "contrast"] = contrast_name
-            _res.loc[:, "num_cells_1"] = num_cells_per_condition.loc[contrast_name, "num_cells_1"]
-            _res.loc[:, "num_cells_2"] = num_cells_per_condition.loc[contrast_name, "num_cells_2"]
-            _res.loc[:, "percent_duplicate_ranking_stats"] = (rnk.duplicated(keep="first").sum() / rnk.shape[0]) * 100
-            results.append(_res)
-            _vprint(f"{contrast_name}: done.", verbose)
+            if len(gene_set_dict) > 0:
+                _res = blitzgsea.gsea(rnk, gene_set_dict, permutations=permutation_num)
+                _res.loc[:, "Term"] = _res.index
+                _res.loc[:, "contrast"] = contrast_name
+                _res.loc[:, "num_cells_1"] = num_cells_per_condition.loc[contrast_name, "num_cells_1"]
+                _res.loc[:, "num_cells_2"] = num_cells_per_condition.loc[contrast_name, "num_cells_2"]
+                _res.loc[:, "percent_duplicate_ranking_stats"] = (
+                    rnk.duplicated(keep="first").sum() / rnk.shape[0]
+                ) * 100
+                results.append(_res)
+                _vprint(f"{contrast_name}: done.", verbose)
+            else:
+                print(f"No enrichment results for {celltype_signature} because gene set is empty.")
+                return
 
         # combine results and save hyperparams
         results = pd.concat(results, axis=0, ignore_index=True)
@@ -424,6 +428,101 @@ def run_one_enrichment_test(
 
         return results
 
+    def run_all_enrichment_test(
+        self,
+        adata: AnnData,
+        df: pd.DataFrame,
+        celltype_combos: list[tuple[str, str]] = None,
+        celltype_column: str = "cell_type",
+        contrasts_combo: tuple[str, str] | list[tuple[str, str]] = None,
+        contrast_column: str = "disease_state",
+        direction: Literal["upregulated", "downregulated", "both"] = "upregulated",
+        # Filtering parameters for gene set construction
+        threshold_lfc: float | list[float] = 1.0,
+        threshold_expression: float | list[float] = 0.0,
+        threshold_pval: float = 0.01,
+        # GSEA parameters
+        min_size: int = 10,
+        max_size: int = 1000,
+        permutation_num: int = 1000,
+        weight: float = 1.0,
+        seed: int = 2025,
+        verbose: bool = False,
+        threads: int = 6,
+    ) -> pd.DataFrame:
+        """Function wrapper: Computes cytokine enrichment activity in one celltype using GSEA scoring. Loops through several threshold value to obtain more robust gene sets.
+
+        1. "Looks up" query cell type in human cytokine dictionary and retrieves associated up-/downregulated genes per cytokine as reference.
+        2. Creates ranking of query data genes contrasting condition1 vs condition2. A continuum from genes most associated with condition1 (top) to genes most associated with condition2 (bottom)
+        3. Computes enrichment of each cytokine by matching their associated gene set in the ranked list.
+
+        Parameters
+        ----------
+        - adata
+            The query adata object.
+        - df
+            Human Cytokine Dictionary
+        - celltype_combos
+            A tuple with the celltype names of query adata in first position and respective celltype name of df in second position. Simulates "lookup of query in dictionary".
+        - celltype_column
+            Column name of adata.obs object that stores the cell types.
+        - contrasts_combo
+            Tuple that stores two biological conditions that are compared to each other in enrichment. E.g., which cytokines are enriched in healthy samples vs disease samples? Can be a list of tuples, function automatically loops through them.
+        - contrast_column
+            Column name of adata.obs object that stores the biological condition of samples.
+        - direction
+            "upregulated", "downregulated", or "both" are valid input. Up-/downregulation w.r.t condition1 (condition1 is the first of the two elements in each contrasts tuple.
+        - threshold_pval
+            Constructs the gene set: Filters for genes in human df with an adj. p-val lower than threshold_pval.
+        - threshold_lfc
+            Constructs the gene set: Filters for genes in human df that are up/downregulated with a lfc higher than threshold_lfc.
+        - threshold_expression
+            Filters out genes with mean gene expression across all cells lower than threshold_expression.
+
+        Returns:
+        -------
+        - results
+            A DataFrame with all computed enrichment scores and statistical parameters. All results from multiple thresholds (ran for robustness).
+        """
+        if celltype_combos is None:
+            celltype_combos = [("B cell", "B_cell")]
+        if isinstance(threshold_lfc, float):
+            threshold_lfc = [threshold_lfc]
+        if isinstance(threshold_expression, float):
+            threshold_expression = [threshold_expression]
+
+        all_enrichment_results = []
+        for _celltype_combo_k, celltype_combo in enumerate(celltype_combos):
+            for lfc in threshold_lfc:
+                for expr in threshold_expression:
+                    results = self.run_one_enrichment_test(
+                        adata=adata,
+                        df=df,
+                        celltype_combo=celltype_combo,
+                        celltype_column=celltype_column,
+                        contrasts_combo=contrasts_combo,
+                        contrast_column=contrast_column,
+                        direction=direction,
+                        # Robustness parameters
+                        threshold_pval=threshold_pval,
+                        threshold_lfc=lfc,
+                        threshold_expression=expr,
+                        # GSEA parameters
+                        min_size=min_size,
+                        max_size=max_size,
+                        permutation_num=permutation_num,
+                        weight=weight,
+                        seed=seed,
+                        verbose=verbose,
+                        threads=threads,
+                    )
+
+                    all_enrichment_results.append(results)
+
+        all_enrichment_results = pd.concat(all_enrichment_results, axis=0)
+
+        return all_enrichment_results
+
     def _check_robustness_fractions(
         self,
         df_pivot: pd.DataFrame,
@@ -654,6 +753,7 @@ def get_robust_significant_results(
 
         return robust_results_dict
 
+    ######## cell communication methods ########
     def _get_senders(
         self,
         adata: AnnData,
@@ -974,6 +1074,8 @@ def plot_significant_results(
                     pivot,
                     square=True,
                     annot=annot,
+                    vmin=-1,
+                    vmax=1,
                     cmap="RdBu_r",
                     center=0,
                     annot_kws={"fontsize": fontsize, "family": "sans-serif"},
@@ -1026,6 +1128,8 @@ def plot_significant_results(
                 results_pivot,
                 square=True,
                 annot=df_annot,
+                vmin=-1,
+                vmax=1,
                 cmap="RdBu_r",
                 center=0,
                 annot_kws={"fontsize": fontsize, "family": "sans-serif"},

From ea2fbfd239c972cb22782831c42ef5b53bd27fd2 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Sun, 11 Jan 2026 23:46:40 +0100
Subject: [PATCH 05/11] removed import of gseapy

---
 pertpy/tools/_hucira.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/pertpy/tools/_hucira.py b/pertpy/tools/_hucira.py
index aae49980..b6722857 100644
--- a/pertpy/tools/_hucira.py
+++ b/pertpy/tools/_hucira.py
@@ -5,7 +5,6 @@
 from typing import Literal
 
 import blitzgsea
-import gseapy as gp
 import matplotlib.lines as mlines
 import matplotlib.pyplot as plt
 import numpy as np
@@ -546,7 +545,7 @@ def check_robustness(
         threshold_qval: float = 0.1,
         threshold_valid: float = 0.1,
         threshold_below_alpha: float = 0.9,
-    ):
+    ) -> pd.DataFrame:
         """Filters for robust and significant results (<threshold_qval/alpha) out of original enrichments (run_enrichment_test() output).
 
         Returns only the enrichments that are stable across many different tests and that are statistically significant.
@@ -650,7 +649,7 @@ def get_robust_significant_results(
         alphas: list[float] | None = None,
         threshold_valid: float = 0.1,
         threshold_below_alpha: float = 0.9,
-    ):
+    ) -> pd.DataFrame:
         """Function Wrapper: Filters for robust and signifcant results across several alpha/q-val from original enrichments (run_enrichment_test() output).
 
         Returns only the enrichments that are statistically significant (q-val), and stable across many different tests (per contrast).

From df4371c4a5af4fa5ceaadd5f37c0368f9cafea89 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Mon, 12 Jan 2026 22:39:50 +0100
Subject: [PATCH 06/11] added dependencies and very generic tests

---
 pertpy/data/__init__.py    |   2 +
 pertpy/data/_datasets.py   |  33 ++++++++++++
 pertpy/tools/_hucira.py    |  38 +++++++++++++-
 pyproject.toml             |   6 ++-
 tests/tools/test_hucira.py | 105 +++++++++++++++++++++++++++++++++++++
 5 files changed, 181 insertions(+), 3 deletions(-)
 create mode 100644 tests/tools/test_hucira.py

diff --git a/pertpy/data/__init__.py b/pertpy/data/__init__.py
index 9a23f0a7..06a55f2f 100644
--- a/pertpy/data/__init__.py
+++ b/pertpy/data/__init__.py
@@ -1,4 +1,5 @@
 from pertpy.data._datasets import (
+    MS_CSF_tutorial_data,
     adamson_2016_pilot,
     adamson_2016_upr_epistasis,
     adamson_2016_upr_perturb_seq,
@@ -88,6 +89,7 @@
     "human_cytokine_dict",
     "kang_2018",
     "mcfarland_2020",
+    "MS_CSF_tutorial_data",
     "norman_2019",
     "norman_2019_raw",
     "papalexi_2021",
diff --git a/pertpy/data/_datasets.py b/pertpy/data/_datasets.py
index 2b548aa5..8d657d70 100644
--- a/pertpy/data/_datasets.py
+++ b/pertpy/data/_datasets.py
@@ -1633,3 +1633,36 @@ def human_cytokine_dict(exclude_well_biased_genes=True) -> pd.DataFrame:
         cytokine_dict = cytokine_dict.loc[~cytokine_dict.well_biased]
 
     return cytokine_dict
+
+
+def MS_CSF_tutorial_data(save_dir="", force_download=False):
+    """Multiple Sklerosis Dataset (blood and cerebrospinal fluid) for hucira tutorial.
+
+    Download and load the MS dataset automatically.
+    Xu, Chenling (2021). MS_CSF.h5ad. figshare. Dataset. https://doi.org/10.6084/m9.figshare.14356661.v1
+
+    Parameters
+    ----------
+    save_dir : str
+        Directory where the file will be saved.
+    force_download : bool
+        Allows user to force a fresh download from CellxGene
+
+    Returns:
+    -------
+    adata : AnnData
+        MS adata object.
+    """
+    output_file_name = "MS_CSF.h5ad"
+    output_file_path = settings.datasetdir / output_file_name
+
+    if force_download or not output_file_path.exists():
+        _download(
+            url="https://figshare.com/ndownloader/files/27405182",
+            output_file_name=output_file_name,
+            output_path=settings.datasetdir,
+            is_zip=False,
+        )
+
+    adata = sc.read_h5ad(output_file_path)
+    return adata
diff --git a/pertpy/tools/_hucira.py b/pertpy/tools/_hucira.py
index b6722857..6123772f 100644
--- a/pertpy/tools/_hucira.py
+++ b/pertpy/tools/_hucira.py
@@ -48,7 +48,7 @@ def load_cytokine_info(self, save_dir="", force_download=False):
         save_dir.mkdir(parents=True, exist_ok=True)
         local_path = save_dir / "cytokine_info.xlsx"
 
-        if force_download or not Path.exists(local_path):
+        if force_download or not local_path.exists():
             print("Downloading Cytokine Information sheet...")
             cytokine_info = pd.read_excel(url, sheet_name="all_cytokines", engine="openpyxl")
             cytokine_info.to_excel(local_path, sheet_name="all_cytokines")
@@ -58,6 +58,36 @@ def load_cytokine_info(self, save_dir="", force_download=False):
 
         return cytokine_info
 
+    def load_CIP_signatures(self, save_dir="", force_download=False):
+        """Download and load metadata file (sheet "13.CIP_activations") from supplemental data: information about CIPs (cytokine induced gene programs).
+
+        Parameters
+        ----------
+        save_dir : str
+            Directory where the file will be saved.
+        force_download : bool
+            Allows user to force a fresh download
+
+        Returns:
+        -------
+        CIP_signatures : pandas.DataFrame
+        """
+        url = "https://raw.githubusercontent.com/theislab/huCIRA/main/src/hucira/data/df_cips_genesets.csv"
+        if save_dir == "":
+            save_dir = Path.cwd()
+        save_dir.mkdir(parents=True, exist_ok=True)
+        local_path = save_dir / "CIP_signatures.csv"
+
+        if force_download or not local_path.exists():
+            print("Downloading Cytokine-induced Gene Programs...")
+            CIP_signatures = pd.read_csv(url, index_col=0)
+            CIP_signatures.to_csv(local_path, index=False)
+        else:
+            print(f"Loading from: {local_path}")
+            CIP_signatures = pd.read_csv(local_path, index_col=0)
+
+        return CIP_signatures
+
     def _get_genesets(
         self,
         adata: AnnData,
@@ -303,11 +333,15 @@ def run_one_enrichment_test(
         - results
             A DataFrame with all computed enrichment scores and statistical parameters. Not filtered by significance or robustness yet.
         """
-        print(type(contrasts_combo))
         if not isinstance(contrasts_combo, list):
             assert isinstance(contrasts_combo, tuple)
             contrasts_combo = [contrasts_combo]
 
+        if not isinstance(celltype_combo, tuple):
+            raise ValueError(
+                f"Expected a tuple of two strings for celltype_combo, got {type(celltype_combo)}. This function only computes enrichment for one cell type. If you want to compute enrichment for several celltypes, use 'run_all_enrichment_test()'."
+            )
+
         celltype_adata = celltype_combo[0]
         celltype_signature = celltype_combo[1]
 
diff --git a/pyproject.toml b/pyproject.toml
index be0498d9..056d870b 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -65,7 +65,11 @@ dependencies = [
     "scikit-learn>=1.4",
     "fast-array-utils[accel,sparse]",
     "arviz",
-    "filelock"
+    "filelock",
+    "bokeh",
+    "pycirclize",
+    "tqdm"
+
 ]
 
 [project.optional-dependencies]
diff --git a/tests/tools/test_hucira.py b/tests/tools/test_hucira.py
new file mode 100644
index 00000000..003e01da
--- /dev/null
+++ b/tests/tools/test_hucira.py
@@ -0,0 +1,105 @@
+import numpy as np
+import pandas as pd
+import pytest
+import scanpy as sc
+from anndata import AnnData
+
+import pertpy as pt
+
+
+@pytest.fixture
+def dummy_adata():
+    n_obs = 15
+    n_vars = 5
+    rng = np.random.default_rng()
+    X = rng.random((n_obs, n_vars))
+    adata = AnnData(X)
+    adata.var_names = [f"gene{i}" for i in range(n_vars)]
+    adata.obs["cell_type"] = ["B cell"] * 5 + ["CD8a"] * 5 + ["Mono"] * 5  # celltype column
+    adata.obs["conditions"] = ["Healthy"] * 7 + ["Disease"] * 8  # contrast column
+    return adata
+
+
+@pytest.fixture(scope="module")
+def hucira():
+    return pt.tl.Hucira()
+
+
+@pytest.fixture(scope="module")
+def hcd():
+    return pt.dt.human_cytokine_dict()
+
+
+# Generic test confirming correct output.
+def test_compute_ranking_statistic(dummy_adata, hucira):
+    contrast_column = "conditions"
+    contrasts_combo = [("Healthy", "Disease")]
+
+    ranked_stats, _num_cells = hucira._compute_ranking_statistic(dummy_adata, contrast_column, contrasts_combo)
+    assert isinstance(ranked_stats, pd.DataFrame)
+
+    # with pytest.raises(KeyError):
+    #    hucira._compute_ranking_statistic(dummy_adata, "wrong_conditions", contrasts_combo)
+
+
+# Test confirming correct argument format for celltype_combo
+def test_run_one_enrichment_test(dummy_adata, hcd, hucira):
+    # celltype_combo_correct = ("B cell", "B_cell")
+    celltype_combo_wrong = [
+        ("B cell", "B_cell"),
+        ("CD8a", "CD8_T_cell"),
+        ("Mono", "CD14_Mono"),
+    ]  # can't be a list for "run_one_enrichment_test()"
+
+    with pytest.raises(ValueError):
+        hucira.run_one_enrichment_test(
+            dummy_adata, hcd, celltype_combo_wrong, "cell_type", [("Healthy", "Disease")], "conditions", "upregulated"
+        )
+
+
+# Smoke test run
+def test_smoke_full_enrichment_test(dummy_adata, hcd, hucira):
+    celltype_combo = [
+        ("B cell", "B_cell"),
+        ("CD8a", "CD8_T_cell"),
+        ("Mono", "CD14_Mono"),
+    ]  # can't be a list for "run_one_enrichment_test()"
+    celltype_column = "cell_type"
+    contrasts_combo = [("Healthy", "Disease")]
+    contrast_column = "conditions"
+    # direction
+
+    all_enrichment_results = hucira.run_all_enrichment_test(
+        dummy_adata,
+        hcd,
+        contrasts_combo,
+        celltype_combo,
+        contrast_column,
+        celltype_column,
+        contrasts_combo,
+        contrast_column,
+    )
+    assert isinstance(all_enrichment_results, pd.DataFrame)
+
+    robust_results_dict = hucira.get_robust_significant_results(
+        results=all_enrichment_results,
+        alphas=[0.1, 0.05, 0.01],
+        threshold_valid=0.1,
+        threshold_below_alpha=0.9,
+    )
+    assert isinstance(robust_results_dict, dict)
+
+    cytokine_info = hucira.load_cytokine_info()
+    df_senders, df_receivers = hucira.get_all_senders_and_receivers(
+        dummy_adata,
+        cytokine_info,
+        robust_results_dict[contrasts_combo[0]][
+            2
+        ].cytokine.unique(),  # deep indexing, should change that soon bc not very robust.
+        celltype_column,
+        sender_pvalue_threshold=0.1,
+        receiver_mean_X_threshold=0,
+    )
+
+    assert isinstance(df_senders, pd.DataFrame)
+    assert isinstance(df_receivers, pd.DataFrame)

From bbdae6a74990379c67d74e2217c2535fe1d4534f Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Wed, 20 May 2026 13:33:12 +0200
Subject: [PATCH 07/11] remove hucira module, keep only hcd loading function.

---
 pertpy/data/__init__.py    |    2 -
 pertpy/data/_datasets.py   |   51 +-
 pertpy/tools/__init__.py   |    2 -
 pertpy/tools/_hucira.py    | 1418 ------------------------------------
 pyproject.toml             |    6 +-
 tests/tools/test_hucira.py |  105 ---
 6 files changed, 13 insertions(+), 1571 deletions(-)
 delete mode 100644 pertpy/tools/_hucira.py
 delete mode 100644 tests/tools/test_hucira.py

diff --git a/pertpy/data/__init__.py b/pertpy/data/__init__.py
index 06a55f2f..9a23f0a7 100644
--- a/pertpy/data/__init__.py
+++ b/pertpy/data/__init__.py
@@ -1,5 +1,4 @@
 from pertpy.data._datasets import (
-    MS_CSF_tutorial_data,
     adamson_2016_pilot,
     adamson_2016_upr_epistasis,
     adamson_2016_upr_perturb_seq,
@@ -89,7 +88,6 @@
     "human_cytokine_dict",
     "kang_2018",
     "mcfarland_2020",
-    "MS_CSF_tutorial_data",
     "norman_2019",
     "norman_2019_raw",
     "papalexi_2021",
diff --git a/pertpy/data/_datasets.py b/pertpy/data/_datasets.py
index 8d657d70..a2726143 100644
--- a/pertpy/data/_datasets.py
+++ b/pertpy/data/_datasets.py
@@ -1601,17 +1601,23 @@ def hagai_2018() -> AnnData:  # pragma: no cover
     return adata
 
 
-def human_cytokine_dict(exclude_well_biased_genes=True) -> pd.DataFrame:
-    r"""Human Cytokine Dictionary curated from PBMC allows you to infer differential cytokine activity.
+def human_cytokine_dict(exclude_well_biased_genes: bool = True) -> pd.DataFrame:
+    """Human Cytokine Dictionary curated from PBMC allows you to infer differential cytokine activity.
 
-    The Human Cytokine Dictionary was created from single-cell RNA-seq of 9,697,974 human peripheral blood mononuclear cells (PBMC) from 12 donors stimulated in vitro with 87 different cytokines. The object is a dataframe representing cytokine activity as differentially expressed genes after cytokine perturbation.
+    The Human Cytokine Dictionary was created from single-cell RNA-seq of 9,697,974 human peripheral blood mononuclear cells (PBMC)
+    from 12 donors stimulated in vitro with 87 different cytokines.
+    Genes with a mean-to-stddev-ratio above 1 across all 6 wells for >10 cytokines in a given cell type and for >5 cell types are "well-biased".
+
+    Args:
+        exclude_well_biased_genes: Whether to exclude well-biased genes from the returned dataframe.
 
     References:
-        Oesinghaus, Lukas and Becker, S{\"o}ren and Vornholz, Larsen
-        .... bla bla coming
+        Oesinghaus, L., Becker, S., Vornholz, L., Papalexi, E. et al.
+        A single-cell cytokine dictionary of human peripheral blood.
+        bioRxiv (2025). https://doi.org/10.64898/2025.12.12.693897
 
     Returns:
-        Pandas DataFrame
+        :class:`~pandas.DataFrame` object of differentially expressed genes after cytokine perturbation.
 
     """
     output_file_name = "human_cytokine_dict.csv"
@@ -1633,36 +1639,3 @@ def human_cytokine_dict(exclude_well_biased_genes=True) -> pd.DataFrame:
         cytokine_dict = cytokine_dict.loc[~cytokine_dict.well_biased]
 
     return cytokine_dict
-
-
-def MS_CSF_tutorial_data(save_dir="", force_download=False):
-    """Multiple Sklerosis Dataset (blood and cerebrospinal fluid) for hucira tutorial.
-
-    Download and load the MS dataset automatically.
-    Xu, Chenling (2021). MS_CSF.h5ad. figshare. Dataset. https://doi.org/10.6084/m9.figshare.14356661.v1
-
-    Parameters
-    ----------
-    save_dir : str
-        Directory where the file will be saved.
-    force_download : bool
-        Allows user to force a fresh download from CellxGene
-
-    Returns:
-    -------
-    adata : AnnData
-        MS adata object.
-    """
-    output_file_name = "MS_CSF.h5ad"
-    output_file_path = settings.datasetdir / output_file_name
-
-    if force_download or not output_file_path.exists():
-        _download(
-            url="https://figshare.com/ndownloader/files/27405182",
-            output_file_name=output_file_name,
-            output_path=settings.datasetdir,
-            is_zip=False,
-        )
-
-    adata = sc.read_h5ad(output_file_path)
-    return adata
diff --git a/pertpy/tools/__init__.py b/pertpy/tools/__init__.py
index 2d765ea8..06a44cd7 100644
--- a/pertpy/tools/__init__.py
+++ b/pertpy/tools/__init__.py
@@ -7,7 +7,6 @@
 from pertpy.tools._distances._distance_tests import DistanceTest
 from pertpy.tools._distances._distances import Distance
 from pertpy.tools._enrichment import Enrichment
-from pertpy.tools._hucira import Hucira
 from pertpy.tools._milo import Milo
 from pertpy.tools._mixscape import Mixscape
 from pertpy.tools._perturbation_space._clustering import ClusteringSpace
@@ -69,7 +68,6 @@ def __dir__():
     "DistanceTest",
     "Distance",
     "Enrichment",
-    "hucira",
     "Milo",
     "Mixscape",
     "ClusteringSpace",
diff --git a/pertpy/tools/_hucira.py b/pertpy/tools/_hucira.py
deleted file mode 100644
index 6123772f..00000000
--- a/pertpy/tools/_hucira.py
+++ /dev/null
@@ -1,1418 +0,0 @@
-import os
-import re
-import warnings
-from pathlib import Path
-from typing import Literal
-
-import blitzgsea
-import matplotlib.lines as mlines
-import matplotlib.pyplot as plt
-import numpy as np
-import pandas as pd
-import scanpy as sc
-import seaborn as sns
-from anndata import AnnData
-from bokeh.palettes import all_palettes
-from pycirclize import Circos
-from tqdm.auto import tqdm
-
-
-def _vprint(msg, verbose):
-    if verbose:
-        print(msg)
-
-
-class Hucira:
-    def load_cytokine_info(self, save_dir="", force_download=False):
-        """Download and load Cytokine information sheet: includes information about sender and receptor genes (for cell-cell communication plot).
-
-        Parameters
-        ----------
-        save_dir : str
-            Directory where the file will be saved.
-        force_download : bool
-            Allows user to force a fresh download
-
-        Returns:
-        -------
-        cytokine_info : pandas.DataFrame
-        """
-        url = (
-            "https://raw.githubusercontent.com/theislab/huCIRA/"
-            "main/src/hucira/data/"
-            "20250125_cytokine_info_with_functional_classification_LV.xlsx"
-        )
-
-        if save_dir == "":
-            save_dir = Path.cwd()
-        save_dir.mkdir(parents=True, exist_ok=True)
-        local_path = save_dir / "cytokine_info.xlsx"
-
-        if force_download or not local_path.exists():
-            print("Downloading Cytokine Information sheet...")
-            cytokine_info = pd.read_excel(url, sheet_name="all_cytokines", engine="openpyxl")
-            cytokine_info.to_excel(local_path, sheet_name="all_cytokines")
-        else:
-            print(f"Loading from: {local_path}")
-            cytokine_info = pd.read_excel(local_path)
-
-        return cytokine_info
-
-    def load_CIP_signatures(self, save_dir="", force_download=False):
-        """Download and load metadata file (sheet "13.CIP_activations") from supplemental data: information about CIPs (cytokine induced gene programs).
-
-        Parameters
-        ----------
-        save_dir : str
-            Directory where the file will be saved.
-        force_download : bool
-            Allows user to force a fresh download
-
-        Returns:
-        -------
-        CIP_signatures : pandas.DataFrame
-        """
-        url = "https://raw.githubusercontent.com/theislab/huCIRA/main/src/hucira/data/df_cips_genesets.csv"
-        if save_dir == "":
-            save_dir = Path.cwd()
-        save_dir.mkdir(parents=True, exist_ok=True)
-        local_path = save_dir / "CIP_signatures.csv"
-
-        if force_download or not local_path.exists():
-            print("Downloading Cytokine-induced Gene Programs...")
-            CIP_signatures = pd.read_csv(url, index_col=0)
-            CIP_signatures.to_csv(local_path, index=False)
-        else:
-            print(f"Loading from: {local_path}")
-            CIP_signatures = pd.read_csv(local_path, index_col=0)
-
-        return CIP_signatures
-
-    def _get_genesets(
-        self,
-        adata: AnnData,
-        df: pd.DataFrame,
-        celltype_signature: str,
-        direction: Literal["upregulated", "downregulated", "both"] | None = None,
-        threshold_pval: float | None = None,
-        threshold_lfc: float | None = None,
-    ) -> tuple[dict[str, list[str]], pd.DataFrame]:
-        """Get shared gene sets between query adata and the Human Cytokine Dictionary, CIP signatures, or custom gene signatures of a chosen cell type.
-
-        Parameters
-        ----------
-        - adata: AnnData object with gene expression data.
-        - df: Either hcd, CIP signature, or a custom dataframe containing columns ["gene", "query_program", "celltype"].
-        - celltype_signature: celltype naming convention needs to match df.celltype
-        - direction: Relevant for hcd, but not for CIP or custom gene program
-        - threshold_pval: Relevant for hcd, but not for CIP or custom gene program
-        - threshold_lfc: Relevant for hcd, but not for CIP or custom gene program
-
-        Returns:
-        -------
-        - gene_set_dict: dictionary with cytokine/CIP as key and associated genes as values
-        - gene_set_df: df containing information on gene overlap between query data and gene program for chosen cell type
-        """
-        required_for_hcd = ["log_fc", "adj_p_value", "cytokine"]
-        required_for_CIP = ["gene", "CIP", "celltype"]
-
-        # Construct signature gene set if input is human cytokine dictionary
-        if set(required_for_hcd).issubset(df.columns):
-            print(f"Computing gene sets of Human Cytokine Dictionary for {celltype_signature}.")
-            select = (df.adj_p_value <= threshold_pval) & (df.celltype == celltype_signature)
-            if direction == "upregulated":
-                select = select & (df.log_fc >= threshold_lfc)
-            elif direction == "downregulated":
-                select = select & (df.log_fc <= threshold_lfc)
-            elif direction == "both":
-                select = select & (df.log_fc.abs() >= threshold_lfc)
-            else:
-                raise ValueError(f"Invalid direction: {direction}.")
-            df = df.loc[select]
-
-            gene_set_dict = {}
-            gene_set_df = pd.DataFrame()
-            for cytokine_i, cytokine in enumerate(df.cytokine.unique()):
-                gene_set = df.loc[df.cytokine == cytokine].gene.values
-                gene_set_shared = np.intersect1d(gene_set, adata.var_names)
-                gene_set_df.loc[cytokine_i, "cytokine"] = cytokine
-                gene_set_df.loc[cytokine_i, "num_genes_signature"] = len(gene_set)
-                gene_set_df.loc[cytokine_i, "num_shared_genes_signature"] = len(gene_set_shared)
-                gene_set_df.loc[cytokine_i, "frac_shared_genes_signature"] = len(gene_set_shared) / len(gene_set)
-                gene_set_dict[cytokine] = gene_set_shared
-
-        # Construct signature gene set if input is CIP signatures
-        elif set(required_for_CIP).issubset(df.columns):
-            print(f"Computing gene sets of Cytokine-induced gene programs for {celltype_signature}.")
-            select = df.celltype == celltype_signature
-            df = df.loc[select]
-            gene_set_dict = {}
-            gene_set_df = pd.DataFrame()
-            for CIP_i, CIP in enumerate(df.CIP.unique()):
-                gene_set = df.loc[df.CIP == CIP].gene.values
-                gene_set_shared = np.intersect1d(gene_set, adata.var_names)
-                gene_set_df.loc[CIP_i, "CIP"] = CIP
-                gene_set_df.loc[CIP_i, "num_genes_signature"] = len(gene_set)
-                gene_set_df.loc[CIP_i, "num_shared_genes_signature"] = len(gene_set_shared)
-                gene_set_df.loc[CIP_i, "frac_shared_genes_signature"] = len(gene_set_shared) / len(gene_set)
-                gene_set_dict[CIP] = gene_set_shared
-
-        # Construct signature gene set for custom gene programs
-        elif "query_program" in df.columns:
-            print(f"Computing gene sets of user-defined gene programs for {celltype_signature}.")
-            select = df.celltype == celltype_signature
-            df = df.loc[select]
-            gene_set_dict = {}
-            gene_set_df = pd.DataFrame()
-            for query_program_i, query_program in enumerate(df.query_program.unique()):
-                gene_set = df.loc[df.query_program == query_program].gene.values
-                gene_set_shared = np.intersect1d(gene_set, adata.var_names)
-                gene_set_df.loc[query_program_i, "query_program"] = query_program
-                gene_set_df.loc[query_program_i, "num_genes_signature"] = len(gene_set)
-                gene_set_df.loc[query_program_i, "num_shared_genes_signature"] = len(gene_set_shared)
-                gene_set_df.loc[query_program_i, "frac_shared_genes_signature"] = len(gene_set_shared) / len(gene_set)
-                gene_set_dict[query_program] = gene_set_shared
-
-        else:
-            raise ValueError(
-                "invalid input for df parameter. You can use either the Human Cytokine Dictionary with load_human_cytokine_dict(), or our CIP signatures with load_CIP_signatures(). If you want to compute enrichment of custom gene sets, df must have columns: ['gene', 'query_program', 'celltype']."
-            )
-            return
-        return gene_set_dict, gene_set_df
-
-    def _compute_mu_and_sigma(self, adata: AnnData, contrast_column: str, condition: str) -> pd.DataFrame:
-        group = adata[adata.obs[contrast_column] == condition]
-        num_cells = group.shape[0]
-        X = group.X.toarray() if hasattr(group.X, "toarray") else group.X
-        mu = np.mean(X, axis=0)
-        sigma = np.std(X, axis=0, ddof=1)
-        return {"mu": mu, "sigma": sigma, "num_cells": num_cells}
-
-    def _compute_s2n(
-        self,
-        adata: AnnData,
-        contrast_column: str,
-        condition_1: str,
-        condition_2: str,
-        precomputed_stats: dict | None = None,
-    ) -> tuple[pd.DataFrame, pd.DataFrame]:
-        """Compute the signal-to-noise ratio (S2N) for each gene between two conditions in an AnnData object.
-
-        Parameters
-        ----------
-        - adata: AnnData object with gene expression data.
-        - contrast_column: Key in `adata.obs` indicating the condition labels (e.g. "disease_state").
-        - condition_1: Name of the first condition (e.g., "flare").
-        - condition_2: Name of the second condition (e.g., "healthy").
-
-        Returns:
-        -------
-        - s2n_scores: pandas Series of S2N values indexed by gene names.
-        """
-        if precomputed_stats is None:
-            # Select cells for each condition
-            group1 = adata[adata.obs[contrast_column] == condition_1]
-            group2 = adata[adata.obs[contrast_column] == condition_2]
-
-            # number of cells per condition
-            num_cells_1 = group1.shape[0]
-            num_cells_2 = group2.shape[0]
-
-            # Get expression matrices
-            X1 = group1.X.toarray() if hasattr(group1.X, "toarray") else group1.X
-            X2 = group2.X.toarray() if hasattr(group2.X, "toarray") else group2.X
-
-            # Compute mean and std per gene
-            mu1 = np.mean(X1, axis=0)
-            mu2 = np.mean(X2, axis=0)
-            sigma1 = np.std(X1, axis=0, ddof=1)
-            sigma2 = np.std(X2, axis=0, ddof=1)
-
-        else:
-            _vprint("Using precomputed stats", True)
-            num_cells_1 = precomputed_stats[condition_1]["num_cells"]
-            num_cells_2 = precomputed_stats[condition_2]["num_cells"]
-            mu1 = precomputed_stats[condition_1]["mu"]
-            mu2 = precomputed_stats[condition_2]["mu"]
-            sigma1 = precomputed_stats[condition_1]["sigma"]
-            sigma2 = precomputed_stats[condition_2]["sigma"]
-
-        # Compute S2N
-        s2n = (mu1 - mu2) / (sigma1 + sigma2 + 1e-8)  # epsilon to avoid division by zero
-
-        num_cells = pd.DataFrame(
-            index=[f"{condition_1}_vs_{condition_2}"],
-            columns=["num_cells_1", "num_cells_2"],
-            data=[[num_cells_1, num_cells_2]],
-        )
-        stats = pd.DataFrame(s2n, index=adata.var_names, columns=[f"{condition_1}_vs_{condition_2}"])
-
-        return stats, num_cells
-
-    def _compute_ranking_statistic(
-        self, adata: AnnData, contrast_column: str, contrasts_combo: list[tuple[str, str]]
-    ) -> tuple[pd.DataFrame, pd.DataFrame]:
-        rnk_stats, num_cells = [], []
-        precomputed_stats = {}
-
-        conditions = []
-        for condition in contrasts_combo:
-            conditions.extend([condition[0], condition[1]])
-        conditions = np.unique(conditions)
-
-        for condition in conditions:
-            precomputed_stats[condition] = self._compute_mu_and_sigma(
-                adata, contrast_column=contrast_column, condition=condition
-            )
-
-        for condition in contrasts_combo:
-            _rnk_stats, _num_cells = self._compute_s2n(
-                adata,
-                contrast_column=contrast_column,
-                condition_1=condition[0],
-                condition_2=condition[1],
-                precomputed_stats=precomputed_stats,
-            )
-            rnk_stats.append(_rnk_stats)
-            num_cells.append(_num_cells)
-        return pd.concat(rnk_stats, axis=1), pd.concat(num_cells, axis=0)
-
-    def run_one_enrichment_test(
-        self,
-        adata: AnnData,
-        df: pd.DataFrame,
-        celltype_combo: tuple[str, str] = ("B cell", "B_cell"),
-        celltype_column: str = "cell_type",
-        contrasts_combo: tuple[str, str] | list[tuple[str, str]] = None,
-        contrast_column: str = "disease_state",
-        direction: Literal["upregulated", "downregulated", "both"] = "upregulated",
-        # Filtering parameters for gene set construction
-        threshold_lfc: float = 1.0,
-        threshold_expression: float = 0.0,
-        threshold_pval: float = 0.01,
-        # GSEA parameters
-        min_size: int = 10,
-        max_size: int = 1000,
-        permutation_num: int = 1000,
-        weight: float = 1.0,
-        seed: int = 2025,
-        verbose: bool = False,
-        threads: int = 6,
-    ) -> pd.DataFrame:
-        """Computes cytokine enrichment activity in one celltype using GSEA scoring.
-
-        1. "Looks up" query cell type in human cytokine dictionary and retrieves associated up-/downregulated genes per cytokine as reference.
-        2. Creates ranking of query data genes contrasting condition1 vs condition2. A continuum from genes most associated with condition1 (top) to genes most associated with condition2 (bottom)
-        3. Computes enrichment of each cytokine by matching their associated gene set in the ranked list.
-
-        Parameters
-        ----------
-        - adata
-            The query adata object.
-        - df
-            Human Cytokine Dictionary
-        - celltype_combo
-            A tuple with the celltype name of query adata in first position and respective celltype name of df in second position. Simulates "lookup of query in dictionary".
-        - celltype_column
-            Column name of adata.obs object that stores the cell types.
-        - contrasts_combo
-            Tuple that stores two biological conditions that are compared to each other in enrichment. E.g., which cytokines are enriched in healthy samples vs disease samples? Can be a list of tuples, function automatically loops through them.
-        - contrast_column
-            Column name of adata.obs object that stores the biological condition of samples.
-        - direction
-            "upregulated", "downregulated", or "both" are valid input. Up-/downregulation w.r.t condition1 (condition1 is the first of the two elements in each contrasts tuple.
-        - threshold_pval
-            Constructs the gene set: Filters for genes in human df with an adj. p-val lower than threshold_pval.
-        - threshold_lfc
-            Constructs the gene set: Filters for genes in human df that are up/downregulated with a lfc higher than threshold_lfc.
-        - threshold_expression
-            Filters out genes with mean gene expression across all cells lower than threshold_expression.
-
-        Returns:
-        -------
-        - results
-            A DataFrame with all computed enrichment scores and statistical parameters. Not filtered by significance or robustness yet.
-        """
-        if not isinstance(contrasts_combo, list):
-            assert isinstance(contrasts_combo, tuple)
-            contrasts_combo = [contrasts_combo]
-
-        if not isinstance(celltype_combo, tuple):
-            raise ValueError(
-                f"Expected a tuple of two strings for celltype_combo, got {type(celltype_combo)}. This function only computes enrichment for one cell type. If you want to compute enrichment for several celltypes, use 'run_all_enrichment_test()'."
-            )
-
-        celltype_adata = celltype_combo[0]
-        celltype_signature = celltype_combo[1]
-
-        # allows potential loop of celltype combos to continue
-        if celltype_adata not in adata.obs[celltype_column].unique():
-            print(
-                f"'{celltype_adata}' is not present in celltype_column ({celltype_column}) of query adata. Skipping enrichment test of this celltype.\n"
-            )
-            return None
-
-        # filter for cell type
-        _vprint("Filter for cell type:", verbose)
-        adata = adata[adata.obs[celltype_column] == celltype_adata]
-        _vprint("Filter for cell type: done.", verbose)
-
-        # filter based on gene expression
-        _vprint("Filter for gene expression:", verbose)
-        adata = adata[:, adata.X.mean(axis=0) >= threshold_expression]
-        _vprint("Filter for gene expression: done.", verbose)
-
-        # get genesets
-        _vprint("Get gene sets:", verbose)
-        gene_set_dict, gene_set_df = self._get_genesets(
-            adata=adata,
-            df=df,
-            celltype_signature=celltype_signature,
-            direction=direction,
-            threshold_pval=threshold_pval,
-            threshold_lfc=threshold_lfc,
-        )
-
-        gene_set_dict = {
-            key: gene_set for key, gene_set in gene_set_dict.items() if min_size < len(gene_set) < max_size
-        }
-
-        _vprint("Get gene sets: done.", verbose)
-
-        # compute ranking stat
-        _vprint("Get ranking stats:", verbose)
-        rnk_stats, num_cells_per_condition = self._compute_ranking_statistic(
-            adata, contrast_column=contrast_column, contrasts_combo=contrasts_combo
-        )
-        _vprint("Get ranking stats: done.", verbose)
-        results = []
-
-        for contrast_name in rnk_stats.columns:
-            print(contrast_name)
-            # format stat so that it can be processed by blitzgsea. E.g., needs col "0": genenames, and "1": scores
-            rnk = (
-                rnk_stats.loc[:, contrast_name]
-                .replace([np.inf, -np.inf], np.nan)
-                .dropna()
-                .sort_values(ascending=False)
-                .to_frame()
-                .reset_index()
-                .rename(columns={"index": "0", contrast_name: "1"})
-            )
-
-            # run enrichment (changed gp.prerank() to blitzgsea. The output result is in slightly diff format.
-            """
-            gp_res = gp.prerank(
-                rnk=rnk,
-                gene_sets=gene_set_dict,
-                min_size=min_size,
-                max_size=max_size,
-                permutation_num=permutation_num,
-                weight=weight,
-                outdir=None,
-                seed=seed,
-                verbose=verbose,
-                threads=threads,
-            )
-            """
-            if len(gene_set_dict) > 0:
-                _res = blitzgsea.gsea(rnk, gene_set_dict, permutations=permutation_num)
-                _res.loc[:, "Term"] = _res.index
-                _res.loc[:, "contrast"] = contrast_name
-                _res.loc[:, "num_cells_1"] = num_cells_per_condition.loc[contrast_name, "num_cells_1"]
-                _res.loc[:, "num_cells_2"] = num_cells_per_condition.loc[contrast_name, "num_cells_2"]
-                _res.loc[:, "percent_duplicate_ranking_stats"] = (
-                    rnk.duplicated(keep="first").sum() / rnk.shape[0]
-                ) * 100
-                results.append(_res)
-                _vprint(f"{contrast_name}: done.", verbose)
-            else:
-                print(f"No enrichment results for {celltype_signature} because gene set is empty.")
-                return
-
-        # combine results and save hyperparams
-        results = pd.concat(results, axis=0, ignore_index=True)
-        results.loc[:, "celltype_adata"] = celltype_adata
-        results.loc[:, "celltype_signature"] = celltype_signature
-        results.loc[:, "celltype_combo"] = f"{celltype_adata} ({celltype_signature})"
-        results.loc[:, "direction"] = direction
-        results.loc[:, "threshold_pval"] = threshold_pval
-        results.loc[:, "threshold_lfc"] = threshold_lfc
-        results.loc[:, "threshold_expression"] = threshold_expression
-        results.loc[:, "min_size"] = min_size
-        results.loc[:, "max_size"] = max_size
-        results.loc[:, "permutation_num"] = permutation_num
-        results.loc[:, "weight"] = weight
-        results.loc[:, "seed"] = seed
-        results.loc[:, "threads"] = threads
-
-        required_for_hcd = ["log_fc", "adj_p_value", "cytokine"]
-        if set(required_for_hcd).issubset(df.columns):
-            results.rename({"Term": "cytokine"}, inplace=True, axis=1)
-            results = pd.merge(results, gene_set_df, on="cytokine")
-        elif "CIP" in df.columns:
-            results.rename({"Term": "CIP"}, inplace=True, axis=1)
-            results = pd.merge(results, gene_set_df, on="CIP")
-            results.direction = "upregulated"
-        elif "query_program" in df.columns:
-            results.rename({"Term": "query_program"}, inplace=True, axis=1)
-            results = pd.merge(results, gene_set_df, on="query_program")
-            results.direction = "custom input"
-
-        return results
-
-    def run_all_enrichment_test(
-        self,
-        adata: AnnData,
-        df: pd.DataFrame,
-        celltype_combos: list[tuple[str, str]] = None,
-        celltype_column: str = "cell_type",
-        contrasts_combo: tuple[str, str] | list[tuple[str, str]] = None,
-        contrast_column: str = "disease_state",
-        direction: Literal["upregulated", "downregulated", "both"] = "upregulated",
-        # Filtering parameters for gene set construction
-        threshold_lfc: float | list[float] = 1.0,
-        threshold_expression: float | list[float] = 0.0,
-        threshold_pval: float = 0.01,
-        # GSEA parameters
-        min_size: int = 10,
-        max_size: int = 1000,
-        permutation_num: int = 1000,
-        weight: float = 1.0,
-        seed: int = 2025,
-        verbose: bool = False,
-        threads: int = 6,
-    ) -> pd.DataFrame:
-        """Function wrapper: Computes cytokine enrichment activity in one celltype using GSEA scoring. Loops through several threshold value to obtain more robust gene sets.
-
-        1. "Looks up" query cell type in human cytokine dictionary and retrieves associated up-/downregulated genes per cytokine as reference.
-        2. Creates ranking of query data genes contrasting condition1 vs condition2. A continuum from genes most associated with condition1 (top) to genes most associated with condition2 (bottom)
-        3. Computes enrichment of each cytokine by matching their associated gene set in the ranked list.
-
-        Parameters
-        ----------
-        - adata
-            The query adata object.
-        - df
-            Human Cytokine Dictionary
-        - celltype_combos
-            A tuple with the celltype names of query adata in first position and respective celltype name of df in second position. Simulates "lookup of query in dictionary".
-        - celltype_column
-            Column name of adata.obs object that stores the cell types.
-        - contrasts_combo
-            Tuple that stores two biological conditions that are compared to each other in enrichment. E.g., which cytokines are enriched in healthy samples vs disease samples? Can be a list of tuples, function automatically loops through them.
-        - contrast_column
-            Column name of adata.obs object that stores the biological condition of samples.
-        - direction
-            "upregulated", "downregulated", or "both" are valid input. Up-/downregulation w.r.t condition1 (condition1 is the first of the two elements in each contrasts tuple.
-        - threshold_pval
-            Constructs the gene set: Filters for genes in human df with an adj. p-val lower than threshold_pval.
-        - threshold_lfc
-            Constructs the gene set: Filters for genes in human df that are up/downregulated with a lfc higher than threshold_lfc.
-        - threshold_expression
-            Filters out genes with mean gene expression across all cells lower than threshold_expression.
-
-        Returns:
-        -------
-        - results
-            A DataFrame with all computed enrichment scores and statistical parameters. All results from multiple thresholds (ran for robustness).
-        """
-        if celltype_combos is None:
-            celltype_combos = [("B cell", "B_cell")]
-        if isinstance(threshold_lfc, float):
-            threshold_lfc = [threshold_lfc]
-        if isinstance(threshold_expression, float):
-            threshold_expression = [threshold_expression]
-
-        all_enrichment_results = []
-        for _celltype_combo_k, celltype_combo in enumerate(celltype_combos):
-            for lfc in threshold_lfc:
-                for expr in threshold_expression:
-                    results = self.run_one_enrichment_test(
-                        adata=adata,
-                        df=df,
-                        celltype_combo=celltype_combo,
-                        celltype_column=celltype_column,
-                        contrasts_combo=contrasts_combo,
-                        contrast_column=contrast_column,
-                        direction=direction,
-                        # Robustness parameters
-                        threshold_pval=threshold_pval,
-                        threshold_lfc=lfc,
-                        threshold_expression=expr,
-                        # GSEA parameters
-                        min_size=min_size,
-                        max_size=max_size,
-                        permutation_num=permutation_num,
-                        weight=weight,
-                        seed=seed,
-                        verbose=verbose,
-                        threads=threads,
-                    )
-
-                    all_enrichment_results.append(results)
-
-        all_enrichment_results = pd.concat(all_enrichment_results, axis=0)
-
-        return all_enrichment_results
-
-    def _check_robustness_fractions(
-        self,
-        df_pivot: pd.DataFrame,
-        threshold_qval: float = 0.1,  # adjusted p value
-        threshold_valid: float = 0.1,  # fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
-        threshold_below_alpha: float = 0.75,  # fraction of results that need to be significant
-    ):
-        n_total = np.prod(df_pivot.shape)
-        n_valid = n_total - df_pivot.isna().sum().sum()
-        n_below_alpha = (
-            (df_pivot < threshold_qval).sum().sum()
-        )  # number of results below pval threshold, i.e., number of significant results
-        frac_valid_results = n_valid / n_total
-        frac_pval_below_alpha = n_below_alpha / n_valid  # fraction of significant results relative to valid results
-        is_robust = (frac_pval_below_alpha > threshold_below_alpha) & (frac_valid_results > threshold_valid)
-        return frac_valid_results, frac_pval_below_alpha, is_robust
-
-    def check_robustness(
-        self,
-        all_results: pd.DataFrame,
-        threshold_qval: float = 0.1,
-        threshold_valid: float = 0.1,
-        threshold_below_alpha: float = 0.9,
-    ) -> pd.DataFrame:
-        """Filters for robust and significant results (<threshold_qval/alpha) out of original enrichments (run_enrichment_test() output).
-
-        Returns only the enrichments that are stable across many different tests and that are statistically significant.
-
-
-        Parameters
-        ----------
-        - results
-            The DataFrame output from run_enrichment_test().
-        - threshold_qval
-            Threshold that checks significance of results (leniently). Result is considered significant if its q-val is below this threshold.
-        - threshold_valid
-            The fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
-        - threshold_below_alpha
-            The fraction of results that need to be significant
-
-
-        Returns:
-        -------
-        - robust_results
-            DataFrame with robust and significant enrichments (includes min and max of nes)
-
-        """
-        all_thresholds_expression = all_results.threshold_expression.sort_values(ascending=False).unique()
-        all_thresholds_lfc = sorted(all_results.threshold_lfc.unique())
-
-        df = pd.DataFrame(index=all_thresholds_expression, columns=all_thresholds_lfc)
-        df.index.rename("threshold_expression", inplace=True)
-        df.columns.rename("threshold_lfc", inplace=True)
-
-        robust_results = []
-
-        # Get gene_program name of your enrichment analysis.
-        if "cytokine" in all_results.columns:
-            gene_program = "cytokine"
-        elif "CIP" in all_results.columns:
-            gene_program = "CIP"
-        elif "query_program" in all_results.columns:
-            gene_program = "query_program"
-        else:
-            raise ValueError("Missing column that is defining gene programs in 'all_results'.")
-            return
-
-        for contrast in tqdm(all_results.contrast.unique()):
-            for celltype_combo in all_results.celltype_combo.unique():
-                results_ct = all_results.loc[
-                    (all_results.celltype_combo == celltype_combo) & (all_results.contrast == contrast)
-                ]
-                for program in results_ct[gene_program].unique():
-                    results_ct_cy = results_ct.loc[results_ct[gene_program] == program]
-                    df_pivot = results_ct_cy.pivot(index="threshold_expression", columns="threshold_lfc", values="fdr")
-                    with warnings.catch_warnings():
-                        warnings.simplefilter(action="ignore", category=FutureWarning)
-                        df_combined = pd.concat([df, df_pivot])
-                    df_merged = df_combined.combine_first(df_pivot)
-                    df_merged = df_merged.loc[~df_merged.index.duplicated()]
-                    df_pivot = df_merged.loc[all_thresholds_expression, all_thresholds_lfc].astype(float)
-                    frac_valid_results, frac_pval_below_alpha, is_robust = self._check_robustness_fractions(
-                        df_pivot,
-                        threshold_qval=threshold_qval,
-                        threshold_valid=threshold_valid,
-                        threshold_below_alpha=threshold_below_alpha,
-                    )
-
-                    if is_robust:
-                        robust_results.append(
-                            (
-                                celltype_combo,
-                                contrast,
-                                program,
-                                frac_valid_results,
-                                frac_pval_below_alpha,
-                                is_robust,
-                                results_ct_cy.nes.min(),
-                                results_ct_cy.nes.max(),
-                                threshold_qval,
-                                threshold_below_alpha,
-                            )
-                        )
-
-        robust_results = pd.DataFrame(robust_results).rename(
-            {
-                0: "celltype_combo",
-                1: "contrast",
-                2: gene_program,
-                3: "frac_valid",
-                4: "frac_significant",
-                5: "is_robust",
-                6: "NES_min",
-                7: "NES_max",
-                8: "qval_threshold",
-                9: "threshold_frac_below_alpha",
-            },
-            axis=1,
-        )
-        return robust_results
-
-    def get_robust_significant_results(
-        self,
-        results: pd.DataFrame,
-        alphas: list[float] | None = None,
-        threshold_valid: float = 0.1,
-        threshold_below_alpha: float = 0.9,
-    ) -> pd.DataFrame:
-        """Function Wrapper: Filters for robust and signifcant results across several alpha/q-val from original enrichments (run_enrichment_test() output).
-
-        Returns only the enrichments that are statistically significant (q-val), and stable across many different tests (per contrast).
-        Calls check_robustness for different qval thresholds to explore more stringent significance thresholds. Use for visualization of results (e.g. in a heatmap). If using thresholds [0.1, 0.05, 0.01] for significant testing, returns significance notations as well (*, **, ***)
-
-        Parameters
-        ----------
-        - results
-            The DataFrame output from run_enrichment_test().
-        - alphas
-            List of thresholds (q-val) to check significance of results. Result is considered significant if its q-val is below this threshold.
-        - threshold_valid
-            The fraction of results required to even consider this condition. I.e. if the test only ran for one set of thresholds, then it is not very robust.
-        - threshold_below_alpha
-            The fraction of results that need to be significant
-
-        Returns:
-        -------
-        - robust_results_dict
-            Dictionary mapping contrasts to lists of the enrichment score results (pivot_df), their significance annotations (annot_df), and significance thresholds (robust_sub).
-            robust_results_dict = {contrast1: [pivot_df1, annot_df1, robust_sub1],
-                                   contrast2: [pivot_df2, annot_df2, robust_sub2]}
-        """
-        # default significant values (matching significance stars)
-        if alphas is None:
-            alphas = [0.1, 0.05, 0.01]
-
-        # Get gene_program name of your enrichment analysis.
-        if "cytokine" in results.columns:
-            gene_program = "cytokine"
-        elif "CIP" in results.columns:
-            gene_program = "CIP"
-        elif "query_program" in results.columns:
-            gene_program = "query_program"
-        else:
-            raise ValueError("Missing column that is defining gene programs in 'results'.")
-            return
-
-        results_robust = [
-            self.check_robustness(
-                results,
-                threshold_qval=alpha,
-                threshold_valid=threshold_valid,
-                threshold_below_alpha=threshold_below_alpha,
-            )
-            for alpha in alphas
-        ]
-
-        results_robust = pd.concat(results_robust)
-
-        # if none of the results in the df pass the filter, exit out and don't return anything.
-        if results_robust.empty:
-            print("No robust results to process. Exiting function.")
-            return
-
-        results_robust = (
-            results_robust.groupby(["contrast", "celltype_combo", gene_program])["qval_threshold"]
-            .min()
-            .to_frame()
-            .reset_index()
-        )
-
-        results_mean = (
-            results.assign(nes=pd.to_numeric(results.nes, errors="coerce"))  # ensure numeric
-            .fillna({"nes": 0})  # only fill NES
-            .groupby(["contrast", "celltype_combo", gene_program])["nes"]
-            .mean()
-            .to_frame()
-            .reset_index()
-        )
-
-        # Create separate robust results dict for every contrast pair.
-        robust_results_dict = {}
-        for contrast in results.contrast.unique():
-            subset = results_mean[results_mean.contrast == contrast]
-            pivot_df = subset.pivot(index=gene_program, columns="celltype_combo", values="nes")
-
-            # create empty annotation df
-            annot_df = pivot_df.copy().astype(object)
-            annot_df[:] = ""
-
-            # fill annotations based on results_robust
-            robust_sub = results_robust[results_robust.contrast == contrast]
-            for program in annot_df.index:
-                for celltype in annot_df.columns:
-                    qval = robust_sub.loc[
-                        (robust_sub[gene_program] == program) & (robust_sub.celltype_combo == celltype),
-                        "qval_threshold",
-                    ]
-                    if len(qval) != 0:
-                        qval = qval.values[0]
-                        if qval == 0.1:
-                            annot_df.loc[program, celltype] = "*"
-                        elif qval == 0.05:
-                            annot_df.loc[program, celltype] = "**"
-                        elif qval == 0.01:
-                            annot_df.loc[program, celltype] = "***"
-
-            robust_results_dict[contrast] = [pivot_df, annot_df, robust_sub]
-
-        return robust_results_dict
-
-    ######## cell communication methods ########
-    def _get_senders(
-        self,
-        adata: AnnData,
-        cytokine_info: pd.DataFrame,
-        cytokine: str = "IL-32-beta",
-        show: bool = False,
-        column_cell_type: str = "cell_type",
-    ) -> pd.DataFrame:
-        genes = np.unique(re.split(", ", cytokine_info.loc[cytokine_info.name == cytokine, "gene"].values[0]))
-        mask = np.isin(genes, adata.var_names)
-
-        if not mask.any():
-            print(f"None of the cytokine producing genes ({genes}) were found in dataset for cytokine {cytokine}.")
-            return None
-        if not mask.all():
-            print(
-                f"The following cytokine producing genes were not found in the dataset and are excluded: {genes[~mask]}"
-            )
-            genes = genes[mask]
-        adata = adata[:, genes]
-
-        # Ranks gene(s) of query sender cytokine across immune cell types.
-        adata_out = sc.tl.rank_genes_groups(
-            adata,
-            groupby=column_cell_type,
-            copy=True,
-            use_raw=False,
-            method="wilcoxon",
-        )
-        result = adata_out.uns["rank_genes_groups"]
-        groups = result["names"].dtype.names
-
-        results_mean, results_frac = [], []
-        rank_genes_df = []
-        for g in groups:
-            df = pd.DataFrame(
-                {
-                    "gene": result["names"][g],
-                    "logfoldchanges": result["logfoldchanges"][g],
-                    "pvals": result["pvals"][g],
-                    "pvals_adj": result["pvals_adj"][g],
-                    column_cell_type: g,
-                }
-            )
-            rank_genes_df.append(df)
-        rank_genes_df = pd.concat(rank_genes_df, axis=0)
-        rank_genes_df.set_index(column_cell_type, inplace=True)
-        grouped = rank_genes_df.groupby(column_cell_type)
-
-        # Chooses minimum rank_genes_group() statistical parameters (considers limiting gene, if there are multiple per cytokine)
-        grouped_rank_genes_df_all = []
-        for celltype in grouped.groups:
-            grouped_celltype_df = grouped.get_group(celltype)
-
-            # get gene with smallest log_fold_change (representing limiting gene), and retrieve stat. parameters
-            limiting_gene_idx = np.argmin(grouped_celltype_df["logfoldchanges"].values)
-            limiting_gene_vals = grouped_celltype_df.iloc[limiting_gene_idx][["logfoldchanges", "pvals", "pvals_adj"]]
-            gene_concat = ", ".join(grouped_celltype_df["gene"])
-            grouped_rank_genes_df = limiting_gene_vals.to_frame().T
-            grouped_rank_genes_df["gene"] = gene_concat
-            grouped_rank_genes_df.index = [celltype]
-            grouped_rank_genes_df_all.append(grouped_rank_genes_df)
-
-        grouped_rank_genes_df_all = pd.concat(grouped_rank_genes_df_all, axis=0)
-        grouped_rank_genes_df_all = grouped_rank_genes_df_all.rename(
-            columns={"logfoldchanges": "min_logfoldchanges", "pvals": "min_pvals", "pvals_adj": "min_pvals_adj"}
-        )
-
-        # Minimum of mean gene expression of sender cytokine genes:
-        X_df = adata[:, genes].to_df()
-        frac_df = X_df > 0
-        X_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
-        frac_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
-
-        # take minimum average gene expression across all genes required for this sender
-        results_mean = (
-            X_df.groupby(column_cell_type, observed=False).mean().min(axis=1).to_frame().rename({0: "mean_X"}, axis=1)
-        )
-        # take minimum expression fraction across all genes required for this sender
-        results_frac = (
-            frac_df.groupby(column_cell_type, observed=False)
-            .mean()
-            .min(axis=1)
-            .to_frame()
-            .rename({0: "frac_X"}, axis=1)
-        )
-
-        # Final df with information about active sender cytokines.
-        results = pd.concat([grouped_rank_genes_df_all, results_mean, results_frac], axis=1)
-        results["mean_X>0"] = results["mean_X"].where(results["mean_X"] > 0, None)
-        results.loc[:, "cytokine"] = cytokine
-        return results
-
-    def _get_receivers(
-        self, adata: AnnData, cytokine_info: pd.DataFrame, cytokine: str, column_cell_type: str = "cell_type"
-    ) -> pd.DataFrame | None:
-        # get receptor genes for this cytokine
-        _receptor_genes = cytokine_info.loc[cytokine_info.name == cytokine, "receptor gene"]
-        if _receptor_genes.isna().all():
-            print(f"No receptor gene found in cytokine_info for cytokine: {cytokine}")
-            return None
-        assert len(_receptor_genes) == 1, _receptor_genes
-        _receptor_genes = _receptor_genes.values[0]
-        # there can be multiple receptors
-        candidates = re.split("; ", _receptor_genes)
-        results_mean, results_frac = [], []
-        # each receptor may require the expression of multiple genes
-        for candidate in candidates:
-            # print(candidate)
-            genes = np.array(re.split(", ", candidate))
-            mask = np.isin(genes, adata.var_names)
-            if not mask.any():
-                print(f"None of the cytokine receptor genes ({genes}) were found in dataset for cytokine {cytokine}.")
-                continue
-            if not mask.all():
-                print(
-                    f"The following cytokine receptor genes were not found in the dataset and are excluded: {genes[~mask]}"
-                )
-                genes = genes[mask]
-            X_df = adata[:, genes].to_df()
-            frac_df = X_df > 0
-            X_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
-            frac_df.loc[:, column_cell_type] = adata.obs.loc[:, column_cell_type].values
-            # take minimum average gene expression across all genes required for this receptor
-            results_mean.append(X_df.groupby(column_cell_type, observed=False).mean().min(axis=1).to_frame())
-            # take minimum expression fraction across all genes required for this receptor
-            results_frac.append(frac_df.groupby(column_cell_type, observed=False).mean().min(axis=1).to_frame())
-        if len(results_mean) == 0:
-            return None
-
-        results_mean = pd.concat(results_mean, axis=1).max(axis=1).to_frame().rename({0: "mean_X"}, axis=1)
-        results_frac = pd.concat(results_frac, axis=1).max(axis=1).to_frame().rename({0: "frac_X"}, axis=1)
-        results = pd.concat([results_mean, results_frac], axis=1)
-        results.loc[:, "cytokine"] = cytokine
-        return results
-
-    def get_one_senders_and_receivers(
-        self,
-        adata: AnnData,
-        cytokine_info: pd.DataFrame,
-        cytokine: str,
-        celltype_colname: str = "cell_type",
-        sender_pvalue_threshold: float = 0.1,
-        receiver_mean_X_threshold: float = 0,
-        sender_lfc_threshold: float = 0,
-    ) -> tuple[pd.DataFrame, pd.DataFrame]:
-        """Generates cytokine producer and receiver statistics (senders and receivers of cell-cell communication) for one cytokine.
-
-        Best for exploration purposes of a singular cytokine.
-
-        Parameters
-        ----------
-        adata : AnnData
-            Query adata object of analysis
-        cytokine_info : pd.DataFrame
-            External file containing info about receptor genes of each cytokine in format
-            pd.DataFrame({"name": cytokine, "receptor gene": [gene1, gene2]})
-        cytokine : str
-            A cytokine, which ideally should be present in robust_results
-            (the outcome of the robust enrichment analysis)
-        celltype_colname : str, default "cell_type"
-            Column name of where cell types are stored in adata
-
-        Returns:
-        -------
-        df_senders : pd.DataFrame
-            Cytokine signal senders per cell type
-        df_receivers : pd.DataFrame
-            Cytokine signal receivers per cell type
-        """
-        df_senders = self._get_senders(
-            adata=adata, cytokine_info=cytokine_info, cytokine=cytokine, column_cell_type=celltype_colname
-        )
-        df_receivers = self._get_receivers(
-            adata=adata, cytokine_info=cytokine_info, cytokine=cytokine, column_cell_type=celltype_colname
-        )
-        if df_senders is not None:
-            df_senders = df_senders.loc[
-                (df_senders.min_pvals < sender_pvalue_threshold)
-                & (df_senders.min_logfoldchanges > sender_lfc_threshold)
-            ]
-        if df_receivers is not None:
-            df_receivers = df_receivers.loc[df_receivers.mean_X > receiver_mean_X_threshold]
-
-        return df_senders, df_receivers
-
-    def get_all_senders_and_receivers(
-        self,
-        adata: AnnData,
-        cytokine_info: pd.DataFrame,
-        cytokine_list: list = None,
-        celltype_colname: str = "cell_type",
-        sender_pvalue_threshold: float = 0.1,
-        receiver_mean_X_threshold: float = 0,
-    ) -> tuple[pd.DataFrame, pd.DataFrame]:
-        """Generates cytokine producer and receiver statistics (senders and receivers of cell-cell communication) for a list of cytokines.
-
-        Best for visualization purposes (for plot_communication function).
-
-        Parameters
-        ----------
-        adata : AnnData
-            Query adata object of analysis
-        cytokine_info : pd.DataFrame
-            External file containing info about receptor genes of each cytokine in format
-            pd.DataFrame({"name": cytokine, "receptor gene": [gene1, gene2]})
-        cytokine_list : list, optional
-            List of cytokines, which ideally should be present in robust_results
-            (the outcome of the robust enrichment analysis). Default is None.
-        celltype_colname : str, default "cell_type"
-            Column name of where cell types are stored in adata
-
-        Returns:
-        -------
-        df_src : pd.DataFrame
-            All cytokine signal senders
-        df_tgt : pd.DataFrame
-            All cytokine signal receivers
-        """
-        senders, receivers = [], []
-        for cytokine in cytokine_list:
-            df_senders, df_receivers = self.get_one_senders_and_receivers(
-                adata=adata,
-                cytokine_info=cytokine_info,
-                cytokine=cytokine,
-                celltype_colname=celltype_colname,
-                sender_pvalue_threshold=0.1,
-                receiver_mean_X_threshold=0,
-            )
-
-            if cytokine == "IL-32-beta":
-                # no known receptor genes - create non-informative df_receivers manually.
-                all_celltypes = sorted(adata.obs[celltype_colname].unique())
-                df_receivers = pd.DataFrame.from_dict(
-                    dict(zip(all_celltypes, np.ones([len(all_celltypes), 2]) * np.inf, strict=True)),
-                    orient="index",
-                ).rename({0: "mean_X", 1: "frac_X"}, axis=1)
-                df_receivers.loc[:, "cytokine"] = cytokine
-
-            if df_senders is not None and df_receivers is not None:
-                df_senders = df_senders.assign(celltype=df_senders.index)
-                df_receivers = df_receivers.assign(celltype=df_receivers.index)
-
-                senders.append(df_senders)
-                receivers.append(df_receivers)
-
-        df_src = pd.concat(senders)
-        df_tgt = pd.concat(receivers)
-
-        return df_src, df_tgt
-
-    ######## PLOTTING: #########
-
-    def _format_cytokine_names(self, x):
-        if isinstance(x, (list, np.ndarray, pd.Index)):
-            return [self._format_cytokine_names(_x) for _x in x]
-        text = x.get_text() if hasattr(x, "get_text") else x
-        text = text.replace("beta", r"$\beta$")
-        text = text.replace("alpha", r"$\alpha$")
-        text = text.replace("gamma", r"$\gamma$")
-        text = text.replace("lambda", r"$\lambda$")
-        text = text.replace("omega", r"$\omega$")
-        return text
-
-    def plot_significant_results(
-        self,
-        results_pivot: pd.DataFrame,
-        df_annot: pd.DataFrame,
-        robust_results_dict: dict[str, pd.DataFrame] | None = None,
-        selected_celltypes: list[str] | None = None,
-        selected_cytokines: list[str] | None = None,
-        fontsize: float = 6.0,
-        save_fig: bool = False,
-        fig_path: str = "",
-        fig_width: float = 10.0,
-        fig_height: float = 12.0,
-    ):
-        """Optional heatmap plotting aid: Plots either the robust results from a dict of contrasts or individually per contrast.
-
-        Parameters
-        ----------
-        - robust_results_dict:
-            robust enrichment score dictionary from get_significant_results(). If this argument is present it has precedence over results_pivot and df_annot.
-        - results_pivot:
-            pandas DataFrame of robust enrichment for results from one contrast
-        - df_annot:
-            pandas DataFrame of robust enrichment significance annotations for results from one contrast
-        - selected_celltypes:
-            Can choose to only visualize selected celltypes out of available from robust results. Must be in robust results, otherwise error.
-        - selected_cytokines:
-            Can choose to only visualize selected celltypes out of available from robust results. Must be in robust results, otherwise error.
-
-        Returns:
-        -------
-        - Nothing. Plotting function only
-
-        """
-        # Case 1: robust_results_dict is provided. This precedes the other arguments. Plots all contrasts together.
-        if robust_results_dict is not None and len(robust_results_dict) > 0:
-            n = len(robust_results_dict)
-            fig, axes = plt.subplots(1, n, squeeze=False)
-
-            for i, (contrast, (_pivot, _annot, _)) in enumerate(robust_results_dict.items()):
-                ax = axes[0, i]
-                pivot = _pivot
-                annot = _annot
-
-                # Apply filtering if requested
-                if selected_celltypes:
-                    pivot = pivot.T.loc[selected_celltypes].T
-                    annot = annot.T.loc[selected_celltypes].T
-                if selected_cytokines:
-                    pivot = pivot.loc[selected_cytokines]
-                    annot = annot.loc[selected_cytokines]
-
-                fig, ax = plt.subplots(figsize=(fig_width, fig_height))
-                sns.heatmap(
-                    pivot,
-                    square=True,
-                    annot=annot,
-                    vmin=-1,
-                    vmax=1,
-                    cmap="RdBu_r",
-                    center=0,
-                    annot_kws={"fontsize": fontsize, "family": "sans-serif"},
-                    fmt="",
-                    linewidths=0.5,
-                    linecolor="white",
-                    cbar=True,
-                    cbar_kws={"shrink": 0.5, "fraction": 0.04, "pad": 0.02},
-                    ax=ax,
-                )
-
-                ax.set_title(contrast, fontsize=10)
-                ax.set_xlabel("")
-                ax.set_ylabel("")
-                ax.set_facecolor("lightgray")
-                ax.tick_params(axis="both", which="both", length=0)
-
-                # Axis labels
-                ax.set_xticks(0.5 + np.arange(pivot.shape[1]))
-                ax.set_xticklabels(pivot.columns, fontsize=fontsize, rotation=90, ha="center")
-                ax.set_yticks(0.5 + np.arange(pivot.shape[0]))
-                ax.set_yticklabels(self._format_cytokine_names(pivot.index), fontsize=fontsize, rotation=0, ha="right")
-
-            if save_fig:
-                fig_file = Path(fig_path) / "all_contrasts_significant_results.svg"
-                # Ensure the directory exists
-                fig_file.parent.mkdir(parents=True, exist_ok=True)
-
-                plt.savefig(
-                    fig_file,
-                    bbox_inches="tight",
-                    pad_inches=0,
-                    dpi=500,
-                )
-            plt.tight_layout()
-            plt.show()
-            return
-
-        # Case 2: single robust_result is provided, only the one chosen contrast comparison is plotted.
-        if isinstance(results_pivot, pd.DataFrame) and isinstance(df_annot, pd.DataFrame):
-            if selected_celltypes:
-                results_pivot = results_pivot.T.loc[selected_celltypes].T
-                df_annot = df_annot.T.loc[selected_celltypes].T
-            if selected_cytokines:
-                results_pivot = results_pivot.loc[selected_cytokines]
-                df_annot = df_annot.loc[selected_cytokines]
-
-            fig, ax = plt.subplots(figsize=(fig_width, fig_height))
-            sns.heatmap(
-                results_pivot,
-                square=True,
-                annot=df_annot,
-                vmin=-1,
-                vmax=1,
-                cmap="RdBu_r",
-                center=0,
-                annot_kws={"fontsize": fontsize, "family": "sans-serif"},
-                fmt="",
-                linewidths=0.5,
-                linecolor="white",
-                cbar=True,
-                cbar_kws={"shrink": 0.5, "fraction": 0.04, "pad": 0.02},
-                ax=ax,
-            )
-            ax.set_title("Contrast1_vs_Contrast2", fontsize=10)
-            ax.set_xlabel("")
-            ax.set_ylabel("")
-            ax.set_facecolor("lightgray")
-            ax.tick_params(axis="both", which="both", length=0)
-
-            # Axis labels
-            ax.set_xticks(0.5 + np.arange(results_pivot.shape[1]))
-            ax.set_xticklabels(results_pivot.columns, fontsize=fontsize, rotation=90, ha="center")
-            ax.set_yticks(0.5 + np.arange(results_pivot.shape[0]))
-            ax.set_yticklabels(
-                self._format_cytokine_names(results_pivot.index), fontsize=fontsize, rotation=0, ha="right"
-            )
-
-            plt.show()
-
-            if save_fig:
-                fig_file = Path(fig_path) / "significant_results.svg"
-                # Ensure the directory exists
-                fig_file.parent.mkdir(parents=True, exist_ok=True)
-
-                plt.savefig(fig_file, bbox_inches="tight", pad_inches=0, dpi=500)
-            return
-
-        print("Nothing was plotted. Check input data!")
-        return
-
-    def plot_communication(
-        self,
-        df_src: pd.DataFrame,
-        df_tgt: pd.DataFrame,
-        frac_expressing_cells_sender: float | None = 0.05,
-        frac_expressing_cells_receiver: float | None = 0.05,
-        mean_cytokine_gene_expression_sender: float | None = None,
-        mean_cytokine_gene_expression_receiver: float | None = None,
-        df_enrichment: pd.DataFrame | None = None,
-        all_celltypes: list | None = None,
-        cytokine2color: dict | None = None,
-        celltype2color: dict | None = None,
-        figsize: tuple[float, float] = (5, 5),
-        show_legend: bool = True,
-        save_path: str | None = None,
-        lw: float = 1.0,
-        fontsize: int = 6,
-        loc: str = "upper left",
-        bbox_to_anchor: tuple[float, float] = (1, 1),
-    ):
-        """Generates a Circos plot to visualize cell-cell communication based on cytokine producers and receivers.
-
-        The function filters the input dataframes based on thresholds for fraction of expressing cells
-        and mean cytokine gene expression, then creates a circular layout with cell type partitions
-        and draws directed links representing cytokine communication between producers and receivers.
-
-        Parameters
-        ----------
-        df_src : pd.DataFrame
-            DataFrame containing producer cell type and cytokine expression statistics,
-            typically from `_get_expression_stats`. Must have 'celltype', 'cytokine',
-            'mean_cytokine_gene_expression', and 'frac_expressing_cells' columns.
-        df_tgt : pd.DataFrame
-            DataFrame containing receiver cell type and cytokine expression statistics,
-            typically from `_get_expression_stats`. Must have 'celltype', 'cytokine',
-            'mean_cytokine_gene_expression', and 'frac_expressing_cells' columns.
-        frac_expressing_cells_sender : float | None, default 0.05
-            Minimum fraction of cells expressing a cytokine gene for a producer cell type.
-            If None, no filtering is applied.
-        frac_expressing_cells_receiver : float | None, default 0.05
-            Minimum fraction of cells expressing a cytokine gene for a receiver cell type.
-            If None, no filtering is applied.
-        mean_cytokine_gene_expression_sender : float | None, default None
-            Minimum mean expression of a cytokine gene for a producer cell type. If None, no filtering is applied.
-        mean_cytokine_gene_expression_receiver : float | None, default None
-            Minimum mean expression of a cytokine gene for a receiver cell type. If None, no filtering is applied.
-        df_enrichment : pd.DataFrame | None, optional
-            Optional dataframe with enrichment information. Default is None.
-        all_celltypes : list | None, optional
-            List of all cell types. If None, inferred from df_src and df_tgt.
-        cytokine2color : dict | None, optional
-            Optional mapping from cytokine names to colors.
-        celltype2color : dict | None, optional
-            Optional mapping from cell type names to colors.
-        figsize : tuple[float, float], default (5, 5)
-            Figure size for the plot.
-        show_legend : bool, default True
-            Whether to show the legend.
-        save_path : str | None, optional
-            Path to save the figure. If None, figure is not saved.
-        lw : float, default 1.0
-            Line width for links.
-        fontsize : int, default 6
-            Font size for labels.
-        loc : str, default "upper left"
-            Legend location.
-        bbox_to_anchor : tuple[float, float], default (1, 1)
-            Bounding box anchor for the legend.
-
-        """
-        if frac_expressing_cells_sender is not None:
-            df_src = df_src.loc[df_src.frac_X > frac_expressing_cells_sender]
-        if frac_expressing_cells_receiver is not None:
-            df_tgt = df_tgt.loc[df_tgt.frac_X > frac_expressing_cells_receiver]
-        if mean_cytokine_gene_expression_sender is not None:
-            df_src = df_src.loc[df_src.mean_X > mean_cytokine_gene_expression_sender]
-        if frac_expressing_cells_receiver is not None:
-            df_tgt = df_tgt.loc[df_tgt.mean_X > mean_cytokine_gene_expression_receiver]
-
-        if all_celltypes is None:
-            all_celltypes = sorted(np.union1d(df_src.celltype.unique(), df_tgt.celltype.unique()))
-        # celltype_colors = all_palettes["Set3"][len(all_celltypes)]
-        if celltype2color is None:
-            n = len(all_celltypes)
-
-            # Get first 20 colors from Category20
-            palette_20 = all_palettes["Category20"][20]
-            # Get 20 colors from Category20b
-            palette_20b = all_palettes["Category20b"][20]
-
-            # Combine palettes
-            combined_palette = palette_20 + palette_20b
-
-            if n > 40:
-                raise ValueError(f"Too many cell types ({n}) for available palettes (max 40).")
-
-            # Assign colors to cell types
-            celltype_colors = combined_palette[:n]
-            celltype2color = dict(zip(all_celltypes, celltype_colors, strict=True))
-
-        all_cytokines = np.union1d(df_src.cytokine.unique(), df_tgt.cytokine.unique())
-        cytokine2idx = {cytokine: k for k, cytokine in enumerate(all_cytokines)}
-        # cytokine_colors = all_palettes["Category20"][len(all_cytokines)]
-        # cytokine2color = dict(zip(all_cytokines, cytokine_colors, strict=True))
-
-        unique_cytokines = df_src.cytokine.unique()
-        if df_enrichment is not None:
-            significant_cytokines = df_enrichment.cytokine.unique()
-            unique_cytokines = np.intersect1d(unique_cytokines, significant_cytokines)
-
-        if cytokine2color is None:
-            cytokine_colors = all_palettes["Colorblind"][max(3, len(unique_cytokines))]
-            cytokine_colors = cytokine_colors[: len(unique_cytokines)]  # in case there are less than 3 unique cytokines
-            # cytokine_colors = all_palettes["Set3"][max(3, len(unique_cytokines))]
-            cytokine2color = dict(zip(unique_cytokines, cytokine_colors, strict=True))
-
-        # draw outer circle / cell type partitions
-        sectors = dict(zip(all_celltypes, (2 * len(all_cytokines) + 3) * np.ones(len(all_celltypes)), strict=True))
-
-        circos = Circos(sectors, space=3)
-        for sector in circos.sectors:
-            start, stop = sector.deg_lim
-            center = (start + stop) / 2
-            track = sector.add_track((92, 100))
-
-            if 160 >= center >= 20:
-                ha = "left"
-            elif 340 >= center >= 200:
-                ha = "right"
-            else:
-                ha = "center"
-
-            va = "bottom" if center < 90 or center > 270 else "top"
-
-            track.axis(facecolor=celltype2color[sector.name])
-            # track.text(shorten_cell_type_names(sector.name), color="black", size=6, r=110, rotation="horizontal", adjust_rotation=False, family="sans-serif", ha=ha)
-            track.text(
-                sector.name,
-                color="black",
-                size=fontsize,
-                r=110,
-                rotation="horizontal",
-                adjust_rotation=False,
-                family="sans-serif",
-                ha=ha,
-                va=va,
-            )
-
-        # draw links
-        legend_cytokine2color = {}
-        for _row_idx, row in df_src.iterrows():
-            src_celltype = row.celltype
-            cytokine_idx = cytokine2idx[row.cytokine]
-            tgt_celltypes = df_tgt.loc[df_tgt.cytokine == row.cytokine].celltype.unique()
-
-            for tgt_celltype in tgt_celltypes:
-                is_enriched = True  # default --> plot if enriched or whenever no enrichment info is provided
-
-                if df_enrichment is not None:
-                    df_enrichment.loc[:, "celltype"] = df_enrichment.celltype_combo.apply(lambda x: x.split(" (")[0])
-                    select = (df_enrichment.celltype == tgt_celltype) & (df_enrichment.cytokine == row.cytokine)
-                    is_enriched = df_enrichment.loc[select].shape[0] > 0
-
-                if is_enriched:
-                    linestyle = None
-                    _score = df_tgt.loc[
-                        (df_tgt.cytokine == row.cytokine) & (df_tgt.celltype == tgt_celltype), "mean_X"
-                    ].values
-                    assert len(_score) == 1
-                    if not np.isfinite(_score[0]):
-                        linestyle = "--"
-
-                    circos.link_line(
-                        (src_celltype, 1 + cytokine_idx),  # src node
-                        (tgt_celltype, 2 + len(all_cytokines) + cytokine_idx),  # tgt node
-                        direction=1,
-                        color=cytokine2color[row.cytokine],
-                        # color=celltype2color[src_celltype],
-                        lw=lw,
-                        arrow_height=8.0,
-                        arrow_width=8.0,
-                        linestyle=linestyle,
-                    )
-                    if row.cytokine not in legend_cytokine2color:
-                        legend_cytokine2color[row.cytokine] = cytokine2color[row.cytokine]
-
-        circos.plotfig(figsize=figsize)
-        plt.gca()
-
-        legend_handles = []
-        legend_labels = []
-        for cytokine, color in legend_cytokine2color.items():
-            legend_handles.append(mlines.Line2D([], [], color=color, lw=1.5))
-            legend_labels.append(cytokine)
-        if show_legend:
-            plt.legend(
-                handles=legend_handles,
-                labels=legend_labels,
-                title="Cytokines",
-                loc=loc,
-                bbox_to_anchor=bbox_to_anchor,
-                prop={"family": "sans-serif", "size": 6},
-                title_fontsize=6,
-            )
-        plt.tight_layout()
-        if save_path:
-            plt.savefig(
-                save_path,
-                bbox_inches="tight",
-                pad_inches=0,
-                transparent=True,
-                dpi=400,
-            )
-        plt.show()
-
-        return legend_handles, legend_labels
diff --git a/pyproject.toml b/pyproject.toml
index 056d870b..be0498d9 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -65,11 +65,7 @@ dependencies = [
     "scikit-learn>=1.4",
     "fast-array-utils[accel,sparse]",
     "arviz",
-    "filelock",
-    "bokeh",
-    "pycirclize",
-    "tqdm"
-
+    "filelock"
 ]
 
 [project.optional-dependencies]
diff --git a/tests/tools/test_hucira.py b/tests/tools/test_hucira.py
deleted file mode 100644
index 003e01da..00000000
--- a/tests/tools/test_hucira.py
+++ /dev/null
@@ -1,105 +0,0 @@
-import numpy as np
-import pandas as pd
-import pytest
-import scanpy as sc
-from anndata import AnnData
-
-import pertpy as pt
-
-
-@pytest.fixture
-def dummy_adata():
-    n_obs = 15
-    n_vars = 5
-    rng = np.random.default_rng()
-    X = rng.random((n_obs, n_vars))
-    adata = AnnData(X)
-    adata.var_names = [f"gene{i}" for i in range(n_vars)]
-    adata.obs["cell_type"] = ["B cell"] * 5 + ["CD8a"] * 5 + ["Mono"] * 5  # celltype column
-    adata.obs["conditions"] = ["Healthy"] * 7 + ["Disease"] * 8  # contrast column
-    return adata
-
-
-@pytest.fixture(scope="module")
-def hucira():
-    return pt.tl.Hucira()
-
-
-@pytest.fixture(scope="module")
-def hcd():
-    return pt.dt.human_cytokine_dict()
-
-
-# Generic test confirming correct output.
-def test_compute_ranking_statistic(dummy_adata, hucira):
-    contrast_column = "conditions"
-    contrasts_combo = [("Healthy", "Disease")]
-
-    ranked_stats, _num_cells = hucira._compute_ranking_statistic(dummy_adata, contrast_column, contrasts_combo)
-    assert isinstance(ranked_stats, pd.DataFrame)
-
-    # with pytest.raises(KeyError):
-    #    hucira._compute_ranking_statistic(dummy_adata, "wrong_conditions", contrasts_combo)
-
-
-# Test confirming correct argument format for celltype_combo
-def test_run_one_enrichment_test(dummy_adata, hcd, hucira):
-    # celltype_combo_correct = ("B cell", "B_cell")
-    celltype_combo_wrong = [
-        ("B cell", "B_cell"),
-        ("CD8a", "CD8_T_cell"),
-        ("Mono", "CD14_Mono"),
-    ]  # can't be a list for "run_one_enrichment_test()"
-
-    with pytest.raises(ValueError):
-        hucira.run_one_enrichment_test(
-            dummy_adata, hcd, celltype_combo_wrong, "cell_type", [("Healthy", "Disease")], "conditions", "upregulated"
-        )
-
-
-# Smoke test run
-def test_smoke_full_enrichment_test(dummy_adata, hcd, hucira):
-    celltype_combo = [
-        ("B cell", "B_cell"),
-        ("CD8a", "CD8_T_cell"),
-        ("Mono", "CD14_Mono"),
-    ]  # can't be a list for "run_one_enrichment_test()"
-    celltype_column = "cell_type"
-    contrasts_combo = [("Healthy", "Disease")]
-    contrast_column = "conditions"
-    # direction
-
-    all_enrichment_results = hucira.run_all_enrichment_test(
-        dummy_adata,
-        hcd,
-        contrasts_combo,
-        celltype_combo,
-        contrast_column,
-        celltype_column,
-        contrasts_combo,
-        contrast_column,
-    )
-    assert isinstance(all_enrichment_results, pd.DataFrame)
-
-    robust_results_dict = hucira.get_robust_significant_results(
-        results=all_enrichment_results,
-        alphas=[0.1, 0.05, 0.01],
-        threshold_valid=0.1,
-        threshold_below_alpha=0.9,
-    )
-    assert isinstance(robust_results_dict, dict)
-
-    cytokine_info = hucira.load_cytokine_info()
-    df_senders, df_receivers = hucira.get_all_senders_and_receivers(
-        dummy_adata,
-        cytokine_info,
-        robust_results_dict[contrasts_combo[0]][
-            2
-        ].cytokine.unique(),  # deep indexing, should change that soon bc not very robust.
-        celltype_column,
-        sender_pvalue_threshold=0.1,
-        receiver_mean_X_threshold=0,
-    )
-
-    assert isinstance(df_senders, pd.DataFrame)
-    assert isinstance(df_receivers, pd.DataFrame)

From e423ccf5f5c5cbca6156ea81b57063829accef4d Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Mon, 25 May 2026 17:54:36 +0200
Subject: [PATCH 08/11] Point tutorials submodule at fork branch for huCIRA
 enrichment tutorial

---
 .gitmodules              | 2 +-
 docs/tutorials/notebooks | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.gitmodules b/.gitmodules
index ff287bb4..b3ec04b3 100644
--- a/.gitmodules
+++ b/.gitmodules
@@ -1,3 +1,3 @@
 [submodule "docs/notebooks"]
 	path = docs/tutorials/notebooks
-	url = https://github.com/scverse/pertpy-tutorials/
+	url = https://github.com/Jenniliu12/pertpy-tutorials/
diff --git a/docs/tutorials/notebooks b/docs/tutorials/notebooks
index 86069936..da20cd5e 160000
--- a/docs/tutorials/notebooks
+++ b/docs/tutorials/notebooks
@@ -1 +1 @@
-Subproject commit 86069936d9d811e23558ddefb462ed78ba3eaaa9
+Subproject commit da20cd5ecf24c94543f1e67d28b0b3a353a8ed0f

From 38a3899163a48cfc242dc4e080c8cf5f01fe2632 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Wed, 27 May 2026 23:04:45 +0200
Subject: [PATCH 09/11] Revert .gitmodules URL to scverse/pertpy-tutorials

---
 .gitmodules | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.gitmodules b/.gitmodules
index b3ec04b3..ff287bb4 100644
--- a/.gitmodules
+++ b/.gitmodules
@@ -1,3 +1,3 @@
 [submodule "docs/notebooks"]
 	path = docs/tutorials/notebooks
-	url = https://github.com/Jenniliu12/pertpy-tutorials/
+	url = https://github.com/scverse/pertpy-tutorials/

From 14e07c46d013a446a3a9a6eaa697dd2fda5fb865 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Thu, 28 May 2026 01:05:46 +0200
Subject: [PATCH 10/11] changed kernel to default and updated tutorial intro
 for the hucira extension

---
 docs/tutorials/notebooks | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/tutorials/notebooks b/docs/tutorials/notebooks
index da20cd5e..f2e0308f 160000
--- a/docs/tutorials/notebooks
+++ b/docs/tutorials/notebooks
@@ -1 +1 @@
-Subproject commit da20cd5ecf24c94543f1e67d28b0b3a353a8ed0f
+Subproject commit f2e0308f3877ec97792df2cd9802173900213631

From f253cc8920483f0cc7a06394780df113d8535963 Mon Sep 17 00:00:00 2001
From: Jenni Liu <liujenni@umich.edu>
Date: Thu, 28 May 2026 01:32:11 +0200
Subject: [PATCH 11/11] Update tutorials submodule to latest enrichment
 notebook commit

---
 docs/tutorials/notebooks | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/tutorials/notebooks b/docs/tutorials/notebooks
index f2e0308f..ba197060 160000
--- a/docs/tutorials/notebooks
+++ b/docs/tutorials/notebooks
@@ -1 +1 @@
-Subproject commit f2e0308f3877ec97792df2cd9802173900213631
+Subproject commit ba197060e7e195e8efe1d02e2f2e6e7c02abe0e9