import numpy as np
import pandas as pd

import scanpy as sc
import squidpy as sp

from anndata import AnnData


help(sp.gr.ligrec)

Help on function ligrec in module squidpy.gr._ligrec:

ligrec(adata: 'AnnData', cluster_key: 'str', interactions: 'Optional[InteractionType]' = None, complex_policy: 'str' = 'min', threshold: 'float' = 0.01, fdr_method: 'Optional[str]' = None, fdr_axis: 'str' = 'clusters', copy: 'bool' = False, key_added: 'Optional[str]' = None, **kwargs) -> 'Optional[LigrecResult]'
    Perform the permutation test as described in [CellPhoneDB20]_.
    
    Parameters
    ----------
    adata
        Annotated data object. Must contain :attr:`anndata.AnnData.raw` attribute.
    interactions
        Interaction to test. The type can be one of:
    
            - :class:`pandas.DataFrame` - must contain at least 2 columns named `'source'` and `'target'`.
            - :class:`dict` - dictionary with at least 2 keys named `'source'` and `'target'`.
            - :class:`typing.Sequence` - Either a sequence of :class:`str`, in which case all combinations are
              produced, or a sequence of :class:`tuple` of 2 :class:`str` or a :class:`tuple` of 2 sequences.
    
        If `None`, the interactions are extracted from :mod:`omnipath`. Protein complexes can be specified by
        delimiting the components using `_`, such as `'alpha_beta_gamma'`.
    complex_policy
        Policy on how to handle complexes. Can be one of:
    
            - `'min'` - select gene with the minimum average expression.
              This is the same as in [CellPhoneDB20]_.
            - `'all'` - select all possible combinations between complexes `'source'` and `'target'`.
    interactions_params
        Keyword arguments for :func:`omnipath.interactions.import_intercell_network` defining the interactions.
        These datasets from [OmniPath16]_ are used by default: `'omnipath'`, `'pathwayextra'` `'kinaseextra'`,
        `'ligrecextra'`.
    transmitter_params
        Keyword arguments for :func:`omnipath.interactions.import_intercell_network` defining the transmitter
        side of intercellular connections.
    receiver_params
        Keyword arguments for :func:`omnipath.interactions.import_intercell_network` defining the receiver
        side of intercellular connections.
    cluster_key
        Key in :attr:`anndata.AnnData.obs` where clusters are stored.
    clusters
        Clusters from :attr:`anndata.AnnData.obs` ``[cluster_key]``. Can be specified either as a sequence
        of :class:`tuple` or just a sequence of cluster names, in which case all combinations are created.
    n_perms
        Number of permutations for the permutation test.
    threshold
        Do not perform permutation test if any of the interacting components is being expressed
        in less than ``threshold`` percent of cells within a given cluster.
    seed
        Random seed for reproducibility.
    
    Returns
    -------
    :class:`collections.namedtuple` or None
        If ``copy = False``, updates ``adata.uns[{key_added}]`` with the following triple:
    
            - `'means'` - :class:`pandas.DataFrame` containing the mean expression.
            - `'pvalues'` - :class:`pandas.DataFrame` containing the possibly corrected p-values.
            - `'metadata'` - :class:`pandas.DataFrame` containing interaction metadata.
    
        Otherwise, just returns the result.
    
        `NaN` p-values mark combinations for which the mean expression of one of the interacting components was `0`
        or it didn't pass the ``threshold`` percentage of cells being expressed within a given cluster.


adata = sc.datasets.paul15()

WARNING: In Scanpy 0.*, this returned logarithmized data. Now it returns non-logarithmized data.

... storing 'paul15_clusters' as categorical
Trying to set attribute `.uns` of view, copying.


sc.pp.normalize_per_cell(adata)

adata.raw = adata.copy()


res = sp.gr.ligrec(adata, "paul15_clusters",
                   fdr_method=None, copy=True,
                   interactions_params={"resources": "CellPhoneDB"},
                   threshold=0.1, seed=0, n_perms=10000, n_jobs=1)
df = res.pvalues
print("Number of CellPhoneDB interactions (mouse data):", len(df))

df.head()

/home/michal/.miniconda3/envs/spatial/lib/python3.8/site-packages/requests/__init__.py:89: RequestsDependencyWarning: urllib3 (1.26.2) or chardet (3.0.4) doesn't match a supported version!
  warnings.warn("urllib3 ({}) or chardet ({}) doesn't match a supported "

WARNING: Removed `1` duplicate gene(s)

Number of CellPhoneDB interactions (mouse data): 9


sp.pl.ligrec(res, source_groups="10GMP")


res = sp.gr.ligrec(adata, "paul15_clusters",
                   fdr_method=None, copy=True,
                   threshold=0.1, seed=0, n_perms=10000, n_jobs=1)
df = res.pvalues
print("Number of OmniPath interactions (mouse data):", len(df))

df.head()

WARNING: Removed `1` duplicate gene(s)

Number of OmniPath interactions (mouse data): 107


sp.pl.ligrec(res, source_groups="10GMP")


adata = sc.datasets.pbmc3k_processed()
adata

AnnData object with n_obs × n_vars = 2638 × 1838
    obs: 'n_genes', 'percent_mito', 'n_counts', 'louvain'
    var: 'n_cells'
    uns: 'draw_graph', 'louvain', 'louvain_colors', 'neighbors', 'pca', 'rank_genes_groups'
    obsm: 'X_pca', 'X_tsne', 'X_umap', 'X_draw_graph_fr'
    varm: 'PCs'
    obsp: 'distances', 'connectivities'


res = sp.gr.ligrec(adata, "louvain",
                   fdr_method=None, copy=True,
                   interactions_params={"resources": "CellPhoneDB"},
                   threshold=0.1, seed=0, n_perms=10000, n_jobs=1)
df = res.pvalues
print("Number of CellPhoneDB interactions (human data):", len(df))

df.head()

Number of CellPhoneDB interactions (human data): 76


sp.pl.ligrec(res, source_groups=["CD4 T cells", "B cells"])


res = sp.gr.ligrec(adata, "louvain",
                   fdr_method=None, copy=True,
                   threshold=0.1, seed=0, n_perms=10000, n_jobs=1)
df = res.pvalues
print("Number of OmniPath interactions (human data):", len(df))

df.head()

Number of OmniPath interactions (human data): 510


sp.pl.ligrec(res, source_groups=["CD4 T cells", "B cells"])

	cluster_1	10GMP										...	9GMP
	cluster_2	10GMP	11DC	12Baso	13Baso	14Mo	15Mo	16Neu	17Neu	18Eos	19Lymph	...	19Lymph	1Ery	2Ery	3Ery	4Ery	5Ery	6Ery	7MEP	8Mk	9GMP
source	target
FYN	THY1	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN
FYN	ITGB1	0.0060	0.0843	0.7125	0.0068	0.0036	0.0067	0.4110	0.5669	0.3759	NaN	...	NaN	0.0953	0.0039	0.0001	0.0083	0.0944	0.0291	0.1237	0.0018	0.0292
TGFB1	ITGB1	0.0009	0.0206	0.1831	0.0022	0.0014	0.0010	0.0505	0.2222	0.1867	NaN	...	NaN	0.1474	0.0585	0.0093	0.0590	0.2032	0.1306	0.2321	0.0170	0.0691
ANGPT1	ITGB1	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	0.0744	0.0001	NaN	0.0018	0.0430	0.0104	0.0638	0.0005	0.0130
VEGFA	ITGB1	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN

Receptor-ligand permutation test¶

Imports¶

Usage¶

Load the mouse data¶

Run the CellPhoneDB's permutation test¶

Use only CellPhoneDB as a resource¶

Use all available resources from OmniPath¶

Load the human data¶

Run the CellPhoneDB's permutation test¶

Use only CellPhoneDB as a resource¶

Use all available resources from OmniPath¶

Conluding remarks¶

	cluster_1	B cells								CD14+ Monocytes		...	Megakaryocytes		NK cells
	cluster_2	B cells	CD14+ Monocytes	CD4 T cells	CD8 T cells	Dendritic cells	FCGR3A+ Monocytes	Megakaryocytes	NK cells	B cells	CD14+ Monocytes	...	Megakaryocytes	NK cells	B cells	CD14+ Monocytes	CD4 T cells	CD8 T cells	Dendritic cells	FCGR3A+ Monocytes	Megakaryocytes	NK cells
source	target
DLL1	NOTCH1	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN
TNF	NOTCH1	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN
DLL3	NOTCH1	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN
DLL1	NOTCH2	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN
DLL3	NOTCH2	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	...	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN