# !pip install risk-network --upgrade

import risk as r

# Report which RISK release is importable in this environment
print("RISK version:", r.__version__)

RISK version: 0.1.1

from risk import RISK

import os
from pathlib import Path

if "__file__" not in globals():
    os.chdir(Path().resolve())

%matplotlib inline

# Initialize the RISK object
# The instance is bound to `risk` and reused by every loader, clustering,
# statistics, graph and plotting call in this file.
# verbose=True presumably enables the banner-style log output recorded under
# those calls — TODO confirm.

risk = RISK(verbose=True)

# Load the network from a Cytoscape file for RISK analysis
# The result is bound to `network`, the name later cells pass to the annotation
# loaders, the clustering methods and load_graph.
# In the recorded run, min_edges_per_node=1 leaves all 3839 nodes and 30955
# edges in place.
# view_name="" presumably falls back to the session's default view — TODO confirm.

network = risk.load_network_cytoscape(
    filepath="./data/cytoscape/michaelis_2023.cys",
    source_label="source",
    target_label="target",
    view_name="",
    compute_sphere=True,
    surface_depth=0.1,
    min_edges_per_node=1,
)

---------------
Loading network
---------------
Filetype: Cytoscape
Filepath: ./data/cytoscape/michaelis_2023.cys
Minimum edges per node: 1
Projection: Sphere
Surface depth: 0.1
Initial node count: 3839
Final node count: 3839
Initial edge count: 30955
Final edge count: 30955

# Load the network from a Cytoscape JSON file for RISK analysis
# Rebinds `network`, replacing whatever an earlier loader cell produced.
# NOTE: in the recorded run this loader warns that all 30955 edges had invalid or
# non-positive lengths and were replaced with a fallback value of 1e-12; the
# recorded .cys and .gpickle loads of the same dataset show no such warning.
# NOTE(review): check whether the .cyjs export lacks usable edge lengths before
# relying on edge-length-based steps (e.g. `fraction_shortest_edges`) with it.

network = risk.load_network_cyjs(
    filepath="./data/cyjs/michaelis_2023.cyjs",
    source_label="source",
    target_label="target",
    compute_sphere=True,
    surface_depth=0.1,
    min_edges_per_node=1,
)

---------------
Loading network
---------------
Filetype: Cytoscape JSON
Filepath: ./data/cyjs/michaelis_2023.cyjs
Minimum edges per node: 1
Projection: Sphere
Surface depth: 0.1
EDGE LENGTH WARNING — 30955 out of 30955 edges (100.00%) had invalid or non-positive lengths and were replaced with a minimal fallback value (1e-12).
Initial node count: 3839
Final node count: 3839
Initial edge count: 30955
Final edge count: 30955

# Load the network from a GPickle file for RISK analysis
# Rebinds `network`, replacing whatever an earlier loader cell produced.
# NOTE(review): GPickle files are presumably Python pickles, which can execute
# arbitrary code when loaded — only load files from a trusted source.

network = risk.load_network_gpickle(
    filepath="./data/gpickle/michaelis_2023.gpickle",
    compute_sphere=True,
    surface_depth=0.1,
    min_edges_per_node=1,
)

---------------
Loading network
---------------
Filetype: GPickle
Filepath: ./data/gpickle/michaelis_2023.gpickle
Minimum edges per node: 1
Projection: Sphere
Surface depth: 0.1
Initial node count: 3839
Final node count: 3839
Initial edge count: 30955
Final edge count: 30955

# Load the network from a NetworkX graph for RISK analysis
# The input is the `network` object bound by an earlier loader cell, so this cell
# only works after one of those cells has run; the result rebinds the same name.

network = risk.load_network_networkx(
    network=network,
    compute_sphere=True,
    surface_depth=0.1,
    min_edges_per_node=1,
)

---------------
Loading network
---------------
Filetype: NetworkX
Minimum edges per node: 1
Projection: Sphere
Surface depth: 0.1
Initial node count: 3839
Final node count: 3839
Initial edge count: 30955
Final edge count: 30955

{
  "proline biosynthetic process": ["CAR2", "PRO1", "PRO2", "PRO3", "YHR033W"],
  "glyoxylate metabolic process": ["DAL7", "GOR1", "ICL1", "IDP1", "IDP2", "IDP3", "LEU2", "MDH3", "MLS1"]
}

# Load GO Biological Process (BP) annotations from a JSON file and associate them with the existing network
# Requires `network` from one of the network loader cells; the result is bound to
# `annotation`, which the statistical tests and load_graph consume.
# In the recorded run, the 5-75 nodes-per-term bounds reduce 2214 input terms to 1293.
# The file presumably maps each term name to a list of node labels — TODO confirm.

annotation = risk.load_annotation_json(
    network=network,
    filepath="./data/json/annotation/go_biological_process.json",
    min_nodes_per_term=5,
    max_nodes_per_term=75,
)

# Note: You can also load other GO annotations, such as:
# - 'go_cellular_component.json' for GO Cellular Component (CC) annotations
# - 'go_molecular_function.json' for GO Molecular Function (MF) annotations

------------------
Loading annotation
------------------
Filetype: JSON
Filepath: ./data/json/annotation/go_biological_process.json
Minimum number of nodes per annotation term: 5
Maximum number of nodes per annotation term: 75
Number of input annotation terms: 2214
Number of remaining annotation terms: 1293

# Load GO Biological Process (BP) annotations from a CSV file and associate them with the existing network
# Rebinds `annotation`. The "label" column presumably holds the term name and the
# "nodes" column the term's node labels joined by ";" — TODO confirm against the file.
# In the recorded run, the 5-75 nodes-per-term bounds reduce 2214 input terms to 1293.

annotation = risk.load_annotation_csv(
    network=network,
    filepath="./data/csv/annotation/go_biological_process.csv",
    label_colname="label",
    nodes_colname="nodes",
    nodes_delimiter=";",
    min_nodes_per_term=5,
    max_nodes_per_term=75,
)

# Note: You can also load other GO annotations using similar filenames, such as:
# - 'go_cellular_component.csv' for GO Cellular Component (CC) annotations
# - 'go_molecular_function.csv' for GO Molecular Function (MF) annotations

------------------
Loading annotation
------------------
Filetype: CSV
Filepath: ./data/csv/annotation/go_biological_process.csv
Minimum number of nodes per annotation term: 5
Maximum number of nodes per annotation term: 75
Number of input annotation terms: 2214
Number of remaining annotation terms: 1293

# Load GO Biological Process (BP) annotations from a TSV file and associate them with the existing network
# Rebinds `annotation`. Takes the same column and delimiter arguments as the CSV
# cell; nodes_delimiter=";" is passed separately from the file's tab separation.
# In the recorded run, the 5-75 nodes-per-term bounds reduce 2214 input terms to 1293.

annotation = risk.load_annotation_tsv(
    network=network,
    filepath="./data/tsv/annotation/go_biological_process.tsv",
    label_colname="label",
    nodes_colname="nodes",
    nodes_delimiter=";",
    min_nodes_per_term=5,
    max_nodes_per_term=75,
)

# Note: You can also load other GO annotations using similar filenames, such as:
# - 'go_cellular_component.tsv' for GO Cellular Component (CC) annotations
# - 'go_molecular_function.tsv' for GO Molecular Function (MF) annotations

------------------
Loading annotation
------------------
Filetype: TSV
Filepath: ./data/tsv/annotation/go_biological_process.tsv
Minimum number of nodes per annotation term: 5
Maximum number of nodes per annotation term: 75
Number of input annotation terms: 2214
Number of remaining annotation terms: 1293

# Load GO Biological Process (BP) annotations from an Excel file and associate them with the existing network
# Rebinds `annotation`. Besides the column and delimiter arguments used for
# CSV/TSV, the worksheet to read is named explicitly via sheet_name.
# In the recorded run, the 5-75 nodes-per-term bounds reduce 2214 input terms to 1293.

annotation = risk.load_annotation_excel(
    network=network,
    filepath="./data/excel/annotation/go_biological_process.xlsx",
    label_colname="label",
    nodes_colname="nodes",
    sheet_name="Sheet1",
    nodes_delimiter=";",
    min_nodes_per_term=5,
    max_nodes_per_term=75,
)

# Note: You can also load other GO annotations using similar filenames, such as:
# - 'go_cellular_component.xlsx' for GO Cellular Component (CC) annotations
# - 'go_molecular_function.xlsx' for GO Molecular Function (MF) annotations

------------------
Loading annotation
------------------
Filetype: Excel
Filepath: ./data/excel/annotation/go_biological_process.xlsx
Minimum number of nodes per annotation term: 5
Maximum number of nodes per annotation term: 75
Number of input annotation terms: 2214
Number of remaining annotation terms: 1293

# Load the JSON file into a dictionary, then use the dictionary to load annotations
# Requires `network` from one of the network loader cells; rebinds `annotation`.

import json

json_file_path = "./data/json/annotation/go_biological_process.json"
# JSON text is UTF-8 by specification; pin the encoding so decoding does not
# depend on the platform's default locale encoding (e.g. cp1252 on Windows).
with open(json_file_path, "r", encoding="utf-8") as file:
    annotation_dict = json.load(file)

# Use the loaded dictionary with the load_annotation_dict method
# The same 5-75 nodes-per-term bounds as the file-based loaders are applied.
annotation = risk.load_annotation_dict(
    network=network,
    content=annotation_dict,
    min_nodes_per_term=5,
    max_nodes_per_term=75,
)

------------------
Loading annotation
------------------
Filetype: Dictionary
Filepath: In-memory dictionary
Minimum number of nodes per annotation term: 5
Maximum number of nodes per annotation term: 75
Number of input annotation terms: 2214
Number of remaining annotation terms: 1293

# Louvain clustering example
# `clusters_louvain` is the clustering passed as `clusters=` to the statistical
# tests further down. The `.shape` / `.getnnz()` calls suggest a SciPy-style
# sparse matrix — TODO confirm; the recorded run reports 3839 x 3839 (matching
# the node count) with 38212 stored entries.
clusters_louvain = risk.cluster_louvain(
    network=network,
    fraction_shortest_edges=0.25,
    resolution=5.0,
    random_seed=887,
)
print(f"Louvain clusters: shape={clusters_louvain.shape}, nnz={clusters_louvain.getnnz()}")

------------------
Computing clusters
------------------
Clustering: 'louvain'
Edge length threshold: 0.25
Resolution: 5.0
Random seed: 887
Louvain clusters: shape=(3839, 3839), nnz=38212

# Leiden clustering example
# Same edge fraction and seed as the Louvain cell, but resolution=1.0 instead of 5.0.
# `clusters_leiden` is not referenced again in the visible part of this file.
clusters_leiden = risk.cluster_leiden(
    network=network,
    fraction_shortest_edges=0.25,
    resolution=1.0,
    random_seed=887,
)
print(f"Leiden clusters: shape={clusters_leiden.shape}, nnz={clusters_leiden.getnnz()}")

------------------
Computing clusters
------------------
Clustering: 'leiden'
Edge length threshold: 0.25
Resolution: 1.0
Random seed: 887
Leiden clusters: shape=(3839, 3839), nnz=54372

# Greedy modularity clustering example
# Only the network and the edge fraction are passed (no resolution or seed).
# `clusters_greedy` is not referenced again in the visible part of this file.
clusters_greedy = risk.cluster_greedy(
    network=network,
    fraction_shortest_edges=0.25,
)
print(f"Greedy clusters: shape={clusters_greedy.shape}, nnz={clusters_greedy.getnnz()}")

------------------
Computing clusters
------------------
Clustering: 'greedy'
Edge length threshold: 0.25
Greedy clusters: shape=(3839, 3839), nnz=68880

# Label propagation clustering example
# Only the network and the edge fraction are passed (no resolution or seed).
# `clusters_labelprop` is not referenced again in the visible part of this file.
clusters_labelprop = risk.cluster_labelprop(
    network=network,
    fraction_shortest_edges=0.25,
)
print(
    f"Label propagation clusters: shape={clusters_labelprop.shape}, nnz={clusters_labelprop.getnnz()}"
)

------------------
Computing clusters
------------------
Clustering: 'labelprop'
Edge length threshold: 0.25
Label propagation clusters: shape=(3839, 3839), nnz=42434

# Markov clustering example
# Only the network and the edge fraction are passed (no resolution or seed).
# `clusters_markov` is not referenced again in the visible part of this file.
clusters_markov = risk.cluster_markov(
    network=network,
    fraction_shortest_edges=0.25,
)
print(f"Markov clusters: shape={clusters_markov.shape}, nnz={clusters_markov.getnnz()}")

------------------
Computing clusters
------------------
Clustering: 'markov'
Edge length threshold: 0.25
Markov clusters: shape=(3839, 3839), nnz=31798

# Walktrap clustering example
# Only the network and the edge fraction are passed (no resolution or seed).
# `clusters_walktrap` is not referenced again in the visible part of this file.
clusters_walktrap = risk.cluster_walktrap(
    network=network,
    fraction_shortest_edges=0.25,
)
print(f"Walktrap clusters: shape={clusters_walktrap.shape}, nnz={clusters_walktrap.getnnz()}")

------------------
Computing clusters
------------------
Clustering: 'walktrap'
Edge length threshold: 0.25
Walktrap clusters: shape=(3839, 3839), nnz=42084

# Spinglass clustering example
# Only the network and the edge fraction are passed (no resolution or seed).
# `clusters_spinglass` is not referenced again in the visible part of this file.
clusters_spinglass = risk.cluster_spinglass(
    network=network,
    fraction_shortest_edges=0.25,
)
print(f"Spinglass clusters: shape={clusters_spinglass.shape}, nnz={clusters_spinglass.getnnz()}")

------------------
Computing clusters
------------------
Clustering: 'spinglass'
Edge length threshold: 0.25
Spinglass clusters: shape=(3839, 3839), nnz=38262

# Compute annotation significance by running the permutation test on Louvain clusters
# Needs `annotation` and `clusters_louvain` from earlier cells. The result,
# `stats_permutation`, is what load_graph receives as `stats_results`.
# The recorded run completed 1000 permutations in about 11 s with max_workers=4.

stats_permutation = risk.run_permutation(
    annotation=annotation,
    clusters=clusters_louvain,
    score_metric="stdev",
    null_distribution="network",
    num_permutations=1_000,
    random_seed=887,
    max_workers=4,
)

------------------------
Running permutation test
------------------------
Cluster scoring metric: 'stdev'
Number of permutations: 1000
Maximum workers: 4
Null distribution: 'network'

Total progress: 100%|█████████████████████████| 1000/1000 [00:11<00:00, 87.69it/s]

# Compute annotation significance with the hypergeometric test on Louvain clusters
# Alternative to the permutation test over the same inputs; `stats_hypergeom` is
# not referenced again in the visible part of this file.

stats_hypergeom = risk.run_hypergeom(
    annotation=annotation,
    clusters=clusters_louvain,
    null_distribution="network",
)

---------------------------
Running hypergeometric test
---------------------------
Null distribution: 'network'

# Compute annotation significance with the chi-squared test on Louvain clusters
# Alternative to the permutation test over the same inputs; `stats_chi2` is not
# referenced again in the visible part of this file.

stats_chi2 = risk.run_chi2(
    annotation=annotation,
    clusters=clusters_louvain,
    null_distribution="network",
)

------------------------
Running chi-squared test
------------------------
Null distribution: 'network'

# Compute annotation significance with the binomial test on Louvain clusters
# Alternative to the permutation test over the same inputs; `stats_binom` is not
# referenced again in the visible part of this file.

stats_binom = risk.run_binom(
    annotation=annotation,
    clusters=clusters_louvain,
    null_distribution="network",
)

---------------------
Running binomial test
---------------------
Null distribution: 'network'

# Build a NetworkGraph using permutation-based significance results
# Combines `network`, `annotation` and `stats_permutation` from earlier cells; the
# result is bound to `graph`, which the summary, attribute and plotting cells use.
# tail="right" is logged as the enrichment tail in the recorded output.
# NOTE(review): fdr_cutoff=1.00 presumably leaves FDR filtering effectively
# disabled, so only pval_cutoff=0.05 restricts significance — confirm this is intended.

graph = risk.load_graph(
    network=network,
    annotation=annotation,
    stats_results=stats_permutation,
    tail="right",
    pval_cutoff=0.05,
    fdr_cutoff=1.00,
    display_prune_threshold=0.125,
    linkage_criterion="distance",
    linkage_method="single",
    linkage_metric="sokalmichener",
    linkage_threshold=0.063,
    min_cluster_size=5,
    max_cluster_size=1_000,
)

----------------------------
Finding significant clusters
----------------------------
p-value cutoff: 0.05
FDR BH cutoff: 1.0
Significance tail: 'right' (enrichment)
-------------------------------
Processing significant clusters
-------------------------------
Display prune threshold: 0.125
-----------------------
Finding top annotations
-----------------------
Min cluster size: 5
Max cluster size: 1000
------------------------------
Grouping clusters into domains
------------------------------

Evaluating linkage methods and metrics: 100%|██████████████████| 1/1 [00:00<00:00]

Linkage criterion: 'distance'
Linkage method: 'single'
Linkage metric: 'sokalmichener'
Linkage threshold: 0.063

# Remove every reference to Domain ID 1 from the NetworkGraph instance and retrieve the associated node labels

# domain_1_labels =  graph.pop(1)

# Fetching key NetworkGraph attributes from the graph object
# Each line binds a notebook-level name to the attribute of the same name on
# `graph`; none of these names is referenced again in the visible part of this file.

# Domain-keyed lookups
domain_id_to_node_ids_map = graph.domain_id_to_node_ids_map
domain_id_to_node_labels_map = graph.domain_id_to_node_labels_map
domain_id_to_enriched_node_labels_map = graph.domain_id_to_enriched_node_labels_map
domain_id_to_domain_terms_map = graph.domain_id_to_domain_terms_map
domain_id_to_domain_info_map = graph.domain_id_to_domain_info_map

# Node-keyed lookups
node_id_to_node_label_map = graph.node_id_to_node_label_map
node_label_to_significance_map = graph.node_label_to_significance_map
node_label_to_node_id_map = graph.node_label_to_node_id_map

# Per-node significance totals (exact layout not visible here)
node_significance_sums = graph.node_significance_sums

# Load the analysis summary into a DataFrame
# head() is the cell's last expression, so the notebook renders its result (the
# first rows of the summary table) as the cell output.

loaded_summary = graph.summary.load()
loaded_summary.head()

------------------------
Loading analysis summary
------------------------

# Export analysis summary to a CSV file
# Called on `graph.summary` directly; the recorded output shows the summary being
# loaded again as part of the export, so `loaded_summary` is not required here.

graph.summary.to_csv(filepath="./data/csv/summary/michaelis_2023.csv")

------------------------
Loading analysis summary
------------------------
Analysis summary exported to CSV file: ./data/csv/summary/michaelis_2023.csv

# Export analysis summary to a JSON file
# Called on `graph.summary` directly; the recorded output shows the summary being
# loaded again as part of the export, so `loaded_summary` is not required here.

graph.summary.to_json(filepath="./data/json/summary/michaelis_2023.json")

------------------------
Loading analysis summary
------------------------
Analysis summary exported to JSON file: ./data/json/summary/michaelis_2023.json

# Export analysis summary to a text file
# Called on `graph.summary` directly; the recorded output shows the summary being
# loaded again as part of the export, so `loaded_summary` is not required here.

graph.summary.to_txt(filepath="./data/txt/summary/michaelis_2023.txt")

------------------------
Loading analysis summary
------------------------
Analysis summary exported to text file: ./data/txt/summary/michaelis_2023.txt

# Turn interactive plotting off - this enables the graph to be built across multiple cells
# plt.ioff() is the cell's last expression, so the notebook echoes its return
# value (the recorded `<contextlib.ExitStack ...>` line); that echo is harmless.

import matplotlib.pyplot as plt

plt.ioff()

<contextlib.ExitStack at 0x32b212570>

# Initialize the NetworkPlotter with the NetworkGraph object
# Requires `graph` from the load_graph cell; the result is bound to `plotter`,
# on which every plot_* call in the following cells is made.

plotter = risk.load_plotter(
    graph=graph,
    figsize=(15, 15),
    background_color="black",
    background_alpha=1.0,
    pad=0.3,
)

# Set random seed for reproducibility
# Passed as `random_seed=` to the plotter.get_annotated_*_colors calls below.
random_seed = 887

---------------
Loading plotter
---------------

# Plot network title and subtitle
# Called for its effect on `plotter`; the return value is not captured.
# title_x / title_y are presumably figure-relative coordinates — TODO confirm.

plotter.plot_title(
    title="Yeast PPI Network",
    subtitle="Michaelis et al., 2023",
    title_fontsize=24,
    subtitle_fontsize=18,
    font="DejaVu Sans",
    title_color="white",
    subtitle_color="lightblue",
    title_x=0.5,
    title_y=0.925,
    title_space_offset=0.08,
    subtitle_offset=0.025,
)

# Plot network perimeter as a circle
# fill_alpha=0.0 with outline_alpha=1.0 requests an opaque outline and a fully
# transparent fill. Called for its effect on `plotter`; nothing is captured.

plotter.plot_circle_perimeter(
    scale=1.02,
    center_offset_x=0.0,
    center_offset_y=0.0,
    linestyle="solid",
    linewidth=1.5,
    color="white",
    outline_alpha=1.0,
    fill_alpha=0.0,
)

# Draw a KDE-based contour around the network perimeter
# This step-by-step walkthrough draws both the circle and the contour perimeter
# on the same plotter; the combined single-cell example later in this file draws
# only the circle.

plotter.plot_contour_perimeter(
    scale=1.02,
    levels=3,
    bandwidth=0.6,
    grid_size=250,
    color="white",
    linestyle="solid",
    linewidth=1.5,
    outline_alpha=1.0,
    fill_alpha=0.0,
)

# Plot network nodes and edges
# node_size and node_color are not literals: both come from helper methods on
# `plotter`, evaluated before plot_network itself runs.
# Needs `random_seed` from the load_plotter cell.

plotter.plot_network(
    node_size=plotter.get_annotated_node_sizes(
        significant_size=225,
        nonsignificant_size=12.5,
    ),
    node_shape="o",
    node_edgewidth=1.0,
    edge_width=0.03,
    node_color=plotter.get_annotated_node_colors(
        cmap="gist_rainbow",
        color=None,
        blend_colors=False,
        blend_gamma=2.2,
        min_scale=1.0,
        max_scale=1.0,
        scale_factor=0.5,
        alpha=1.0,
        nonsignificant_color="white",
        nonsignificant_alpha=0.75,
        # Explicit colour overrides for IDs 10 and 32 (presumably domain IDs —
        # TODO confirm); the contour and label cells pass the same overrides.
        ids_to_colors={
            10: "#f200ff",
            32: "#fcec00",
        },
        random_seed=random_seed,
    ),
    node_edgecolor="black",
    edge_color="white",
    node_alpha=1.0,
    edge_alpha=1.0,
)

# Highlight a chosen set of nodes (LSM1 through LSM7 plus PAT1) with their own
# marker shape, colours and edge width

lsm_pat1_nodes = [f"LSM{i}" for i in range(1, 8)] + ["PAT1"]

plotter.plot_subnetwork(
    nodes=lsm_pat1_nodes,
    node_size=225,
    node_shape="^",
    node_edgewidth=1.0,
    edge_width=0.04,
    node_color="white",
    node_edgecolor="black",
    edge_color="white",
    node_alpha=1.0,
    edge_alpha=1.0,
)

# Plot KDE-based contours around network nodes
# The contour colours come from plotter.get_annotated_contour_colors, called with
# the same cmap, scale settings, ID overrides and random_seed as the node-colour
# call in the plot_network cell. Needs `random_seed` from the load_plotter cell.

plotter.plot_contours(
    levels=5,
    bandwidth=0.8,
    grid_size=250,
    color=plotter.get_annotated_contour_colors(
        cmap="gist_rainbow",
        color=None,
        blend_colors=False,
        blend_gamma=2.2,
        min_scale=1.0,
        max_scale=1.0,
        scale_factor=0.5,
        ids_to_colors={
            10: "#f200ff",
            32: "#fcec00",
        },
        random_seed=random_seed,
    ),
    linestyle="solid",
    linewidth=2.0,
    alpha=1.0,
    fill_alpha=0.25,
)

# Draw a separate white KDE contour around a chosen set of nodes (LSM1 through
# LSM7 plus PAT1)

lsm_pat1_nodes = [f"LSM{i}" for i in range(1, 8)] + ["PAT1"]

plotter.plot_subcontour(
    nodes=lsm_pat1_nodes,
    levels=5,
    bandwidth=0.8,
    grid_size=250,
    color="white",
    linestyle="solid",
    linewidth=2.0,
    alpha=1.0,
    fill_alpha=0.25,
)

# Plot labels on the network
# Label text is plain white; only the arrow colour comes from
# plotter.get_annotated_label_colors, called with the same cmap, scale settings,
# ID overrides and random_seed as the node and contour colour calls.
# Needs `random_seed` from the load_plotter cell.

plotter.plot_labels(
    scale=1.1,
    offset=0.12,
    font="DejaVu Sans",
    fontcase={"title": "lower"},
    fontsize=15,
    fontcolor="white",
    fontalpha=1.0,
    arrow_linewidth=2.0,
    arrow_style="-",
    arrow_color=plotter.get_annotated_label_colors(
        cmap="gist_rainbow",
        color=None,
        blend_colors=False,
        blend_gamma=2.2,
        min_scale=1.0,
        max_scale=1.0,
        scale_factor=0.5,
        ids_to_colors={
            10: "#f200ff",
            32: "#fcec00",
        },
        random_seed=random_seed,
    ),
    arrow_alpha=1.0,
    arrow_base_shrink=10.0,
    arrow_tip_shrink=0.0,
    max_labels=28,
    min_label_lines=3,
    max_label_lines=4,
    min_chars_per_line=3,
    max_chars_per_line=12,
    # Filler words presumably dropped from the generated label text — TODO confirm
    words_to_omit=["from", "the", "into", "via", "novo", "process", "activity"],
    overlay_ids=False,
    ids_to_keep=None,
    ids_to_labels=None,
)

# Attach one custom text label, with a white arrow, to a chosen set of nodes
# (LSM1 through LSM7 plus PAT1)

lsm_pat1_nodes = [f"LSM{i}" for i in range(1, 8)] + ["PAT1"]

plotter.plot_sublabel(
    nodes=lsm_pat1_nodes,
    label="LSM1-7-PAT1 Complex",
    radial_position=73,
    scale=1.6,
    offset=0.12,
    font="DejaVu Sans",
    fontsize=15,
    fontcolor="white",
    fontalpha=1.0,
    arrow_linewidth=2.0,
    arrow_style="-",
    arrow_color="white",
    arrow_alpha=1.0,
    arrow_base_shrink=10.0,
    arrow_tip_shrink=0.0,
)

# Save the plot to a file

# plotter.savefig("network_plot.png", pad_inches=0.5, dpi=100)

# Display the plot
# Final step of the walkthrough: shows whatever the preceding plot_* cells have
# drawn on `plotter`.

plotter.show()

# Complete plotting example in a single cell: build a plotter from `graph`, then
# add title, circular perimeter, network, LSM1-7/PAT1 highlights, contours and
# labels, and finally show the figure.

# Seed handed to every annotated-colour helper so colours are reproducible
random_seed = 887

# Nodes highlighted as a subnetwork, a sub-contour and a sub-label
lsm_pat1_nodes = tuple(f"LSM{i}" for i in range(1, 8)) + ("PAT1",)


def _annotated_color_kwargs():
    """Return a fresh copy of the colour settings shared by the node, contour and label-arrow helpers."""
    return {
        "cmap": "gist_rainbow",
        "color": None,
        "blend_colors": False,
        "blend_gamma": 2.2,
        "min_scale": 1.0,
        "max_scale": 1.0,
        "scale_factor": 0.5,
        "ids_to_colors": {10: "#f200ff", 32: "#fcec00"},
        "random_seed": random_seed,
    }


# Plotter bound to the NetworkGraph
plotter = risk.load_plotter(graph=graph, figsize=(15, 15), background_color="black")

# Title and subtitle
plotter.plot_title(
    title="Yeast PPI Network",
    subtitle="Michaelis et al., 2023",
    title_fontsize=24,
    subtitle_fontsize=18,
    font="DejaVu Sans",
    title_color="white",
    subtitle_color="lightblue",
    title_x=0.5,
    title_y=0.925,
    title_space_offset=0.08,
    subtitle_offset=0.025,
)

# Circular perimeter: opaque white outline, transparent fill
plotter.plot_circle_perimeter(
    scale=1.02,
    center_offset_x=0.0,
    center_offset_y=0.0,
    linestyle="solid",
    linewidth=1.5,
    color="white",
    outline_alpha=1.0,
    fill_alpha=0.0,
)

# Nodes and edges; sizes are computed first, then colours, as before
annotated_node_sizes = plotter.get_annotated_node_sizes(
    significant_size=225,
    nonsignificant_size=12.5,
)
annotated_node_colors = plotter.get_annotated_node_colors(
    alpha=1.0,
    nonsignificant_color="white",
    nonsignificant_alpha=0.75,
    **_annotated_color_kwargs(),
)
plotter.plot_network(
    node_size=annotated_node_sizes,
    node_shape="o",
    node_edgewidth=1.0,
    edge_width=0.03,
    node_color=annotated_node_colors,
    node_edgecolor="black",
    edge_color="white",
    node_alpha=1.0,
    edge_alpha=1.0,
)

# Highlighted subnetwork with its own marker and edge styling
plotter.plot_subnetwork(
    nodes=list(lsm_pat1_nodes),
    node_size=225,
    node_shape="^",
    node_edgewidth=1.0,
    edge_width=0.04,
    node_color="white",
    node_edgecolor="black",
    edge_color="white",
    node_alpha=1.0,
    edge_alpha=1.0,
)

# KDE-based contours coloured with the shared annotated-colour settings
annotated_contour_colors = plotter.get_annotated_contour_colors(**_annotated_color_kwargs())
plotter.plot_contours(
    levels=5,
    bandwidth=0.8,
    grid_size=250,
    color=annotated_contour_colors,
    linestyle="solid",
    linewidth=2.0,
    alpha=1.0,
    fill_alpha=0.25,
)

# White KDE contour around the highlighted nodes only
plotter.plot_subcontour(
    nodes=list(lsm_pat1_nodes),
    levels=5,
    bandwidth=0.8,
    grid_size=250,
    color="white",
    linestyle="solid",
    linewidth=2.0,
    alpha=1.0,
    fill_alpha=0.25,
)

# Labels: white text, arrows coloured with the shared annotated-colour settings
annotated_arrow_colors = plotter.get_annotated_label_colors(**_annotated_color_kwargs())
plotter.plot_labels(
    scale=1.1,
    offset=0.12,
    font="DejaVu Sans",
    fontcase={"title": "lower"},
    fontsize=15,
    fontcolor="white",
    fontalpha=1.0,
    arrow_linewidth=2.0,
    arrow_style="-",
    arrow_color=annotated_arrow_colors,
    arrow_alpha=1.0,
    arrow_base_shrink=10.0,
    arrow_tip_shrink=0.0,
    max_labels=28,
    min_label_lines=3,
    max_label_lines=4,
    min_chars_per_line=3,
    max_chars_per_line=12,
    words_to_omit=["from", "the", "into", "via", "novo", "process", "activity"],
    overlay_ids=False,
    ids_to_keep=None,
    ids_to_labels=None,
)

# Custom label for the highlighted nodes
plotter.plot_sublabel(
    nodes=list(lsm_pat1_nodes),
    label="LSM1-7-PAT1 Complex",
    radial_position=73,
    scale=1.6,
    offset=0.12,
    font="DejaVu Sans",
    fontsize=15,
    fontcolor="white",
    fontalpha=1.0,
    arrow_linewidth=2.0,
    arrow_style="-",
    arrow_color="white",
    arrow_alpha=1.0,
    arrow_base_shrink=10.0,
    arrow_tip_shrink=0.0,
)

# Render the finished figure
plotter.show()

---------------
Loading plotter
---------------

import pandas as pd
from IPython.display import display

# Load the parameters into a dictionary
loaded_params = risk.params.load()

# Display parameters in a tidy table for Jupyter documentation purposes
# This is intended for clarity in notebook examples, not for full inspection of nested fields
# option_context widens the column only for this display and then restores the
# previous setting (rather than the pandas default), even if display() raises.
with pd.option_context("display.max_colwidth", 200):
    display(pd.DataFrame(list(loaded_params.items()), columns=["Parameter", "Value"]))

------------------
Loading parameters
------------------

# Export parameters to a CSV file
# Called on `risk.params` directly; the recorded output shows the parameters being
# loaded again as part of the export, so `loaded_params` is not required here.

risk.params.to_csv(filepath="./data/csv/params/michaelis_2023.csv")

------------------
Loading parameters
------------------
Parameters exported to CSV file: ./data/csv/params/michaelis_2023.csv

# Export parameters to a JSON file
# Called on `risk.params` directly; the recorded output shows the parameters being
# loaded again as part of the export, so `loaded_params` is not required here.

risk.params.to_json(filepath="./data/json/params/michaelis_2023.json")

------------------
Loading parameters
------------------
Parameters exported to JSON file: ./data/json/params/michaelis_2023.json

# Export parameters to a text file
# Called on `risk.params` directly; the recorded output shows the parameters being
# loaded again as part of the export, so `loaded_params` is not required here.

risk.params.to_txt(filepath="./data/txt/params/michaelis_2023.txt")

------------------
Loading parameters
------------------
Parameters exported to text file: ./data/txt/params/michaelis_2023.txt

Format	Method	Description
Cytoscape (`.cys`)	`load_network_cytoscape`	Import from Cytoscape session files; supports source/target labels and view selection.
Cytoscape JSON (`.cyjs`)	`load_network_cyjs`	Import from Cytoscape JSON exports; specify source/target labels for nodes/edges.
GPickle (`.gpickle`)	`load_network_gpickle`	Reload networks serialized with GPickle; preserves complex structures.
NetworkX Graph	`load_network_networkx`	Convert existing NetworkX objects into RISK-compatible format.

Format	Method	Description
JSON	`load_annotation_json`	Import annotations from a JSON term–to–gene mapping file.
CSV	`load_annotation_csv`	Import from a CSV file (supports custom delimiters).
TSV	`load_annotation_tsv`	Import from a tab-separated file.
Excel	`load_annotation_excel`	Import annotations from a specified sheet in an Excel file (`.xlsx` or `.xls`).

Algorithm	Speed	Primary use	When/Why (assumptions & notes)
Louvain	Fast	Default, scalable to very large networks	Greedy modularity optimization (Blondel et al., 2008); efficient for >10⁴ nodes; may produce disconnected subclusters.
Leiden	Fast	Improved Louvain with better resolution	Guarantees well-connected communities; more stable than Louvain (Traag et al., 2019); slightly higher runtime.
Markov Clustering	Medium	Detect smaller, compact complexes	Flow-based algorithm (Van Dongen, 2008); good for protein complexes or tightly connected submodules.
Walktrap	Medium	Hierarchical detection in mid-sized graphs	Random-walk based (Pons & Latapy, 2005); effective for local structure; slower on >10⁴ nodes.
Greedy Modularity	Fast	Coarse partitioning	Optimizes modularity via agglomeration; very fast but suffers from resolution limit (Newman, 2004).
Label Propagation	Fast	Quick heuristic	Unsupervised label spreading; no objective function; non-deterministic and unstable (Raghavan et al., 2007).
Spinglass	Slow	Small networks; theoretical interest	Statistical mechanics approach (Reichardt & Bornholdt, 2006); finds communities by simulating spin states; computationally intensive.

Test	Speed	Primary use	When/Why (assumptions & notes)
Permutation	Slow	Most rigorous; non-parametric	Distribution-free empirical null (permute network or labels); preferred when assumptions are unclear; computationally intensive.
Hypergeometric	Medium	Standard for GO/pathway overrepresentation	Exact test for finite populations sampled without replacement; widely used for term–to–gene membership tables.
Chi-squared	Fast	Approximate contingency-table testing	Suitable for large samples with expected counts ≥ 5 per cell; fast but approximate; avoid with sparse/low counts.
Binomial	Fast	Scalable approximation	Fast approximation assuming independent trials/with-replacement; useful for large populations with small samples.

	Annotation	Domain ID	Matched Members	Matched Count	Enrichment P-value	Enrichment Q-value	Depletion P-value	Depletion Q-value
0	maintenance of protein location in cell	-1		0	1.000	1.000000	1.0	1.0
1	mRNA splice site recognition	20	CDC40;ISY1;LUC7;NAM8;PRP28;PRP39;PRP42;PRP8;PR...	11	0.001	0.184714	1.0	1.0
2	transsulfuration	-1		0	1.000	1.000000	1.0	1.0
3	signal peptide processing	-1		0	1.000	1.000000	1.0	1.0
4	regulation of phosphatidylinositol dephosphory...	-1		0	1.000	1.000000	1.0	1.0

	Parameter	Value
0	annotation	{'filetype': 'JSON', 'filepath': './data/json/annotation/go_biological_process.json', 'min_nodes_per_term': 5, 'max_nodes_per_term': 75}
1	datetime	2026-01-14 12:34:18
2	graph	{'tail': 'right', 'pval_cutoff': 0.05, 'fdr_cutoff': 1.0, 'display_prune_threshold': 0.125, 'linkage_criterion': 'distance', 'linkage_method': 'single', 'linkage_metric': 'sokalmichener', 'linkage...
3	clusters	{'clustering': 'louvain', 'fraction_shortest_edges': 0.25, 'resolution': 5.0, 'random_seed': 887}
4	network	{'compute_sphere': True, 'surface_depth': 0.1, 'min_edges_per_node': 1, 'filetype': 'Cytoscape', 'filepath': './data/cytoscape/michaelis_2023.cys'}
5	plotter	{'figsize': (15, 15), 'background_color': 'black', 'background_alpha': 1.0, 'pad': 0.3, 'title': 'Yeast PPI Network', 'subtitle': 'Michaelis et al., 2023', 'title_fontsize': 24, 'subtitle_fontsize...

RISK Tutorial and Examples¶

Yeast Protein–Protein Interaction (PPI) Network Demonstration¶

Tutorial Sections¶

0. Installing RISK¶

1. Importing RISK¶

2. Initializing RISK¶

Parameters¶

3. Loading Networks into RISK¶

Supported Network Formats¶

Cytoscape Files (.cys)¶

Parameters¶

Returns¶

Cytoscape JSON Files (.cyjs)¶

Parameters¶

Returns¶

GPickle Files (.gpickle)¶

Parameters¶

Returns¶

NetworkX Graphs¶

Parameters¶

Returns¶

4. Loading Annotations into RISK¶

Supported Annotation Formats¶

JSON Files (.json)¶

Parameters¶

Returns¶

CSV Files (.csv)¶

Parameters¶

Returns¶

TSV Files (.tsv)¶

Parameters¶

Returns¶

Excel Files (.xlsx, .xls)¶

Parameters¶

Returns¶

Dictionary Annotation¶

Parameters¶

Returns¶

5. Clustering Algorithms¶

Louvain Clustering¶

Leiden Clustering¶

Greedy Modularity Clustering¶

Label Propagation Clustering¶

Markov Clustering (MCL)¶

Walktrap Clustering¶

Spinglass Clustering¶

6. Statistical Methods¶

Permutation Test¶

Parameters¶

Returns¶

Hypergeometric Test¶

Parameters¶

Returns¶

Chi-squared Test¶

Parameters¶

Returns¶

Binomial Test¶

Parameters¶

Returns¶

7. Building and Analyzing Results¶

Parameters¶

Returns¶

7a. NetworkGraph Methods¶

7b. NetworkGraph Attributes¶

7c. NetworkGraph Analysis Summary¶

Loading Results¶

Returns¶

Exporting Analysis Summary to CSV¶

Parameters¶

Exporting Analysis Summary to JSON¶

Parameters¶

Exporting Analysis Summary to Text¶

Parameters¶

8. Visualizing Networks in RISK¶

Parameters¶

Returns¶

8a. Plotting the Network Title and Subtitle¶

Plotting the Title and Subtitle¶

Parameters¶

8b. Plotting the Network Perimeter¶

Annotated Node Size Parameters (for param `node_size`)¶

Annotated Node Color Parameters (for param `node_color`)¶

Annotated Contour Color Parameters (for param `color`)¶

Annotated Label Color Parameters (for params `fontcolor` and `arrow_color`)¶

9. Overview of `risk.params`¶