AnnNet Introduction - Multilayer Network Analysis in Systems Biology

In [ ]:

Copied!





# 1. Setup & Initialization

# Standard library
import os
import sys
from collections import defaultdict

# Third-party
import numpy as np
import polars as pl
from scipy.sparse.linalg import eigsh

# visualization
import matplotlib.pyplot as plt

# Put the parent directory first on sys.path before importing annnet
# (presumably so the local checkout is picked up - confirm). The insert must
# stay ahead of the annnet import below.
sys.path.insert(0, os.path.abspath('..'))
from annnet.core.graph import AnnNet

In [ ]:

Copied!





# Report which optional dataframe backends can be imported in this environment.
# The import has to live inside the ``try``: without it nothing in the body can
# raise, and the "available" branch would be printed unconditionally.
try:
    import polars  # noqa: F401  (imported only to probe availability)

    print('polars available')
except ImportError:
    print('polars unavailable')

try:
    import pandas  # noqa: F401  (imported only to probe availability)

    print('pandas available')
except ImportError:
    print('pandas unavailable')

In [ ]:

Copied!





# 2. Initialize AnnNet with Full Configuration

# directed=None = mixed directionality allowed.
# NOTE(review): v / e look like initial vertex / edge capacities (the print
# below labels the matrix shape "capacity") - confirm against the AnnNet docs.
G = AnnNet(directed=None, v=100, e=300)

# Enable mutation history and drop a named marker for this stage
G.history.enable(True)
G.history.mark('initialization')

# Set graph-level attributes (unstructured metadata)
G.graph_attributes['name'] = 'Multi-Omic Disease Network'
G.graph_attributes['organism'] = 'Homo sapiens'
G.graph_attributes['disease_context'] = 'inflammatory_pathway'
G.graph_attributes['version'] = '1.0'

# Reads the private members _matrix and _history_enabled purely for display.
print(f'AnnNet initialized: capacity={G._matrix.shape}, history={G._history_enabled}')
print(f'AnnNet attributes: {G.graph_attributes}')

In [ ]:

Copied!





# 3. Define Multilayer Structure (Kivelä Formalism)

# Define multi-aspect structure: a single aspect, 'omic', with four
# elementary layers.
G.layers.set_aspects(
    aspects=['omic'], elem_layers={'omic': ['PPI', 'metabolic', 'regulatory', 'phenotype']}
)

# Set aspect-level metadata
G.layers.set_aspect_attrs(
    'omic',
    description='Biological interaction layer',
    data_sources=['STRING', 'KEGG', 'TRRUST', 'DisGeNET'],
)

# Set layer-level metadata. Layers are addressed by a tuple with one entry
# per aspect, hence the 1-tuples such as ('PPI',).
G.layers.set_layer_attrs(
    ('PPI',), interaction_type='physical', evidence='experimental', database='STRING'
)
G.layers.set_layer_attrs(
    ('metabolic',),
    interaction_type='enzymatic',
    pathways=['glycolysis', 'TCA', 'lipid'],
    database='KEGG',
)
G.layers.set_layer_attrs(
    ('regulatory',), interaction_type='transcriptional', direction='TF_to_target', database='TRRUST'
)
G.layers.set_layer_attrs(
    ('phenotype',), interaction_type='association', evidence='GWAS', database='DisGeNET'
)

# Show what was registered
print(f'Aspects: {G.aspects}')
print(f'Elementary layers: {G.layers.elem_layers}')
print('\n=== Aspects View ===')
print(G.aspects_view())
print('\n=== Layers View ===')
print(G.layers_view())

In [ ]:

Copied!





# 4. Create Biological Entities
#
# NOTE: several attribute values below are drawn from np.random and no seed is
# set in this cell, so they differ from run to run.

# Genes/proteins
genes = [
    'GENE_A',
    'GENE_B',
    'GENE_C',
    'GENE_D',
    'GENE_E',
    'GENE_F',
    'GENE_G',
    'GENE_H',
    'GENE_I',
    'GENE_J',
]
tfs = ['GENE_A', 'GENE_C', 'GENE_F']  # subset of genes flagged is_tf
enzymes = ['GENE_B', 'GENE_D', 'GENE_G', 'GENE_I']  # subset flagged is_enzyme

# Metabolites
metabolites = ['MET_1', 'MET_2', 'MET_3', 'MET_4', 'MET_5', 'MET_6']

# Phenotypes
phenotypes = ['inflammation', 'cell_death', 'proliferation', 'immune_response']

# Add genes with attributes
for g in genes:
    G.add_vertices(
        g,
        entity_type='gene',
        is_tf=(g in tfs),
        is_enzyme=(g in enzymes),
        chromosome=np.random.randint(1, 23),  # upper bound exclusive -> 1..22
        expression_level=np.random.uniform(0, 100),
        druggable=np.random.choice([True, False]),
        annotation_source='Ensembl',
    )

# Add metabolites; the first three are tagged 'glycolysis', the rest 'lipid'
for i, m in enumerate(metabolites):
    G.add_vertices(
        m,
        entity_type='metabolite',
        molecular_weight=100 + i * 50,
        pathway='glycolysis' if i < 3 else 'lipid',
        KEGG_id=f'C{10000 + i}',
        concentration_uM=np.random.uniform(1, 1000),
    )

# Add phenotypes
for p in phenotypes:
    G.add_vertices(
        p,
        entity_type='phenotype',
        category='disease' if p in ['inflammation', 'cell_death'] else 'process',
        MeSH_id=f'D{np.random.randint(10000, 99999)}',
        severity_score=np.random.uniform(0, 1),
    )

G.history.mark('vertices_added')
print(f'Total vertices: {G.nv}')

In [ ]:

Copied!





# 5. Vertex Attribute Views (Polars DataFrames)

# Full vertex attribute table; fetched once and reused by the filters below
vertex_df = G.views.vertices()
print('=== Complete Vertex Attributes ===')
print(vertex_df)

# Filter by entity type using Polars
print('\n=== Genes Only ===')
genes_df = vertex_df.filter(pl.col('entity_type') == 'gene')
print(genes_df)

# Keep the rows whose is_enzyme flag is set, then project three columns
print('\n=== Enzymes with Expression Levels ===')
enzymes_df = vertex_df.filter(pl.col('is_enzyme')).select(
    ['vertex_id', 'expression_level', 'druggable']
)
print(enzymes_df)

In [ ]:

Copied!





# 6. Define Layer Presence (V_M)
#
# Every vertex used here was created earlier in the file; these calls pass
# only a ``layer`` to register the vertex on that layer.

# PPI layer: all genes
for g in genes:
    G.add_vertices(g, layer=('PPI',))

# Metabolic layer: metabolites + enzymes
for m in metabolites:
    G.add_vertices(m, layer=('metabolic',))
for e in enzymes:
    G.add_vertices(e, layer=('metabolic',))

# Regulatory layer: all genes (TF -> target relationships)
for g in genes:
    G.add_vertices(g, layer=('regulatory',))

# Phenotype layer: phenotypes + disease-associated genes
for p in phenotypes:
    G.add_vertices(p, layer=('phenotype',))
for g in ['GENE_A', 'GENE_C', 'GENE_F', 'GENE_H']:
    G.add_vertices(g, layer=('phenotype',))

# Set vertex-layer specific attributes: GENE_A carries different attributes
# on each of the three layers it is annotated in.
G.set_vertex_layer_attrs('GENE_A', ('PPI',), ppi_degree=5, hub_score=0.9)
G.set_vertex_layer_attrs('GENE_A', ('regulatory',), n_targets=3, tf_activity=0.8)
G.set_vertex_layer_attrs('GENE_A', ('phenotype',), disease_association=0.95)

# Summary; reads the private member _VM for the total pair count
print(f'Total (vertex, layer) pairs: {len(G._VM)}')
for layer in [('PPI',), ('metabolic',), ('regulatory',), ('phenotype',)]:
    verts = G.layers.layer_vertex_set(layer)
    print(f'  {layer[0]}: {len(verts)} entities')

In [ ]:

Copied!





# 7. Build Intra-Layer Edges
#
# Binary Edge Expressiveness:
# - Weighted edges
# - Directed vs undirected; edge level and graph level; flexible directionality
# - Parallel edges
# - Self-loops
# - Edge attributes
# - Hybrid edges (edge-edge; vertex-edge)
#
# This cell must run exactly once: every add_edges call below creates a new
# edge, and the parallel-edge section uses fixed edge ids.

# === PPI Layer (UNDIRECTED, weighted) ===
# (source, target, weight) - the weight doubles as the evidence score
ppi_edges = [
    ('GENE_A', 'GENE_B', 0.9),
    ('GENE_A', 'GENE_C', 0.8),
    ('GENE_A', 'GENE_D', 0.7),
    ('GENE_A', 'GENE_E', 0.6),
    ('GENE_B', 'GENE_C', 0.5),
    ('GENE_B', 'GENE_F', 0.8),
    ('GENE_C', 'GENE_G', 0.7),
    ('GENE_D', 'GENE_H', 0.6),
    ('GENE_E', 'GENE_F', 0.5),
    ('GENE_F', 'GENE_G', 0.9),
    ('GENE_F', 'GENE_H', 0.7),
    ('GENE_G', 'GENE_I', 0.6),
    ('GENE_H', 'GENE_I', 0.8),
    ('GENE_I', 'GENE_J', 0.9),
    ('GENE_J', 'GENE_A', 0.4),
]

for src, tgt, w in ppi_edges:
    eid = G.add_edges((src, ('PPI',)), (tgt, ('PPI',)), weight=w)
    # Add edge attributes; weights strictly above 0.7 are labelled co-IP
    G.attrs.set_edge_attrs(
        eid,
        interaction_type='physical',
        evidence_score=w,
        detection_method='co-IP' if w > 0.7 else 'Y2H',
        pubmed_ids=[f'PMID{np.random.randint(10000000, 99999999)}'],  # random placeholder id
    )

# === SELF-LOOP: GENE_A homodimerization ===
self_loop_eid = G.add_edges(('GENE_A', ('PPI',)), ('GENE_A', ('PPI',)), weight=0.3)
G.attrs.set_edge_attrs(
    self_loop_eid,
    interaction_type='homodimerization',
    evidence_score=0.3,
    note='GENE_A forms homodimer',
)
print(f'Self-loop added: {self_loop_eid}')

# === PARALLEL EDGES: Multiple evidence types ===
# Two different experiments detected GENE_B - GENE_F interaction; these come on
# top of the GENE_B - GENE_F entry already present in ppi_edges.
# NOTE(review): these calls pass the id as `eid=` while the hyperedge cells in
# this file pass `edge_id=` - confirm which keyword add_edges expects.
parallel_eid_1 = G.add_edges(
    ('GENE_B', ('PPI',)), ('GENE_F', ('PPI',)), weight=0.75, eid='GENE_B--GENE_F@PPI_coIP'
)
G.attrs.set_edge_attrs(parallel_eid_1, detection_method='co-IP', experiment_id='EXP001')

parallel_eid_2 = G.add_edges(
    ('GENE_B', ('PPI',)), ('GENE_F', ('PPI',)), weight=0.65, eid='GENE_B--GENE_F@PPI_Y2H'
)
G.attrs.set_edge_attrs(parallel_eid_2, detection_method='Y2H', experiment_id='EXP002')

print(f'Parallel edges: {parallel_eid_1}, {parallel_eid_2}')

# === Metabolic Layer (UNDIRECTED for enzyme-metabolite associations) ===
metabolic_edges = [
    ('GENE_B', 'MET_1', 1.0),
    ('GENE_B', 'MET_2', 1.0),
    ('MET_1', 'MET_2', 0.8),
    ('GENE_D', 'MET_2', 1.0),
    ('GENE_D', 'MET_3', 1.0),
    ('MET_2', 'MET_3', 0.9),
    ('GENE_G', 'MET_3', 1.0),
    ('GENE_G', 'MET_4', 1.0),
    ('MET_3', 'MET_4', 0.7),
    ('GENE_I', 'MET_4', 1.0),
    ('GENE_I', 'MET_5', 1.0),
    ('GENE_I', 'MET_6', 1.0),
    ('MET_4', 'MET_5', 0.6),
    ('MET_5', 'MET_6', 0.8),
]

for src, tgt, w in metabolic_edges:
    eid = G.add_edges((src, ('metabolic',)), (tgt, ('metabolic',)), weight=w)
    # Determine if enzyme-metabolite or metabolite-metabolite from the
    # entity_type stored on each endpoint
    src_type = G.attrs.get_vertex_attrs(src).get('entity_type')
    tgt_type = G.attrs.get_vertex_attrs(tgt).get('entity_type')
    if src_type == 'gene' or tgt_type == 'gene':
        G.attrs.set_edge_attrs(eid, reaction_type='catalysis', reversible=False)
    else:
        G.attrs.set_edge_attrs(eid, reaction_type='conversion', reversible=True)

# === Regulatory Layer (DIRECTED: TF -> Target) ===
# (tf, target, weight, regulation type)
regulatory_edges = [
    ('GENE_A', 'GENE_B', 0.9, 'activation'),
    ('GENE_A', 'GENE_D', 0.8, 'activation'),
    ('GENE_A', 'GENE_E', 0.7, 'activation'),
    ('GENE_C', 'GENE_F', 0.9, 'activation'),
    ('GENE_C', 'GENE_G', 0.8, 'repression'),  # repression
    ('GENE_C', 'GENE_H', 0.6, 'activation'),
    ('GENE_F', 'GENE_I', 0.9, 'activation'),
    ('GENE_F', 'GENE_J', 0.7, 'activation'),
    ('GENE_H', 'GENE_A', 0.3, 'repression'),  # negative feedback
]

for src, tgt, w, reg_type in regulatory_edges:
    # Regulatory edges are DIRECTED (the only layer here that passes directed=True)
    eid = G.add_edges((src, ('regulatory',)), (tgt, ('regulatory',)), weight=w, directed=True)
    G.attrs.set_edge_attrs(eid, regulation_type=reg_type, binding_site='promoter', confidence=w)
    # TODO: annotating these edges with a Kivelä role was planned here but is
    # not implemented in this cell.

# === Phenotype Layer (UNDIRECTED associations) ===
phenotype_edges = [
    ('GENE_A', 'inflammation', 0.9),
    ('GENE_A', 'immune_response', 0.7),
    ('GENE_C', 'cell_death', 0.8),
    ('GENE_F', 'proliferation', 0.9),
    ('GENE_F', 'inflammation', 0.5),
    ('GENE_H', 'cell_death', 0.6),
    ('GENE_H', 'immune_response', 0.4),
    ('inflammation', 'immune_response', 0.8),
    ('cell_death', 'inflammation', 0.6),
    ('proliferation', 'cell_death', 0.4),
]

for src, tgt, w in phenotype_edges:
    eid = G.add_edges((src, ('phenotype',)), (tgt, ('phenotype',)), weight=w)
    G.attrs.set_edge_attrs(
        eid,
        # gene-sourced rows are GWAS hits; phenotype-phenotype rows are comorbidities
        association_type='GWAS' if 'GENE' in src else 'comorbidity',
        p_value=10 ** (-w * 10),  # synthetic: higher weight -> smaller p-value
        odds_ratio=1 + w * 2,  # synthetic: grows linearly with the weight
    )

G.history.mark('intra_edges_added')
print(f'\nTotal edges after intra-layer: {G.ne}')
for layer in [('PPI',), ('metabolic',), ('regulatory',), ('phenotype',)]:
    edges = G.layers.layer_edge_set(layer)
    print(f'  {layer[0]}: {len(edges)} edges')

In [ ]:

Copied!





# 8. Edge Attribute Views

# Edge table including the weight and directed columns; show the first 20 rows
print('=== Edge Attributes View ===')
edges_df = G.views.edges(include_weight=True, include_directed=True)
print(edges_df.head(20))

# Filter edges by attribute using a Polars expression on the edge table
print('\n=== Regulatory Activation Edges ===')
reg_edges = G.views.edges().filter(pl.col('regulation_type') == 'activation')
print(reg_edges)

# Get edges by attribute value through the graph-level lookup helper
repression_edges = G.get_edges_by_attr('regulation_type', 'repression')
print(f'\nRepression edges: {repression_edges}')

In [ ]:

Copied!





# 9. Hyperedges: Protein Complexes (Undirected)
#
# Run once: each complex is added under a fixed edge id.

# Protein complexes as undirected hyperedges
complexes = [
    {
        'name': 'TF_complex_A',
        'members': ['GENE_A', 'GENE_B', 'GENE_C'],
        'function': 'transcription_initiation',
    },
    {
        'name': 'signaling_hub',
        'members': ['GENE_F', 'GENE_G', 'GENE_H', 'GENE_I'],
        'function': 'signal_transduction',
    },
    {
        'name': 'metabolic_complex',
        'members': ['GENE_B', 'GENE_D', 'MET_2'],
        'function': 'metabolon',
    },
]

for cplx in complexes:
    # Keep only members the graph knows about; skip complexes left with
    # fewer than two members.
    valid_members = [m for m in cplx['members'] if m in G.entity_to_idx]
    if len(valid_members) >= 2:
        heid = G.add_edges(
            src=valid_members, edge_id=f'complex_{cplx["name"]}', directed=False, weight=1.0
        )
        G.attrs.set_edge_attrs(
            heid,
            complex_name=cplx['name'],
            function=cplx['function'],
            n_subunits=len(valid_members),
            # Equimolar placeholder with one "1" per member, so the ratio always
            # has n_subunits terms (signaling_hub has four members, not three).
            stoichiometry=':'.join(['1'] * len(valid_members)),
        )
        print(f'Added hyperedge: {heid} with {len(valid_members)} members')

print(f'\nHyperedge definitions: {G.hyperedge_definitions}')

In [ ]:

Copied!





# 10. Hyperedges: Multi-Substrate Reactions (Directed)
#
# Run once: each reaction is added under a fixed edge id.

# Directed hyperedges for metabolic reactions
# head = substrates/enzymes, tail = products
# (in this cell 'head' is passed as src and 'tail' as tgt)

directed_reactions = [
    {
        'name': 'glycolysis_step1',
        'head': ['MET_1', 'GENE_B'],  # substrate + enzyme
        'tail': ['MET_2'],  # product
        'stoich': {'MET_1': -1, 'MET_2': 1},
    },
    {
        'name': 'glycolysis_step2',
        'head': ['MET_2', 'GENE_D'],
        'tail': ['MET_3'],
        'stoich': {'MET_2': -1, 'MET_3': 1},
    },
    {
        'name': 'branch_point',
        'head': ['MET_3', 'GENE_G'],
        'tail': ['MET_4', 'MET_5'],  # two products
        'stoich': {'MET_3': -1, 'MET_4': 0.5, 'MET_5': 0.5},
    },
]

for rxn in directed_reactions:
    # Drop any participant the graph does not know about
    valid_head = [h for h in rxn['head'] if h in G.entity_to_idx]
    valid_tail = [t for t in rxn['tail'] if t in G.entity_to_idx]

    # A reaction needs at least one participant on each side
    if valid_head and valid_tail:
        heid = G.add_edges(
            src=valid_head, tgt=valid_tail, edge_id=f'rxn_{rxn["name"]}', directed=True, weight=1.0
        )
        G.attrs.set_edge_attrs(
            heid,
            reaction_name=rxn['name'],
            EC_number=f'EC:1.1.1.{np.random.randint(1, 100)}',  # random placeholder
            delta_G=-np.random.uniform(5, 30),  # random, always negative
        )
        # Set stoichiometric coefficients: negative for consumed metabolites,
        # positive for produced ones; the enzyme genes have no entry.
        G.set_hyperedge_coeffs(heid, rxn['stoich'])
        print(f'Added directed hyperedge: {heid}')

G.history.mark('hyperedges_added')

In [ ]:

Copied!





import annnet.adapters.networkx_adapter as anx
import networkx as nx

# Convert G to a NetworkX graph for a quick visual check. Hyperedges are
# skipped here; per the inline note the other modes are 'expand' and 'reify'.
# NOTE(review): this was described as a "simple NX view" with Multi* edges
# collapsed, but no such option is passed to to_nx - confirm which graph class
# it returns, because the weight labels below are keyed per edge.
nxG, manifest = anx.to_nx(G, directed=True, hyperedge_mode='skip')  # skip, expand or reify
pos = nx.spring_layout(nxG, seed=42)  # fixed seed -> same layout on every run
plt.figure(figsize=(6, 4))
nx.draw(nxG, pos, with_labels=True, node_size=800)
# Label each drawn edge with its 'weight' attribute
nx.draw_networkx_edge_labels(nxG, pos, edge_labels=nx.get_edge_attributes(nxG, 'weight'))
plt.title('Demo graph (simple NX view)')
plt.show()

In [ ]:

Copied!

from annnet.utils import plotting

# Render G with AnnNet's own plotting helper, using its default settings
plotting.plot(G)

In [ ]:

Copied!

from annnet.io.cx2 import show_cx2

show_cx2(G, hyperedges='reify')
from annnet.io.cx2 import show_cx2

# Display G through the CX2 helper.
# NOTE(review): hyperedges='reify' presumably turns each hyperedge into its own node — confirm.
show_cx2(G, hyperedges='reify')

In [ ]:

Copied!





# 1. Edge Entities (Reactions as Nodes, as_entity=True)

# Reactions that are registered as edge entities so that other edges can
# attach to them: (edge id, catalysing enzyme, pathway).
reaction_entities = [
    {'id': reaction_id, 'enzyme': enzyme_id, 'pathway': pathway_name}
    for reaction_id, enzyme_id, pathway_name in (
        ('RXN_glycolysis_1', 'GENE_B', 'glycolysis'),
        ('RXN_glycolysis_2', 'GENE_D', 'glycolysis'),
        ('RXN_lipid_1', 'GENE_G', 'lipid'),
    )
]

for entity in reaction_entities:
    G.add_edges(
        edge_id=entity['id'],
        entity_type='reaction',
        enzyme=entity['enzyme'],
        pathway=entity['pathway'],
        as_entity=True,
    )

# Vertex-edge links, added in this order:
#   MET_1 -> RXN_glycolysis_1 -> MET_2   (substrate / product)
#   GENE_B -> RXN_glycolysis_1           (catalyst)
#   RXN_glycolysis_1 -> RXN_glycolysis_2 (reaction chaining)
reaction_links = (
    ('MET_1', 'RXN_glycolysis_1', 'substrate'),
    ('RXN_glycolysis_1', 'MET_2', 'product'),
    ('GENE_B', 'RXN_glycolysis_1', 'catalyzes'),
    ('RXN_glycolysis_1', 'RXN_glycolysis_2', 'feeds_into'),
)
for link_source, link_target, link_relation in reaction_links:
    G.add_edges(
        link_source,
        link_target,
        edge_type='vertex_edge',
        weight=1.0,
        relation=link_relation,
        as_entity=True,
    )

# Report every entity whose registered type is "edge", then checkpoint.
# print() accepts only its own keywords (sep, end, file, flush); the stray
# as_entity=True that used to be passed here raised a TypeError.
edge_entity_ids = [e for e, t in G.entity_types.items() if t == "edge"]
print(f'Edge entities: {edge_entity_ids}')
G.history.mark('edge_entities_added')
# 1. Edge Entities (Reactions as Nodes, as_entity=True)

# Reactions that are registered as edge entities so that other edges can
# attach to them: (edge id, catalysing enzyme, pathway).
reaction_entities = [
    {'id': reaction_id, 'enzyme': enzyme_id, 'pathway': pathway_name}
    for reaction_id, enzyme_id, pathway_name in (
        ('RXN_glycolysis_1', 'GENE_B', 'glycolysis'),
        ('RXN_glycolysis_2', 'GENE_D', 'glycolysis'),
        ('RXN_lipid_1', 'GENE_G', 'lipid'),
    )
]

for entity in reaction_entities:
    G.add_edges(
        edge_id=entity['id'],
        entity_type='reaction',
        enzyme=entity['enzyme'],
        pathway=entity['pathway'],
        as_entity=True,
    )

# Vertex-edge links, added in this order:
#   MET_1 -> RXN_glycolysis_1 -> MET_2   (substrate / product)
#   GENE_B -> RXN_glycolysis_1           (catalyst)
#   RXN_glycolysis_1 -> RXN_glycolysis_2 (reaction chaining)
reaction_links = (
    ('MET_1', 'RXN_glycolysis_1', 'substrate'),
    ('RXN_glycolysis_1', 'MET_2', 'product'),
    ('GENE_B', 'RXN_glycolysis_1', 'catalyzes'),
    ('RXN_glycolysis_1', 'RXN_glycolysis_2', 'feeds_into'),
)
for link_source, link_target, link_relation in reaction_links:
    G.add_edges(
        link_source,
        link_target,
        edge_type='vertex_edge',
        weight=1.0,
        relation=link_relation,
        as_entity=True,
    )

# Report every entity whose registered type is "edge", then checkpoint.
# print() accepts only its own keywords (sep, end, file, flush); the stray
# as_entity=True that used to be passed here raised a TypeError.
edge_entity_ids = [e for e, t in G.entity_types.items() if t == "edge"]
print(f'Edge entities: {edge_entity_ids}')
G.history.mark('edge_entities_added')

In [ ]:

Copied!





# 2. Inter-Layer Coupling Edges

omega = 1.0  # coupling strength

disease_genes = ['GENE_A', 'GENE_C', 'GENE_F', 'GENE_H']

# Each row links the same vertex across two layers: (vertices, layer_a, layer_b).
# Rows are processed top to bottom, so edges are created in this order.
coupling_plan = [
    (genes, 'PPI', 'regulatory'),  # all genes
    (enzymes, 'PPI', 'metabolic'),  # enzymes only
    (enzymes, 'regulatory', 'metabolic'),  # enzymes only
    (disease_genes, 'PPI', 'phenotype'),  # disease genes
    (disease_genes, 'regulatory', 'phenotype'),  # disease genes
]
for members, layer_a, layer_b in coupling_plan:
    for vertex in members:
        G.add_edges((vertex, (layer_a,)), (vertex, (layer_b,)), weight=omega)

# Edges whose recorded kind is 'coupling'.
coupling_edges = [edge_id for edge_id, kind in G.edge_kind.items() if kind == 'coupling']
print(f'Total edges after coupling: {G.ne}')
print(f'Coupling edges: {len(coupling_edges)}')
G.history.mark('coupling_edges_added')
# 2. Inter-Layer Coupling Edges

omega = 1.0  # coupling strength

disease_genes = ['GENE_A', 'GENE_C', 'GENE_F', 'GENE_H']

# Each row links the same vertex across two layers: (vertices, layer_a, layer_b).
# Rows are processed top to bottom, so edges are created in this order.
coupling_plan = [
    (genes, 'PPI', 'regulatory'),  # all genes
    (enzymes, 'PPI', 'metabolic'),  # enzymes only
    (enzymes, 'regulatory', 'metabolic'),  # enzymes only
    (disease_genes, 'PPI', 'phenotype'),  # disease genes
    (disease_genes, 'regulatory', 'phenotype'),  # disease genes
]
for members, layer_a, layer_b in coupling_plan:
    for vertex in members:
        G.add_edges((vertex, (layer_a,)), (vertex, (layer_b,)), weight=omega)

# Edges whose recorded kind is 'coupling'.
coupling_edges = [edge_id for edge_id, kind in G.edge_kind.items() if kind == 'coupling']
print(f'Total edges after coupling: {G.ne}')
print(f'Coupling edges: {len(coupling_edges)}')
G.history.mark('coupling_edges_added')

In [ ]:

Copied!





# 3. Slices: Named Subgraph Partitions

# One slice per layer, named 'layer_<layer>'.
for layer_name in ('PPI', 'metabolic', 'regulatory', 'phenotype'):
    G.layers.create_slice_from_layer(
        slice_id=f'layer_{layer_name}',
        layer_tuple=(layer_name,),
        source='layer_extraction',
        description=f'All entities in {layer_name} layer',
    )

# Functional slices: (slice id, description, member vertices).
functional_slices = (
    ('hub_genes', 'High-degree genes', ['GENE_A', 'GENE_F']),  # known hubs
    ('disease_associated', 'Phenotype-linked genes', ['GENE_A', 'GENE_C', 'GENE_F', 'GENE_H']),
    ('enzymes_only', 'Metabolic enzymes', enzymes),
)
for slice_name, slice_description, members in functional_slices:
    G.slices.add(slice_name, description=slice_description)
    # Members are written straight into the slice's private vertex collection.
    for member in members:
        G._slices[slice_name]['vertices'].add(member)

# Slice-level metadata.
G.set_slice_attrs('hub_genes', centrality_threshold=0.8, n_hubs=2)
G.set_slice_attrs('disease_associated', disease='inflammatory', source='DisGeNET')

print('=== Slices View ===')
print(G.slices_view())

print('\n=== Slice Contents ===')
for slice_id in G.slices.list():
    details = G.get_slice_info(slice_id)
    n_vertices, n_edges = len(details['vertices']), len(details['edges'])
    print(f'  {slice_id}: {n_vertices} vertices, {n_edges} edges')
# 3. Slices: Named Subgraph Partitions

# One slice per layer, named 'layer_<layer>'.
for layer_name in ('PPI', 'metabolic', 'regulatory', 'phenotype'):
    G.layers.create_slice_from_layer(
        slice_id=f'layer_{layer_name}',
        layer_tuple=(layer_name,),
        source='layer_extraction',
        description=f'All entities in {layer_name} layer',
    )

# Functional slices: (slice id, description, member vertices).
functional_slices = (
    ('hub_genes', 'High-degree genes', ['GENE_A', 'GENE_F']),  # known hubs
    ('disease_associated', 'Phenotype-linked genes', ['GENE_A', 'GENE_C', 'GENE_F', 'GENE_H']),
    ('enzymes_only', 'Metabolic enzymes', enzymes),
)
for slice_name, slice_description, members in functional_slices:
    G.slices.add(slice_name, description=slice_description)
    # Members are written straight into the slice's private vertex collection.
    for member in members:
        G._slices[slice_name]['vertices'].add(member)

# Slice-level metadata.
G.set_slice_attrs('hub_genes', centrality_threshold=0.8, n_hubs=2)
G.set_slice_attrs('disease_associated', disease='inflammatory', source='DisGeNET')

print('=== Slices View ===')
print(G.slices_view())

print('\n=== Slice Contents ===')
for slice_id in G.slices.list():
    details = G.get_slice_info(slice_id)
    n_vertices, n_edges = len(details['vertices']), len(details['edges'])
    print(f'  {slice_id}: {n_vertices} vertices, {n_edges} edges')

In [ ]:

Copied!





# 4. Slice Set Operations
#
# Combines the 'hub_genes' and 'disease_associated' slices through the slice
# manager, stores the intersection as a new slice, then repeats union and
# intersection at the layer level for PPI and regulatory.

# Union of slices
hub_disease_union = G.slices.union(['hub_genes', 'disease_associated'])
print(f'Hub ∪ Disease: {hub_disease_union["vertices"]}')

# Intersection
hub_disease_intersection = G.slices.intersect(['hub_genes', 'disease_associated'])
print(f'Hub ∩ Disease: {hub_disease_intersection["vertices"]}')

# Difference (printed as "Disease \ Hub": first argument minus second)
disease_not_hub = G.slices.difference('disease_associated', 'hub_genes')
print(f'Disease \\ Hub: {disease_not_hub["vertices"]}')

# Create new slice from operation: the intersection result computed above is
# registered under the id 'hub_disease_overlap'.
G.create_slice_from_operation(
    'hub_disease_overlap',
    hub_disease_intersection,
    operation='intersection',
    description='Genes that are both hubs and disease-associated',
)

# Layer algebra: the results are indexed by "vertices", like the slice results above.
layer_union = G.layers.layer_union([('PPI',), ('regulatory',)])
print(f'\nPPI ∪ regulatory: {len(layer_union["vertices"])} vertices')

layer_intersection = G.layers.layer_intersection([('PPI',), ('regulatory',)])
print(f'PPI ∩ regulatory: {len(layer_intersection["vertices"])} vertices')
# 4. Slice Set Operations
#
# Combines the 'hub_genes' and 'disease_associated' slices through the slice
# manager, stores the intersection as a new slice, then repeats union and
# intersection at the layer level for PPI and regulatory.

# Union of slices
hub_disease_union = G.slices.union(['hub_genes', 'disease_associated'])
print(f'Hub ∪ Disease: {hub_disease_union["vertices"]}')

# Intersection
hub_disease_intersection = G.slices.intersect(['hub_genes', 'disease_associated'])
print(f'Hub ∩ Disease: {hub_disease_intersection["vertices"]}')

# Difference (printed as "Disease \ Hub": first argument minus second)
disease_not_hub = G.slices.difference('disease_associated', 'hub_genes')
print(f'Disease \\ Hub: {disease_not_hub["vertices"]}')

# Create new slice from operation: the intersection result computed above is
# registered under the id 'hub_disease_overlap'.
G.create_slice_from_operation(
    'hub_disease_overlap',
    hub_disease_intersection,
    operation='intersection',
    description='Genes that are both hubs and disease-associated',
)

# Layer algebra: the results are indexed by "vertices", like the slice results above.
layer_union = G.layers.layer_union([('PPI',), ('regulatory',)])
print(f'\nPPI ∪ regulatory: {len(layer_union["vertices"])} vertices')

layer_intersection = G.layers.layer_intersection([('PPI',), ('regulatory',)])
print(f'PPI ∩ regulatory: {len(layer_intersection["vertices"])} vertices')

In [ ]:

Copied!





# 5. Per-Slice Edge Weights

# The same edge can carry a different weight in each context slice.
# Rows: (slice id, condition label, weight override, note).
context_specs = (
    ('healthy_context', 'healthy', 0.5, 'baseline'),
    ('disease_context', 'inflammatory', 2.0, 'upregulated'),
)

# Create both context slices before touching any edge.
for context_slice, context_condition, _, _ in context_specs:
    G.slices.add(context_slice, condition=context_condition)

# Use the first key of the edge-definition mapping as the test edge.
test_edge = list(G.edge_definitions.keys())[0]
print(f'Testing per-slice weights on edge: {test_edge}')

# Apply the per-context overrides.
for context_slice, _, context_weight, context_note in context_specs:
    G.set_edge_slice_attrs(
        context_slice, test_edge, weight=context_weight, context_note=context_note
    )

# Effective weight per context, and without any slice.
w_healthy = G.get_effective_edge_weight(test_edge, slice='healthy_context')
w_disease = G.get_effective_edge_weight(test_edge, slice='disease_context')
w_global = G.get_effective_edge_weight(test_edge)

print(f'Weight in healthy context: {w_healthy}')
print(f'Weight in disease context: {w_disease}')
print(f'Global weight: {w_global}')
# 5. Per-Slice Edge Weights

# The same edge can carry a different weight in each context slice.
# Rows: (slice id, condition label, weight override, note).
context_specs = (
    ('healthy_context', 'healthy', 0.5, 'baseline'),
    ('disease_context', 'inflammatory', 2.0, 'upregulated'),
)

# Create both context slices before touching any edge.
for context_slice, context_condition, _, _ in context_specs:
    G.slices.add(context_slice, condition=context_condition)

# Use the first key of the edge-definition mapping as the test edge.
test_edge = list(G.edge_definitions.keys())[0]
print(f'Testing per-slice weights on edge: {test_edge}')

# Apply the per-context overrides.
for context_slice, _, context_weight, context_note in context_specs:
    G.set_edge_slice_attrs(
        context_slice, test_edge, weight=context_weight, context_note=context_note
    )

# Effective weight per context, and without any slice.
w_healthy = G.get_effective_edge_weight(test_edge, slice='healthy_context')
w_disease = G.get_effective_edge_weight(test_edge, slice='disease_context')
w_global = G.get_effective_edge_weight(test_edge)

print(f'Weight in healthy context: {w_healthy}')
print(f'Weight in disease context: {w_disease}')
print(f'Global weight: {w_global}')

In [ ]:

Copied!





# 6. AnnData-like API
#
# Prints the four AnnData-style accessors on the graph: X() (called as a
# method) and the obs / var / uns attributes.

print('=== AnnData-like API ===')

# X() - incidence matrix
X = G.X()
print(f'G.X() shape: {X.shape}, nnz: {X.nnz}')
print('  (entities x edges incidence matrix)')

# obs - vertex attributes (observations)
obs = G.obs
print('\nG.obs (vertex attributes):')
print(obs.head())

# var - edge attributes (variables)
var = G.var
print('\nG.var (edge attributes):')
print(var.head())

# uns - unstructured metadata
uns = G.uns
print('\nG.uns (graph attributes):')
print(uns)
# 6. AnnData-like API
#
# Prints the four AnnData-style accessors on the graph: X() (called as a
# method) and the obs / var / uns attributes.

print('=== AnnData-like API ===')

# X() - incidence matrix
X = G.X()
print(f'G.X() shape: {X.shape}, nnz: {X.nnz}')
print('  (entities x edges incidence matrix)')

# obs - vertex attributes (observations)
obs = G.obs
print('\nG.obs (vertex attributes):')
print(obs.head())

# var - edge attributes (variables)
var = G.var
print('\nG.var (edge attributes):')
print(var.head())

# uns - unstructured metadata
uns = G.uns
print('\nG.uns (graph attributes):')
print(uns)

In [ ]:

Copied!





# 7. Managers' APIs

print('=== Manager APIs ===')

# Slice, layer, index and cache managers, reported in that order.
for manager_name in ('slices', 'layers', 'idx', 'cache'):
    manager = getattr(G, manager_name)
    print(f'G.{manager_name}: {type(manager)}')

# The lookups below read the graph's entity_to_idx / idx_to_edge mappings directly.
print('\nIndex lookups via G.idx:')
gene_a_row = G.entity_to_idx.get("GENE_A")
first_edge_id = G.idx_to_edge.get(0)
print(f'  GENE_A row index: {gene_a_row}')
print(f'  Edge 0 ID: {first_edge_id}')
# 7. Managers' APIs

print('=== Manager APIs ===')

# Slice, layer, index and cache managers, reported in that order.
for manager_name in ('slices', 'layers', 'idx', 'cache'):
    manager = getattr(G, manager_name)
    print(f'G.{manager_name}: {type(manager)}')

# The lookups below read the graph's entity_to_idx / idx_to_edge mappings directly.
print('\nIndex lookups via G.idx:')
gene_a_row = G.entity_to_idx.get("GENE_A")
first_edge_id = G.idx_to_edge.get(0)
print(f'  GENE_A row index: {gene_a_row}')
print(f'  Edge 0 ID: {first_edge_id}')

In [ ]:

Copied!





# 8. Build Supra-Adjacency and Supra-Laplacian
#
# Builds the vertex-layer index, then the supra-adjacency matrix, both
# Laplacian variants and the random-walk transition matrix, printing each shape.

# Build vertex-layer index
n_supra = G.ensure_vertex_layer_index()
print(f'Supra-graph size: {n_supra} nodes')

# Supra-adjacency matrix
A_supra = G.supra_adjacency()
print(f'Supra-adjacency: {A_supra.shape}, nnz={A_supra.nnz}')

# Supra-Laplacian (combinatorial)
L_supra = G.supra_laplacian(kind='comb')
print(f'Supra-Laplacian (combinatorial): {L_supra.shape}')

# Normalized Laplacian
L_norm = G.supra_laplacian(kind='norm')
print(f'Supra-Laplacian (normalized): {L_norm.shape}')

# Verify Laplacian property (row sums = 0)
# A sparse row sum is an np.matrix for sparse matrices but a plain ndarray for
# sparse arrays, and only np.matrix has `.A`; np.asarray handles both.
row_sums = np.abs(np.asarray(L_supra.sum(axis=1)).ravel())
print(f'Max row sum (should be ~0): {row_sums.max():.2e}')

# Transition matrix (random walk)
P = G.transition_matrix()
print(f'Transition matrix: {P.shape}')

# 9. Spectral Analysis
#
# Computes a few eigenpairs of the combinatorial supra-Laplacian with SciPy and
# prints them next to the results of AnnNet's own spectral helpers.

# Compute smallest eigenvalues
k = min(10, n_supra - 1)  # at most 10, and always fewer than n_supra
# NOTE(review): which='SM' can converge slowly in eigsh; SciPy's docs suggest
# shift-invert (sigma=...) for small eigenvalues — confirm before scaling up.
eigenvalues, eigenvectors = eigsh(L_supra.astype(float), k=k, which='SM')

# Sort
idx = np.argsort(eigenvalues)  # ascending order of eigenvalue
eigenvalues = eigenvalues[idx]
eigenvectors = eigenvectors[:, idx]  # keep columns aligned with their eigenvalues

print('Smallest eigenvalues of supra-Laplacian:')
for i, ev in enumerate(eigenvalues):
    print(f'  λ_{i} = {ev:.6f}')

# Algebraic connectivity
# Returns a pair; the second element (fiedler) is not used in this cell.
lambda2, fiedler = G.algebraic_connectivity()
print(f'\nAlgebraic connectivity (λ₂): {lambda2:.6f}')

print('===========================================\n')

# Via AnnNet built in method
vals, vecs = G.k_smallest_laplacian_eigs(k=6)
print(f'6 smallest eigenvalues: {vals}')
# 8. Build Supra-Adjacency and Supra-Laplacian
#
# Builds the vertex-layer index, then the supra-adjacency matrix, both
# Laplacian variants and the random-walk transition matrix, printing each shape.

# Build vertex-layer index
n_supra = G.ensure_vertex_layer_index()
print(f'Supra-graph size: {n_supra} nodes')

# Supra-adjacency matrix
A_supra = G.supra_adjacency()
print(f'Supra-adjacency: {A_supra.shape}, nnz={A_supra.nnz}')

# Supra-Laplacian (combinatorial)
L_supra = G.supra_laplacian(kind='comb')
print(f'Supra-Laplacian (combinatorial): {L_supra.shape}')

# Normalized Laplacian
L_norm = G.supra_laplacian(kind='norm')
print(f'Supra-Laplacian (normalized): {L_norm.shape}')

# Verify Laplacian property (row sums = 0)
# A sparse row sum is an np.matrix for sparse matrices but a plain ndarray for
# sparse arrays, and only np.matrix has `.A`; np.asarray handles both.
row_sums = np.abs(np.asarray(L_supra.sum(axis=1)).ravel())
print(f'Max row sum (should be ~0): {row_sums.max():.2e}')

# Transition matrix (random walk)
P = G.transition_matrix()
print(f'Transition matrix: {P.shape}')

# 9. Spectral Analysis
#
# Computes a few eigenpairs of the combinatorial supra-Laplacian with SciPy and
# prints them next to the results of AnnNet's own spectral helpers.

# Compute smallest eigenvalues
k = min(10, n_supra - 1)  # at most 10, and always fewer than n_supra
# NOTE(review): which='SM' can converge slowly in eigsh; SciPy's docs suggest
# shift-invert (sigma=...) for small eigenvalues — confirm before scaling up.
eigenvalues, eigenvectors = eigsh(L_supra.astype(float), k=k, which='SM')

# Sort
idx = np.argsort(eigenvalues)  # ascending order of eigenvalue
eigenvalues = eigenvalues[idx]
eigenvectors = eigenvectors[:, idx]  # keep columns aligned with their eigenvalues

print('Smallest eigenvalues of supra-Laplacian:')
for i, ev in enumerate(eigenvalues):
    print(f'  λ_{i} = {ev:.6f}')

# Algebraic connectivity
# Returns a pair; the second element (fiedler) is not used in this cell.
lambda2, fiedler = G.algebraic_connectivity()
print(f'\nAlgebraic connectivity (λ₂): {lambda2:.6f}')

print('===========================================\n')

# Via AnnNet built in method
vals, vecs = G.k_smallest_laplacian_eigs(k=6)
print(f'6 smallest eigenvalues: {vals}')

In [ ]:

Copied!





# NetworkX backend accessor (G.nx)
#
# Runs several NetworkX algorithms through the G.nx accessor and prints the
# top-ranked nodes, one shortest path and the Louvain communities.

print('=== NetworkX backend accessor ===')
print('Using G.nx.algorithm(G, ...) pattern')

# Degree centrality via backend accessor
degree_cent = G.nx.degree_centrality(G)
top_degree = sorted(degree_cent.items(), key=lambda x: -x[1])[:5]
print('\nTop 5 by degree centrality:')
for node, cent in top_degree:
    print(f'  {node}: {cent:.4f}')

# Betweenness centrality
betweenness = G.nx.betweenness_centrality(G)
top_between = sorted(betweenness.items(), key=lambda x: -x[1])[:5]
print('\nTop 5 by betweenness centrality:')
for node, cent in top_between:
    print(f'  {node}: {cent:.4f}')

# PageRank
pagerank = G.nx.pagerank(G, alpha=0.85)
top_pr = sorted(pagerank.items(), key=lambda x: -x[1])[:5]
print('\nTop 5 by PageRank:')
for node, pr in top_pr:
    print(f'  {node}: {pr:.4f}')


# Shortest path
# The endpoints are named once so the printed label always matches the query
# (the label used to say "inflammation" while the path ended at GENE_F).
path_source, path_target = 'GENE_A', 'GENE_F'
path = G.nx.shortest_path(G, path_source, path_target)
# Each path element is translated through the index manager's row_to_entity.
sp = [G.idx.row_to_entity(i) for i in path]
print(f'\nShortest path {path_source} → {path_target}: {sp}')

# Community detection (Louvain)

communities = G.nx.louvain_communities(G, seed=79)
print(f'\nLouvain communities: {len(communities)}')
# Show at most four communities and at most ten members of each.
for i, comm in enumerate(communities[:4]):
    print(f'  Community {i}: {list(comm)[:10]}...')
# NetworkX backend accessor (G.nx)
#
# Runs several NetworkX algorithms through the G.nx accessor and prints the
# top-ranked nodes, one shortest path and the Louvain communities.

print('=== NetworkX backend accessor ===')
print('Using G.nx.algorithm(G, ...) pattern')

# Degree centrality via backend accessor
degree_cent = G.nx.degree_centrality(G)
top_degree = sorted(degree_cent.items(), key=lambda x: -x[1])[:5]
print('\nTop 5 by degree centrality:')
for node, cent in top_degree:
    print(f'  {node}: {cent:.4f}')

# Betweenness centrality
betweenness = G.nx.betweenness_centrality(G)
top_between = sorted(betweenness.items(), key=lambda x: -x[1])[:5]
print('\nTop 5 by betweenness centrality:')
for node, cent in top_between:
    print(f'  {node}: {cent:.4f}')

# PageRank
pagerank = G.nx.pagerank(G, alpha=0.85)
top_pr = sorted(pagerank.items(), key=lambda x: -x[1])[:5]
print('\nTop 5 by PageRank:')
for node, pr in top_pr:
    print(f'  {node}: {pr:.4f}')


# Shortest path
# The endpoints are named once so the printed label always matches the query
# (the label used to say "inflammation" while the path ended at GENE_F).
path_source, path_target = 'GENE_A', 'GENE_F'
path = G.nx.shortest_path(G, path_source, path_target)
# Each path element is translated through the index manager's row_to_entity.
sp = [G.idx.row_to_entity(i) for i in path]
print(f'\nShortest path {path_source} → {path_target}: {sp}')

# Community detection (Louvain)

communities = G.nx.louvain_communities(G, seed=79)
print(f'\nLouvain communities: {len(communities)}')
# Show at most four communities and at most ten members of each.
for i, comm in enumerate(communities[:4]):
    print(f'  Community {i}: {list(comm)[:10]}...')

In [ ]:

Copied!





# igraph backend accessor (G.ig)

print('=== igraph backend accessor ===')

# Transitivity via backend accessor
transitivity = G.ig.transitivity_undirected()
print(f'Global transitivity: {transitivity:.4f}')

# Diameter
# NOTE(review): this call passes G explicitly while transitivity_undirected()
# above is called without it — confirm which convention the G.ig accessor expects.
diameter = G.ig.diameter(G)
print(f'Diameter: {diameter}')
# igraph backend accessor (G.ig)

print('=== igraph backend accessor ===')

# Transitivity via backend accessor
transitivity = G.ig.transitivity_undirected()
print(f'Global transitivity: {transitivity:.4f}')

# Diameter
# NOTE(review): this call passes G explicitly while transitivity_undirected()
# above is called without it — confirm which convention the G.ig accessor expects.
diameter = G.ig.diameter(G)
print(f'Diameter: {diameter}')

In [ ]:

Copied!





# Fiedler Vector Analysis (Community Structure)

# Column 1 of the eigenvector matrix computed in the spectral-analysis cell.
fiedler_vec = eigenvectors[:, 1]

# Key each component by (vertex, first element of its layer tuple).
fiedler_mapping = {
    (v, layer[0]): fiedler_vec[i] for i, (v, layer) in enumerate(G._row_to_nl)
}

# Tabulate the components, ordered from most negative to most positive.
fiedler_data = [
    {'vertex': vertex, 'layer': layer_name, 'fiedler_value': component}
    for (vertex, layer_name), component in fiedler_mapping.items()
]
fiedler_df = pl.DataFrame(fiedler_data).sort('fiedler_value')

print('Fiedler vector extremes:')
print('\nMost negative (Cluster A):')
print(fiedler_df.head(10))
print('\nMost positive (Cluster B):')
print(fiedler_df.tail(10))

# Sign-based two-way split: negative components go to A, non-negative to B.
cluster_A, cluster_B = [], []
for pair, component in fiedler_mapping.items():
    if component < 0:
        cluster_A.append(pair)
    elif component >= 0:
        cluster_B.append(pair)

print(f'\nCluster A: {len(cluster_A)} vertex-layer pairs')
print(f'Cluster B: {len(cluster_B)} vertex-layer pairs')
# Fiedler Vector Analysis (Community Structure)

# Column 1 of the eigenvector matrix computed in the spectral-analysis cell.
fiedler_vec = eigenvectors[:, 1]

# Key each component by (vertex, first element of its layer tuple).
fiedler_mapping = {
    (v, layer[0]): fiedler_vec[i] for i, (v, layer) in enumerate(G._row_to_nl)
}

# Tabulate the components, ordered from most negative to most positive.
fiedler_data = [
    {'vertex': vertex, 'layer': layer_name, 'fiedler_value': component}
    for (vertex, layer_name), component in fiedler_mapping.items()
]
fiedler_df = pl.DataFrame(fiedler_data).sort('fiedler_value')

print('Fiedler vector extremes:')
print('\nMost negative (Cluster A):')
print(fiedler_df.head(10))
print('\nMost positive (Cluster B):')
print(fiedler_df.tail(10))

# Sign-based two-way split: negative components go to A, non-negative to B.
cluster_A, cluster_B = [], []
for pair, component in fiedler_mapping.items():
    if component < 0:
        cluster_A.append(pair)
    elif component >= 0:
        cluster_B.append(pair)

print(f'\nCluster A: {len(cluster_A)} vertex-layer pairs')
print(f'Cluster B: {len(cluster_B)} vertex-layer pairs')

In [ ]:

Copied!





# Diffusion Simulation
#
# Seeds a unit perturbation on one (vertex, layer) row and propagates it with
# repeated explicit steps x <- x - tau * (L_supra @ x), recording every state.

# Initial perturbation: activate GENE_A in regulatory layer
x0 = np.zeros(n_supra)

# Find the first row whose (vertex, layer) pair is ('GENE_A', ('regulatory',)).
# If no row matches, x0 stays all zeros and nothing is printed.
for i, (v, layer) in enumerate(G._row_to_nl):
    if v == 'GENE_A' and layer == ('regulatory',):
        x0[i] = 1.0
        print(f'Initial perturbation at index {i}: ({v}, {layer[0]})')
        break

# Diffusion parameters
tau = 0.1  # step size multiplying the Laplacian term
n_steps = 50  # number of update steps

# Store trajectory
trajectory = [x0.copy()]  # index 0 holds the initial state
x = x0.copy()

for _step in range(n_steps):
    x = x - tau * (L_supra @ x)
    trajectory.append(x.copy())

# Stack the n_steps + 1 recorded states into one array
trajectory = np.array(trajectory)
print(f'Trajectory shape: {trajectory.shape}')

# Alternative: use library method
# NOTE(review): presumably equivalent to one iteration of the loop above — confirm.
x_one_step = G.diffusion_step(x0, tau=0.1, kind='comb')
print(f'One diffusion step via G.diffusion_step(): ||x||={np.linalg.norm(x_one_step):.4f}')

# Random walk step
p_rw = G.random_walk_step(x0)
print(f'Random walk step: sum={p_rw.sum():.4f}')
# Diffusion Simulation
#
# Seeds a unit perturbation on one (vertex, layer) row and propagates it with
# repeated explicit steps x <- x - tau * (L_supra @ x), recording every state.

# Initial perturbation: activate GENE_A in regulatory layer
x0 = np.zeros(n_supra)

# Find the first row whose (vertex, layer) pair is ('GENE_A', ('regulatory',)).
# If no row matches, x0 stays all zeros and nothing is printed.
for i, (v, layer) in enumerate(G._row_to_nl):
    if v == 'GENE_A' and layer == ('regulatory',):
        x0[i] = 1.0
        print(f'Initial perturbation at index {i}: ({v}, {layer[0]})')
        break

# Diffusion parameters
tau = 0.1  # step size multiplying the Laplacian term
n_steps = 50  # number of update steps

# Store trajectory
trajectory = [x0.copy()]  # index 0 holds the initial state
x = x0.copy()

for _step in range(n_steps):
    x = x - tau * (L_supra @ x)
    trajectory.append(x.copy())

# Stack the n_steps + 1 recorded states into one array
trajectory = np.array(trajectory)
print(f'Trajectory shape: {trajectory.shape}')

# Alternative: use library method
# NOTE(review): presumably equivalent to one iteration of the loop above — confirm.
x_one_step = G.diffusion_step(x0, tau=0.1, kind='comb')
print(f'One diffusion step via G.diffusion_step(): ||x||={np.linalg.norm(x_one_step):.4f}')

# Random walk step
p_rw = G.random_walk_step(x0)
print(f'Random walk step: sum={p_rw.sum():.4f}')

In [ ]:

Copied!





# Analyze Diffusion Results

# Last recorded state of the diffusion trajectory.
x_final = trajectory[-1]

# Key each final value by (vertex, first element of its layer tuple).
final_activation = {
    (v, layer[0]): x_final[i] for i, (v, layer) in enumerate(G._row_to_nl)
}

# One row per (vertex, layer) pair, strongest activation first.
activation_rows = [
    {'vertex': vertex, 'layer': layer_name, 'activation': level}
    for (vertex, layer_name), level in final_activation.items()
]
activation_df = pl.DataFrame(activation_rows).sort('activation', descending=True)

print('Top activated nodes after diffusion:')
print(activation_df.head(15))

# Per-layer mean, maximum and total activation.
activation_col = pl.col('activation')
layer_activation = activation_df.group_by('layer').agg(
    activation_col.mean().alias('mean'),
    activation_col.max().alias('max'),
    activation_col.sum().alias('total'),
)
print('\nActivation by layer:')
print(layer_activation)
# Analyze Diffusion Results

# Last recorded state of the diffusion trajectory.
x_final = trajectory[-1]

# Key each final value by (vertex, first element of its layer tuple).
final_activation = {
    (v, layer[0]): x_final[i] for i, (v, layer) in enumerate(G._row_to_nl)
}

# One row per (vertex, layer) pair, strongest activation first.
activation_rows = [
    {'vertex': vertex, 'layer': layer_name, 'activation': level}
    for (vertex, layer_name), level in final_activation.items()
]
activation_df = pl.DataFrame(activation_rows).sort('activation', descending=True)

print('Top activated nodes after diffusion:')
print(activation_df.head(15))

# Per-layer mean, maximum and total activation.
activation_col = pl.col('activation')
layer_activation = activation_df.group_by('layer').agg(
    activation_col.mean().alias('mean'),
    activation_col.max().alias('max'),
    activation_col.sum().alias('total'),
)
print('\nActivation by layer:')
print(layer_activation)

In [ ]:

Copied!





# History & Versioning
#
# Loads the recorded mutation events into a Polars DataFrame, lists the
# checkpoints created with G.history.mark(), and counts events per operation.

print('=== Mutation History ===')
print(f'Total events: {len(G._history)}')
print(f'Current version: {G._version}')

# View history as DataFrame
# A large infer_schema_length lets Polars inspect many events before fixing
# column types.
history_df = pl.DataFrame(G._history, infer_schema_length=10000)
print(f'\nHistory columns: {history_df.columns}')

# Show checkpoints
marks = history_df.filter(pl.col('op') == 'mark')
print('\nCheckpoints:')
print(marks.select(['version', 'ts_utc', 'label']))

# Operation counts
# pl.len() is the current row-count expression; pl.count() is deprecated.
op_counts = history_df.group_by('op').agg(pl.len().alias('count')).sort('count', descending=True)
print('\nOperations by type:')
print(op_counts.head(10))
# History & Versioning
#
# Loads the recorded mutation events into a Polars DataFrame, lists the
# checkpoints created with G.history.mark(), and counts events per operation.

print('=== Mutation History ===')
print(f'Total events: {len(G._history)}')
print(f'Current version: {G._version}')

# View history as DataFrame
# A large infer_schema_length lets Polars inspect many events before fixing
# column types.
history_df = pl.DataFrame(G._history, infer_schema_length=10000)
print(f'\nHistory columns: {history_df.columns}')

# Show checkpoints
marks = history_df.filter(pl.col('op') == 'mark')
print('\nCheckpoints:')
print(marks.select(['version', 'ts_utc', 'label']))

# Operation counts
# pl.len() is the current row-count expression; pl.count() is deprecated.
op_counts = history_df.group_by('op').agg(pl.len().alias('count')).sort('count', descending=True)
print('\nOperations by type:')
print(op_counts.head(10))

In [ ]:

Copied!





# Summary Statistics

banner = '=' * 70
print(banner)
print('MULTILAYER NETWORK ANALYSIS - COMPLETE SUMMARY')
print(banner)

# Tally vertices by their 'entity_type' attribute ('unknown' when absent).
entity_counts = defaultdict(int)
for vertex_id in G.vertices():
    vertex_attrs = G.attrs.get_vertex_attrs(vertex_id)
    entity_counts[vertex_attrs.get('entity_type', 'unknown')] += 1

print('\n Entity Counts:')
for etype, count in sorted(entity_counts.items()):
    print(f'  {etype}: {count}')

# Edge statistics
n_edge_entities = sum(1 for _, kind in G.entity_types.items() if kind == "edge")
n_coupling_edges = sum(1 for _, kind in G.edge_kind.items() if kind == "coupling")
print('\n Edge Statistics:')
print(f'  Total edges: {G.ne}')
print(f'  Binary edges: {len(G.edge_definitions)}')
print(f'  Hyperedges: {len(G.hyperedge_definitions)}')
print(f'  Edge entities: {n_edge_entities}')
print(f'  Coupling edges: {n_coupling_edges}')

# Directionality: query both groups first, then report them.
edges_by_direction = [
    (label, G.get_edges_by_direction(flag))
    for label, flag in (('Directed', True), ('Undirected', False))
]
for label, matching_edges in edges_by_direction:
    print(f'  {label}: {len(matching_edges)}')

# Per-layer vertex and edge counts for the 'omic' aspect.
print('\n Layer Statistics:')
for layer in G.layers.elem_layers['omic']:
    layer_key = (layer,)
    n_verts = len(G.layers.layer_vertex_set(layer_key))
    n_edges = len(G.layers.layer_edge_set(layer_key))
    print(f'  {layer}: {n_verts} vertices, {n_edges} edges')

# Supra statistics (values computed in earlier cells).
print('\n Supra-AnnNet:')
print(f'  Nodes (vertex-layer pairs): {n_supra}')
print(f'  Algebraic connectivity: {lambda2:.6f}')

# Slice statistics
n_slices = len(G.slices.list())
print(f'\n Slices: {n_slices}')

# Memory: the reported value is divided by 1024 and shown as KB.
mem = G.memory_usage()
print(f'\n Memory: {mem / 1024:.2f} KB')

# History
print(f'\n History: {len(G._history)} events, version {G._version}')
# Summary Statistics

banner = '=' * 70
print(banner)
print('MULTILAYER NETWORK ANALYSIS - COMPLETE SUMMARY')
print(banner)

# Tally vertices by their 'entity_type' attribute ('unknown' when absent).
entity_counts = defaultdict(int)
for vertex_id in G.vertices():
    vertex_attrs = G.attrs.get_vertex_attrs(vertex_id)
    entity_counts[vertex_attrs.get('entity_type', 'unknown')] += 1

print('\n Entity Counts:')
for etype, count in sorted(entity_counts.items()):
    print(f'  {etype}: {count}')

# Edge statistics
n_edge_entities = sum(1 for _, kind in G.entity_types.items() if kind == "edge")
n_coupling_edges = sum(1 for _, kind in G.edge_kind.items() if kind == "coupling")
print('\n Edge Statistics:')
print(f'  Total edges: {G.ne}')
print(f'  Binary edges: {len(G.edge_definitions)}')
print(f'  Hyperedges: {len(G.hyperedge_definitions)}')
print(f'  Edge entities: {n_edge_entities}')
print(f'  Coupling edges: {n_coupling_edges}')

# Directionality: query both groups first, then report them.
edges_by_direction = [
    (label, G.get_edges_by_direction(flag))
    for label, flag in (('Directed', True), ('Undirected', False))
]
for label, matching_edges in edges_by_direction:
    print(f'  {label}: {len(matching_edges)}')

# Per-layer vertex and edge counts for the 'omic' aspect.
print('\n Layer Statistics:')
for layer in G.layers.elem_layers['omic']:
    layer_key = (layer,)
    n_verts = len(G.layers.layer_vertex_set(layer_key))
    n_edges = len(G.layers.layer_edge_set(layer_key))
    print(f'  {layer}: {n_verts} vertices, {n_edges} edges')

# Supra statistics (values computed in earlier cells).
print('\n Supra-AnnNet:')
print(f'  Nodes (vertex-layer pairs): {n_supra}')
print(f'  Algebraic connectivity: {lambda2:.6f}')

# Slice statistics
n_slices = len(G.slices.list())
print(f'\n Slices: {n_slices}')

# Memory: the reported value is divided by 1024 and shown as KB.
mem = G.memory_usage()
print(f'\n Memory: {mem / 1024:.2f} KB')

# History
print(f'\n History: {len(G._history)} events, version {G._version}')

In [ ]:

Copied!





# Visualization: supra-Laplacian spectrum and Fiedler-vector partition

# A 1x2 grid yields a one-dimensional axes array, so panels are axes[0] and axes[1].
fig, axes = plt.subplots(1, 2, figsize=(14, 5))

# Plot 1: Eigenvalue spectrum, with the second eigenvalue marked in red.
ax = axes[0]
ax.bar(range(len(eigenvalues)), eigenvalues, color='steelblue')
ax.axhline(y=eigenvalues[1], color='red', linestyle='--', label=f'λ₂={eigenvalues[1]:.3f}')
ax.set_xlabel('Eigenvalue index')
ax.set_ylabel('Eigenvalue')
ax.set_title('Supra-Laplacian Spectrum')
ax.legend()

# Plot 2: Fiedler vector, sorted once and coloured by sign
# (red for negative components, blue otherwise).
ax = axes[1]
sorted_fiedler = np.sort(fiedler_vec)
colors = ['red' if f < 0 else 'blue' for f in sorted_fiedler]
ax.scatter(range(len(sorted_fiedler)), sorted_fiedler, c=colors, alpha=0.6, s=30)
ax.axhline(y=0, color='black', linestyle='-', linewidth=0.5)
ax.set_xlabel('Node index (sorted)')
ax.set_ylabel('Fiedler value')
ax.set_title('Fiedler Vector (Spectral Partition)')

plt.tight_layout()
plt.show()
# Visualization: supra-Laplacian spectrum and Fiedler-vector partition

# A 1x2 grid yields a one-dimensional axes array, so panels are axes[0] and axes[1].
fig, axes = plt.subplots(1, 2, figsize=(14, 5))

# Plot 1: Eigenvalue spectrum, with the second eigenvalue marked in red.
ax = axes[0]
ax.bar(range(len(eigenvalues)), eigenvalues, color='steelblue')
ax.axhline(y=eigenvalues[1], color='red', linestyle='--', label=f'λ₂={eigenvalues[1]:.3f}')
ax.set_xlabel('Eigenvalue index')
ax.set_ylabel('Eigenvalue')
ax.set_title('Supra-Laplacian Spectrum')
ax.legend()

# Plot 2: Fiedler vector, sorted once and coloured by sign
# (red for negative components, blue otherwise).
ax = axes[1]
sorted_fiedler = np.sort(fiedler_vec)
colors = ['red' if f < 0 else 'blue' for f in sorted_fiedler]
ax.scatter(range(len(sorted_fiedler)), sorted_fiedler, c=colors, alpha=0.6, s=30)
ax.axhline(y=0, color='black', linestyle='-', linewidth=0.5)
ax.set_xlabel('Node index (sorted)')
ax.set_ylabel('Fiedler value')
ax.set_title('Fiedler Vector (Spectral Partition)')

plt.tight_layout()
plt.show()

In [ ]:

Copied!

from annnet.io import cx2
# Cytoscape layer visualization
#
# Extracts the PPI layer as a slice, converts the resulting subgraph with
# cx2.to_cx2, and writes the result as JSON to 'sbuc.cx2'.

import json

# Slice restricted to the ('PPI',) layer; inter-layer and coupling edges are switched off.
G.layers.create_slice_from_layer('ppi_only', ('PPI',), include_inter=False, include_coupling=False)
ppi_subgraph = G.subgraph_from_slice('ppi_only')

sbuc = cx2.to_cx2(ppi_subgraph)

output_file = 'sbuc.cx2'

# The path is relative to the current working directory.
with open(output_file, 'w') as f:
    json.dump(sbuc, f)

print(f'Saved to {output_file}')
from annnet.io import cx2
# Cytoscape layer visualization
#
# Extracts the PPI layer as a slice, converts the resulting subgraph with
# cx2.to_cx2, and writes the result as JSON to 'sbuc.cx2'.

import json

# Slice restricted to the ('PPI',) layer; inter-layer and coupling edges are switched off.
G.layers.create_slice_from_layer('ppi_only', ('PPI',), include_inter=False, include_coupling=False)
ppi_subgraph = G.subgraph_from_slice('ppi_only')

sbuc = cx2.to_cx2(ppi_subgraph)

output_file = 'sbuc.cx2'

# The path is relative to the current working directory.
with open(output_file, 'w') as f:
    json.dump(sbuc, f)

print(f'Saved to {output_file}')

In [ ]:

Copied!

# SBML import and Cytoscape
#
# Reads an SBML model into an AnnNet graph and exports it as CX2 JSON. The
# cell imports everything it uses (including json), so it does not depend on
# an earlier cell having been run.
import json

from annnet.io import cx2
from annnet.io import sbml as sb

# From SBML (path is relative to the current working directory)
gg = sb.from_sbml('Haridansyah2019.sbml')

# To cx2 (Cytoscape exchange 2)
H2 = cx2.to_cx2(gg, hyperedges='expand')
output_file = 'Haridansyah2019.cx2'

with open(output_file, 'w') as f:
    json.dump(H2, f)

print(f'Saved to {output_file}')
# SBML import and Cytoscape
#
# Reads an SBML model into an AnnNet graph and exports it as CX2 JSON. The
# cell imports everything it uses (including json), so it does not depend on
# an earlier cell having been run.
import json

from annnet.io import cx2
from annnet.io import sbml as sb

# From SBML (path is relative to the current working directory)
gg = sb.from_sbml('Haridansyah2019.sbml')

# To cx2 (Cytoscape exchange 2)
H2 = cx2.to_cx2(gg, hyperedges='expand')
output_file = 'Haridansyah2019.cx2'

with open(output_file, 'w') as f:
    json.dump(H2, f)

print(f'Saved to {output_file}')

In [ ]:

Copied!

# Lossless write/read as .annnet:
# NOTE(review): overwrite=True presumably replaces an existing 'SBUCpl.annnet' — confirm.

G.write('SBUCpl.annnet', overwrite=True)
# Lossless write/read as .annnet:
# NOTE(review): overwrite=True presumably replaces an existing 'SBUCpl.annnet' — confirm.

G.write('SBUCpl.annnet', overwrite=True)

In [ ]:

Copied!

# Load the file written by G.write('SBUCpl.annnet', ...) into a second graph object.
G2 = AnnNet.read('SBUCpl.annnet')
# Load the file written by G.write('SBUCpl.annnet', ...) into a second graph object.
G2 = AnnNet.read('SBUCpl.annnet')

In [ ]:

Copied!

# Round-trip check: the reloaded graph must equal the original on its V and E
# attributes; either assert fails loudly otherwise.
assert G2.V == G.V
assert G2.E == G.E
print('Lossless roundtrip Ok')
# Round-trip check: the reloaded graph must equal the original on its V and E
# attributes; either assert fails loudly otherwise.
assert G2.V == G.V
assert G2.E == G.E
print('Lossless roundtrip Ok')

In [ ]: