Function bodies 69 total

create_table_component function · python · L7-L83 (77 LOC)

src/papersift/ui/components/table.py

def create_table_component(row_data: list) -> html.Div:
    """
    Create AG Grid table with multi-select enabled.

    Args:
        row_data: List of row dictionaries

    Returns:
        Dash Div containing the AG Grid component
    """
    column_defs = [
        {
            'headerName': '',
            'field': 'cluster_color',
            'width': 30,
            'cellStyle': {
                'function': "{'backgroundColor': params.value}"
            },
            'headerCheckboxSelection': True,
            'checkboxSelection': True,
        },
        {
            'headerName': 'Cluster',
            'field': 'cluster',
            'width': 80,
            'filter': 'agNumberColumnFilter',
            'sortable': True,
        },
        {
            'headerName': 'Year',
            'field': 'year',
            'width': 70,
            'filter': 'agNumberColumnFilter',
            'sortable': True,
        },
        {
            'headerName': 'Title',
            '

export_network_html function · python · L14-L51 (38 LOC)

src/papersift/ui/exporter.py

def export_network_html(
    papers_path: str,
    output_path: str,
    resolution: float = 1.0,
    mode: str = "cluster",
) -> None:
    """
    Export paper network as standalone interactive HTML.

    Args:
        papers_path: Path to papers JSON
        output_path: Output HTML file path
        resolution: Leiden clustering resolution
        mode: Visualization mode ("cluster" or "paper")
    """
    # Load and cluster
    papers = load_papers(papers_path)
    clusters, builder = cluster_papers(papers, resolution=resolution)
    colors = generate_cluster_colors(len(set(clusters.values())))

    if mode == "cluster":
        summaries = builder.get_cluster_summary(clusters)
        fig = _create_cluster_view_figure(summaries, builder, papers, colors)
    else:
        # Paper mode (original)
        G = _build_networkx_graph(papers, clusters, builder, colors)
        fig = _create_plotly_figure(G, papers)

    # Export as self-contained HTML
    fig.write_html(
        output_p

_build_networkx_graph function · python · L54-L78 (25 LOC)

src/papersift/ui/exporter.py

def _build_networkx_graph(papers, clusters, builder, colors):
    """
    Mirror the PaperSift igraph graph as a NetworkX graph of clustered papers.

    Args:
        papers: Paper dictionaries; 'doi' is required, 'title' is optional
        clusters: Mapping of DOI to integer cluster id
        builder: Object whose ``graph`` attribute is the igraph graph
        colors: Color sequence, indexed by cluster id modulo its length

    Returns:
        NetworkX graph with one node per DOI in ``clusters`` (carrying
        ``title``, ``cluster`` and ``color`` attributes) and one weighted
        edge per igraph edge whose two endpoints are both in ``clusters``
    """
    nx_graph = nx.Graph()

    # Title lookup; a paper without a title is labelled with its DOI.
    titles = {}
    for paper in papers:
        titles[paper['doi']] = paper.get('title', paper['doi'])

    # One node per clustered paper; colors wrap around when there are
    # more clusters than palette entries.
    for doi, cluster_id in clusters.items():
        node_attrs = {
            'title': titles.get(doi, doi),
            'cluster': cluster_id,
            'color': colors[cluster_id % len(colors)],
        }
        nx_graph.add_node(doi, **node_attrs)

    # Copy edges from builder.graph (igraph).
    # NOTE: EntityLayerBuilder uses 'doi' attribute, not 'name'
    # Reference: entity_layer.py:323, data_loader.py:135-136
    for ig_edge in builder.graph.es:
        src_doi = builder.graph.vs[ig_edge.source]['doi']
        dst_doi = builder.graph.vs[ig_edge.target]['doi']
        # Skip edges touching a paper that has no cluster assignment.
        if src_doi not in clusters or dst_doi not in clusters:
            continue
        # Edges without a 'weight' attribute default to weight 1.
        edge_weight = ig_edge.attributes().get('weight', 1)
        nx_graph.add_edge(src_doi, dst_doi, weight=edge_weight)

    return nx_graph

_compute_cluster_edges function · python · L81-L99 (19 LOC)

src/papersift/ui/exporter.py

def _compute_cluster_edges(summaries, builder):
    """Compute edges between clusters based on shared entities."""
    cluster_entities = {}
    for summary in summaries:
        cid = summary['cluster_id']
        entities = set()
        for doi in summary['dois']:
            entities |= builder._paper_entities.get(doi, set())
        cluster_entities[cid] = entities

    edges = []
    cluster_ids = list(cluster_entities.keys())
    for i, cid_a in enumerate(cluster_ids):
        for cid_b in cluster_ids[i+1:]:
            shared = cluster_entities[cid_a] & cluster_entities[cid_b]
            if len(shared) >= 2:
                edges.append((cid_a, cid_b, len(shared)))

    return edges

_create_cluster_view_figure function · python · L102-L188 (87 LOC)

src/papersift/ui/exporter.py

def _create_cluster_view_figure(summaries, builder, papers, colors):
    """Create Plotly figure with cluster-level nodes."""
    G = nx.Graph()

    # Build DOI-to-title map
    doi_to_title = {p['doi']: p.get('title', p['doi']) for p in papers}

    # Add cluster nodes
    for s in summaries:
        cid = s['cluster_id']
        # Sample papers (first 3)
        sample_titles = []
        for doi in s['dois'][:3]:
            title = doi_to_title.get(doi, doi)
            sample_titles.append(title[:60])

        hover = (
            f"<b>Cluster {cid + 1}</b> ({s['size']} papers)<br>"
            f"<br>Top Entities: {', '.join(s['top_entities'][:5])}<br>"
            f"<br>Sample Papers:<br>"
            + "<br>".join(f"- {t}" for t in sample_titles)
        )

        G.add_node(
            cid,
            size=s['size'],
            color=colors[cid % len(colors)],
            hover=hover,
        )

    # Add inter-cluster edges
    edges = _compute_cluster_edges(summaries, b

_create_plotly_figure function · python · L191-L247 (57 LOC)

src/papersift/ui/exporter.py

def _create_plotly_figure(G: nx.Graph, papers: list) -> go.Figure:
    """Create Plotly figure from NetworkX graph."""
    # Layout
    pos = nx.spring_layout(G, k=0.5, iterations=50, seed=42)

    # Edge traces
    edge_x, edge_y = [], []
    for u, v in G.edges():
        x0, y0 = pos[u]
        x1, y1 = pos[v]
        edge_x.extend([x0, x1, None])
        edge_y.extend([y0, y1, None])

    edge_trace = go.Scatter(
        x=edge_x, y=edge_y,
        mode='lines',
        line=dict(width=0.5, color='#ccc'),
        hoverinfo='none'
    )

    # Node traces (grouped by cluster for coloring)
    node_traces = []
    cluster_nodes = {}
    for node in G.nodes():
        cluster = G.nodes[node]['cluster']
        if cluster not in cluster_nodes:
            cluster_nodes[cluster] = {'x': [], 'y': [], 'text': [], 'color': G.nodes[node]['color']}
        x, y = pos[node]
        cluster_nodes[cluster]['x'].append(x)
        cluster_nodes[cluster]['y'].append(y)
        title = G.nodes[node

_truncate function · python · L9-L15 (7 LOC)