<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/archiving/1.2/JATS-archivearticle1.dtd">
<article article-type="brief-report" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-title-group>
        <journal-title>microPublication Biology</journal-title>
      </journal-title-group>
      <issn pub-type="epub">2578-9430</issn>
      <publisher>
        <publisher-name>Caltech Library</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.17912/micropub.biology.001796</article-id>
      <article-id pub-id-type="accession" assigning-authority="wormbase">WBPaper00069433</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>methodology</subject>
        </subj-group>
        <subj-group subj-group-type="subject">
          <subject>computational biology</subject>
        </subj-group>
        <subj-group subj-group-type="subject">
          <subject>interaction data</subject>
        </subj-group>
        <subj-group subj-group-type="subject">
          <subject>software</subject>
        </subj-group>
        <subj-group subj-group-type="subject">
          <subject>biochemistry</subject>
        </subj-group>
        <subj-group subj-group-type="subject">
          <subject>methods</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>zebrafish</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>arabidopsis</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>o. sativa</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>s. cerevisiae</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>escherichia coli</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>zea mays</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>human</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>rat</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>drosophila</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>gPPIpred: A User-Friendly PPI Predictor Based on Protein Molecular Graphs</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" equal-contrib="yes">
          <name>
            <surname>Matiolli</surname>
            <given-names>Cleverson C.</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/onceptualization">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing - review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing-review-editing">Writing - review &amp; editing</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision">Supervision</role>
          <xref ref-type="aff" rid="aff1">1</xref>
        </contrib>
        <contrib contrib-type="author" equal-contrib="yes">
          <name>
            <surname>Marques</surname>
            <given-names>Joana </given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing - original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft">Writing - original draft</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing - review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing-review-editing">Writing - review &amp; editing</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology">Methodology</role>
          <xref ref-type="aff" rid="aff1">1</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Abreu</surname>
            <given-names>Isabel A.</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/onceptualization">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision">Supervision</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing - review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing-review-editing">Writing - review &amp; editing</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition">Funding acquisition</role>
          <xref ref-type="aff" rid="aff1">1</xref>
          <xref ref-type="corresp" rid="cor1">§</xref>
        </contrib>
        <aff id="aff1">
          <label>1</label>
          Instituto de Tecnologia Química e Biológica António Xavier, Universidade Nova de Lisboa (ITQB NOVA), Avenida da República, 2780-157 Oeiras, Portugal
        </aff>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <anonymous/>
        </contrib>
      </contrib-group>
      <author-notes>
        <corresp id="cor1">
          <label>§</label>
          Correspondence to: Isabel A. Abreu (
          <email>abreu@itqb.unl.pt</email>
          )
        </corresp>
        <fn fn-type="coi-statement">
          <p>The authors declare that there are no conflicts of interest present.</p>
        </fn>
      </author-notes>
      <pub-date date-type="pub" publication-format="electronic">
        <day>10</day>
        <month>4</month>
        <year>2026</year>
      </pub-date>
      <pub-date date-type="collection" publication-format="electronic">
        <year>2026</year>
      </pub-date>
      <volume>2026</volume>
      <elocation-id>10.17912/micropub.biology.001796</elocation-id>
      <history>
        <date date-type="received">
          <day>12</day>
          <month>8</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>23</day>
          <month>2</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>10</day>
          <month>4</month>
          <year>2026</year>
        </date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 by the authors</copyright-statement>
        <copyright-year>2026</copyright-year>
        <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
        </license>
      </permissions>
      <abstract>
        <p>Protein–protein interactions (PPIs) govern essential cellular processes but remain challenging to characterize experimentally due to high cost and labor intensity. We present gPPIpred, a scalable computational framework leveraging graph neural networks (GNNs) and attention mechanisms to predict PPIs at residue-level resolution. Proteins are encoded as spatially informed molecular graphs integrating physicochemical features. Using curated structural datasets for training and validation, gPPIpred was fine-tuned to reliably predict positive interactions and actual interacting sites. Attention scores highlight key residues mediating interactions, offering interpretable insights to guide experimental design. gPPIpred combines high predictive performance with explainability, providing a user-friendly pipeline for large-scale PPI discovery.</p>
      </abstract>
      <funding-group>
        <funding-statement>
          We acknowledge the Portuguese Fundação para a Ciência e a Tecnologia (FCT) for a PhD fellowship for JM (
          <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.54499/2020.06917.BD">https://doi.org/10.54499/2020.06917.BD</ext-link>
          ) and project 
          <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.54499/PTDC/ASP-PLA/1920/2021">https://doi.org/10.54499/PTDC/ASP-PLA/1920/2021</ext-link>
          , which also supported CM contract. We also acknowledge funding by GREEN-it ‘Bioresources4sustainability’ (https://doi.org/10.54499/UIDB/04551/2020 ). The funding sources were not involved in analyses, interpretation of data, writing, or in the decision to submit this paper.
        </funding-statement>
      </funding-group>
    </article-meta>
  </front>
  <body>
    <fig position="anchor" id="f1">
      <label>Figure 1. gPPipred: a user friendly, protein-protein interaction predictor</label>
      <caption>
        <p>
          The gPPipred app, built in gradio, is available at: https://huggingface.co/spaces/1143Joana/gPPIpredv2_2 . 
          <bold>a)</bold>
           Model Convergence plot showing cross-entropy loss over 20 epochs. 
          <bold>b)</bold>
           Model Performance measured in MCC over 20 epochs of training. To calculate the MCC during training a balanced test dataset (10,000 samples) was used. MCC – Matthew’s correlation coefficient. 
          <bold>c) </bold>
          Precision and
          <bold/>
          Sensitivity
          <bold/>
          plot in function of interaction threshold.
          <bold> d)</bold>
           Receiver Operation Characteristic Curve. Final AUC-ROC: 0.9109. Optimal Threshold: 0.85. ROC - Receiver Operation Characteristic. AUC - Area Under the ROC Curve. 
          <bold>e)</bold>
           Confusion Matrix. MCC – Matthew’s correlation coefficient. 
          <bold>f)</bold>
           gPPipred web app. Users can input proteins by their UniProt Accession IDs. Additionally, users can define their desired threshold. 
          <bold>g)</bold>
           Here, we show an example of an output generated by gPPIpred. Once the program is finished analysing, the status area indicates how many preys were analysed. The chart shows the probability of each interaction as well as the line for the defined threshold. The interaction is considered positive if probability ≥ than the defined threshold. 
          <bold>h)</bold>
           Data area. Here, the users can find and download the list of the tested interactors. This list shows bait and prey IDs, the interaction probability, Binds (Yes, if probability ≥ than the defined threshold. No, probability &lt;&amp;nbsp; than the defined threshold), Bait and Prey Hotspots (Hotspot residues are at the interface of either bait or prey proteins that provide the bulk of the binding free energy (ΔG) for the specific interaction pair), and full sequences of Bait and Preys.
        </p>
      </caption>
    </fig>
    <graphic xlink:href="25789430-2026-micropub.biology.001796"/>
    <sec>
      <title>Description</title>
      <p>Protein–protein interactions (PPIs) are fundamental to essential biological processes, including signal transduction, immune response, and metabolic regulation. Traditionally, PPIs have been characterized using low-throughput experimental methods such as Fluorescence Resonance Energy Transfer (FRET), Bimolecular Fluorescence Complementation (BiFC), and yeast two-hybrid (Y2H) systems. High-throughput approaches often use mass spectrometry-coupled techniques, including co-immunoprecipitation (Co-IP) and tandem-affinity purification (TAP) (Bajar et al., 2016; Fields &amp; Song, 1989; Gavin et al., 2002; Ho et al., 2002; Low et al., 2021; Miller et al., 2015). However, these experimental techniques are often labor-intensive, time-consuming, costly, and prone to high rates of false positives and false negatives (Ito et al., 2001; Low et al., 2021; Mrowka et al., 2001). Recently, AlphaFold has provided a crucial advance in protein structural information by greatly increasing the number of high-accuracy protein structure models (Jumper et al., 2021; Varadi et al., 2022). As a result, computational approaches have emerged as efficient, scalable alternatives for PPI prediction.</p>
      <p>PPI prediction has relied on scalable computing techniques like machine learning (ML) and deep learning (DL) frameworks. Traditional ML techniques, such as support vector machines (SVM) and Random Forests, have been extensively used for PPI prediction (You et al., 2014, 2015). These methods typically use sequence-based features, including position-specific scoring matrices (PSSM), which capture evolutionary conservation, and physicochemical properties of amino acids to represent proteins (Guo et al., 2008; Shen et al., 2007). While effective, these methods depend on manual feature engineering, which limits scalability and hinders the integration of structural context. Advances in deep learning, particularly convolutional neural networks (CNNs) and recurrent neural networks (RNNs), have improved performance by learning high-level features directly from protein sequences (Hashemifar et al., 2018; Sun et al., 2017). However, these models often underutilize the structural information crucial for capturing the spatial relationships in protein interactions.</p>
      <p>Graph Neural Networks (GNNs) are a type of deep learning method that can infer information from graphically represented data. GNNs are now being used to integrate protein structural information with convolutional and recurrent networks to increase prediction robustness (Réau et al., 2021). Both Zhou et al. (2022) and Lee (2023) have summarized and compared methods that use GNN-based strategies (Lee, 2023; Zhou et al., 2022). AlphaFold represents a landmark in the application of GNNs to biological problems (Jumper et al., 2021; Varadi et al., 2022). While AlphaFold was initially used to predict the 3D structure of proteins, it can now be applied to predict complexes between proteins. Its latest update, AlphaFold3, can test interactions between a range of molecules, including DNA, RNA, ligands, ions, and proteins (Abramson et al., 2024). Notably, the model can now account for post-translational modifications and chemical modifications of nucleic acids. All of this is presented in a user-friendly environment, the AlphaFold server, where users only need to input their molecules sequences. However, it does not support high-throughput analysis, as users are limited to 30 jobs per day, and each job cannot exceed 5,000 tokens (1 amino acid =1 token).</p>
      <p>Here, we introduce gPPIpred, a novel framework that leverages Graph Neural Networks (GNNs) with integrated attention mechanisms to simultaneously consider physicochemical properties and structural information to predict PPIs. In gPPIpred, proteins are represented as residue-level graphs, where nodes correspond to amino acid residues and edges are established based on spatial proximity within three-dimensional protein structures. Each protein is modeled as a graph, with nodes representing residues of significant structural and functional relevance. Nodes encode the following residue-level physicochemical properties: hydrophobicity, volume, polarizability, pI, and pKa (see Feature Extraction section). The specific values for each amino acid are listed in Extended data  Table 1 (Kyte &amp; Doolittle, 1982). Edges in the graph are defined using a spatial threshold. By structuring the graph around both residue properties and spatial threshold rather than individual residues, the model effectively captures biologically relevant interaction motifs. For each predicted interacting pair, interaction hotspots are calculated via saliency mapping (see Methods). Here, the saliency mapping is based on the final interaction probability, providing information on which residues in both prey and bait are critical for that specific interaction.</p>
      <p>To iteratively refine residue embeddings, we employed a Graph Attention Network (GATv2) architecture. gPPIpred is a GATv2 model with eight layers of recursive message passing and multi-head attention. Two independent PPI datasets were created to train and validate this model. The breakdown of these datasets is in Table 1. The Siamese neural network was trained for 20 epochs using 128 shuffled graph batches. The use of shuffled batches and independent validation sets ensures the model's ability to generalize across different protein families. Cross-entropy losses observed during training are shown in Figure 1a. During training, the model exhibited a consistent decrease in cross-entropy loss, reaching convergence within 20 epochs.</p>
      <p>
        <bold>Table 1. Number of samples contained in each dataset</bold>
        . Number of Unique Proteins IDs in each dataset. No protein was used in both datasets to prevent data leakage. The percentage of species represented in each dataset is also listed.
      </p>
      <table-wrap>
        <table>
          <tbody>
            <tr>
              <td>
                <p>Dataset</p>
              </td>
              <td>
                <p>Total&amp;nbsp;</p>
              </td>
              <td>
                <p>Positive&amp;nbsp;</p>
                <p>interactions</p>
              </td>
              <td>
                <p>Negative&amp;nbsp;interactions</p>
              </td>
              <td>
                <p>Unique Proteins</p>
              </td>
            </tr>
            <tr>
              <td rowspan="4">
                <p>Training</p>
              </td>
              <td rowspan="4">
                <p>159,655 interactions:</p>
                <p>
                  77.87 % 
                  <italic>Homo sapiens</italic>
                  ,
                </p>
                <p>
                  22.05 % 
                  <italic>Arabidopsis thaliana</italic>
                  ,
                </p>
                <p>
                  0.05 % 
                  <italic>Oryza sativa</italic>
                  ,
                </p>
                <p>
                  0.02 % 
                  <italic>Saccharomyces cerevisiae</italic>
                </p>
              </td>
              <td rowspan="4">
                <p>77,508</p>
                <p>(48%)</p>
              </td>
              <td rowspan="4">
                <p>82,147</p>
                <p>(52%)</p>
              </td>
              <td rowspan="4">
                <p>10,349 proteins:</p>
                <p>
                  64 % 
                  <italic>Arabidopsis thaliana,</italic>
                </p>
                <p>
                  35 % 
                  <italic>Homo sapiens</italic>
                  ,
                </p>
                <p>
                  0.8 % 
                  <italic>Oryza sativa</italic>
                  ,
                </p>
                <p>
                  0.2 % 
                  <italic>Saccharomyces cerevisiae</italic>
                </p>
              </td>
            </tr>
            <tr>
              <td>
                <p>Validation</p>
              </td>
              <td>
                <p>72,358 interactions:&amp;nbsp;</p>
                <p>
                  50.42 % 
                  <italic>Homo sapiens</italic>
                  ,
                </p>
                <p>
                  49.54&amp;nbsp; % 
                  <italic>Saccharomyces cerevisiae</italic>
                </p>
              </td>
              <td>
                <p>36,179</p>
                <p>(50%)</p>
              </td>
              <td>
                <p>36,179</p>
                <p>(50%)</p>
              </td>
              <td>
                <p>4,192 proteins:</p>
                <p>
                  67.6 % 
                  <italic>Homo sapiens</italic>
                  ,
                </p>
                <p>
                  32.4 % 
                  <italic>Saccharomyces cerevisiae</italic>
                </p>
              </td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>The Matthew’s Correlation Coefficient (MCC) values obtained during each epoch are shown in Figure 1b. The GATv2-based Siamese network achieved an MCC of 0.57 during training. To verify the model’s ability to generalize to unseen biological data, we tested gPPIpred on an independent validation dataset of 72,358 protein pairs. The model achieved an MCC of 0.4641, confirming that the Siamese architecture and graph-based representations are not overfitting to specific protein families. The optimal threshold of 0.85 is determined by the point where Precision is maximized without sacrificing the model’s Sensitivity of 96% (Figure 1c). This threshold ensures the model remains a robust screening tool, capturing nearly all true interactions while maintaining an acceptable precision level. The performance metrics – ROC-AUC: 0.8451, MCC: 0.4641, and accuracy: 0.6992—reflect the model’s robust classification ability (Figure 1d). At a 0.85 threshold, performance differed between classes: non-binders (N = 36,179) showed high precision (0.91) but lower recall (0.43; F1 = 0.59), whereas binders (N = 36,801) showed high recall (0.96) with moderate precision (0.63; F1 = 0.76). Overall performance was balanced, with macro and weighted averages of 0.77 (precision), 0.70 (recall), and 0.68 (F1-score). The macro average of 0.70–0.77 across these metrics confirms that the model performs robustly for both classes, despite the distinct challenges each class presents. The high recall (96%) is particularly significant biologically, as it means nearly all true biological interactions are captured. The precision of 0.65 indicates a moderate rate of false positives. The confusion matrix (Figure 1e) shows that the model effectively prioritizes true-positive interactions, making it a viable computational filter for large-scale protein-protein interaction screening.</p>
      <p>This level of performance is especially notable given that the training dataset included proteins from diverse species, representing a broad spectrum of the proteome (Table 1). We offer gPPIpred in two ways: as a ready-to-use app accessible here (https://huggingface.co/spaces/1143Joana/gPPIpredv2_2), or by installing gPPIpred (see Extended Data section). To use the app, users only need to provide the UniProt IDs to run a query and define a threshold (Figure 1f). Once the prediction is complete, a bar chart will appear, providing the full list of preys and their interactions probabilities (Figure 1g). Additionally, in the data window, users can find and download the list of tested interactors. This list shows bait and prey IDs, interaction probability, Binds (Yes, if probability ≥ than the defined threshold; No, if probability &lt; than the defined threshold), Bait and Prey Hotspots (hotspot residues are at the interface of either bait or prey proteins and provide the bulk of the binding free energy (ΔG) for the specific interaction pair), and the full sequences of Bait and Preys (Figure 1h).</p>
      <p>
        To install gPPIpred, the following dependencies are required: Python 3.8+, PyTorch, PyTorch Geometric (PyG), and BioPython. We recommend using an NVIDIA GPU with CUDA support due to the high computational demand of graph attention mechanisms; however, execution on a CPU is possible. For the full list of requirements, see the Extended Data section. When using the manually installed version, gPPIpred will generate a link redirecting to an interface like the one shown in 
        <xref ref-type="fig" rid="f1">Figure 1,</xref>
         making it easy to use once installed.
      </p>
      <p>Despite its strengths, gPPIpred has limitations. For example, it depends on the availability of protein structural data, such as high-quality 3D structures, whether experimental or predicted, which are required to construct accurate graphs. Therefore, gPPIpred should not be used to predict interactions involving proteins that are intrinsically disordered or lack a reliable structural model, as this will yield low-confidence results.</p>
      <p>Overall, by leveraging structural representations through graph-based learning and integrating advanced embedding techniques, gPPIpred reduces research costs associated with large-scale interaction screenings and enhances our understanding of the structural determinants of protein interactions. The detailed insights provided by residue-level predictions have important implications for studying the biological mechanisms underlying these interactions, potentially guiding experimental validation and therapeutic targeting. The practical utility of gPPIpred is further enhanced by its interpretability via Saliency Mapping. For the predicted interactions, the model successfully identified residue-level hotspots at the interaction interfaces. The residues assigned the highest saliency scores correspond to those with significant functional relevance, such as those involved in hydrogen bonding or hydrophobic packing at the interface. These "saliency-identified" residues provide a direct roadmap for experimentalists looking to validate predictions through point mutations. Additionally, the gPPIpred pipeline facilitates PPI predictions by offering a simplified interface that automates the download and processing of protein and compound structural files, generates interactive 3D plots to visualize putative interaction sites, and creates detailed reports.</p>
    </sec>
    <sec>
      <title>Methods</title>
      <p>
        <bold>Dataset Preparation</bold>
      </p>
      <p>The training and validation datasets are available in the Extended Data section. Positive interaction data were curated from the Gold Standard Dataset and multi-validated experiments from BioGRID (Bernett, 2022; Chatr-Aryamontri et al., 2015; Oughtred et al., 2021; Szklarczyk et al., 2019). A common strategy for generating negative datasets is Subcellular Localization Filtering, which involves selecting proteins from different subcellular locations and labeling them as non-interacting. Although this strategy is widely accepted, the risk of false negatives can be further reduced by using experimentally validated negative examples. Therefore, we used a negative dataset curated by Russel Lab, dataset Stelzl (2005) (Stelzl et al., 2005; Trabuco et al., 2012). For negative interactions, the shortest path between the two proteins in the underlying two-hybrid interactome is assigned a confidence score in the following format: shortestPath:2, shortestPath:3, etc., or shortestPath:NA if there is no path connecting the two proteins. We created two separate datasets, ensuring that no individual protein sequence appeared in both datasets to prevent data leakage (Table 1). Only interactions where both proteins had high-resolution structures were included. When possible, we ensured the model had examples of both positive and negative interactions for the same protein.</p>
      <p>
        <bold>Protein Graph Construction</bold>
      </p>
      <p>Protein graphs were constructed by representing individual residues as nodes, with edges indicating spatial proximity based on a distance threshold of less than 9.5 Å between alpha carbon atoms. This threshold provides an accurate representation of the protein's tertiary structure and local chemical environment. Preprocessing included extracting Cartesian coordinates (x, y, z) from structural files and standardizing amino acid nomenclature into single-letter codes (Berman et al., 2000). To maximize structural coverage, we integrated experimentally determined structures from the PDB with high-confidence predicted models from AlphaFold2 (Jumper et al., 2021; Varadi et al., 2022). Missing entries were retrieved via the AlphaFold API, resulting in a nearly complete structural dataset. Node features were defined by a five-dimensional vector of physicochemical properties (hydrophobicity, volume, polarizability, pI, and pKa), while edges were defined by Euclidean distances, capturing the spatial constraints essential for predicting protein-protein interactions.</p>
      <p>
        <bold>Feature Extraction</bold>
      </p>
      <p>Node-level embeddings were generated by assigning relative values (0 to 1) for five physicochemical properties to each amino acid (Extended data Table 1). Thus, the model recognizes that 1.0 represents the maximum expression of that specific property. Each physicochemical property provides the model with different information. Hydrophobicity indicates the tendency of an amino acid to repel water, with 1 being the most hydrophobic and 0 the least. Volume is calculated as the Van der Waals volume, where 1 corresponds to the largest and 0 to the smallest amino acid. Polarizability measures how well an amino acid can engage in Van der Waals or London dispersion forces. Mathematically, polarizability (α) is defined as α = p/E, where p is the induced dipole moment and E is the electric field. Colloquially, polarizability reflects how "sticky" an amino acid is. The isoelectric point (pI) is calculated as pI = (pKa1 + pKa2)/2, indicating how basic (1) or acidic (0) an amino acid is. The dissociation constant (pKa) is determined empirically and informs the model whether a residue will be protonated or deprotonated at pH 7.4. These features capture local structural motifs and inter-residue interactions, enabling the model to identify spatial dependencies critical for predicting PPIs. The residue adjacency matrices, constructed with a 9.5 Å spatial threshold, preserved topological structures and emphasized meaningful connections between residues (Kipf &amp; Welling, 2016).</p>
      <p>
        <bold>Graph Neural Network Architecture</bold>
      </p>
      <p>A Graph Attention Network (GATv2) architecture was employed to iteratively refine residue embeddings. Through eight layers of recursive message passing and multi-head attention, the model aggregated neighborhood information into a global graph-level representation (Brody et al., 2021). This process ensured that the final representations were robust descriptors of protein geometry and chemistry, forming the foundation for accurate interaction prediction.</p>
      <p>
        <bold>Training and Validation</bold>
      </p>
      <p>The gPPIpred model was implemented as a Siamese Neural Network, a dual-stream architecture designed to learn relationships between pairs of entities. The gPPIpred GATv2 was trained for 20 epochs in batches of 128 shuffled graphs (Figure 1a and b). Here, we use a Siamese neural network that employs error back-propagation during training; the networks operate in parallel and compare their outputs at the end, usually using cosine distance. The training and validation scripts can be found in the Extended Data section.</p>
      <p>
        <bold>Interaction Site Analysis</bold>
      </p>
      <p>To move beyond "black-box" predictions, we used Saliency Mapping to identify interaction "hotspots." Saliency mapping calculates the gradient of the output probability with respect to the input node features. By visualizing these gradients, we can identify specific residues that contribute most to the predicted binding event. These residues typically correspond to interface regions that provide most of the binding free energy (ΔG), offering actionable targets for site-directed mutagenesis or therapeutic intervention.</p>
    </sec>
  </body>
  <back>
    <ack>
      <sec>
        <p>The authors thank the BioGRID, IntAct, and PDB teams for providing invaluable datasets, and the developers of ProtBERT for enabling advanced feature extraction.</p>
      </sec>
    </ack>
    <ref-list>
      <ref id="R1">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Abramson</surname>
              <given-names>Josh</given-names>
            </name>
            <name>
              <surname>Adler</surname>
              <given-names>Jonas</given-names>
            </name>
            <name>
              <surname>Dunger</surname>
              <given-names>Jack</given-names>
            </name>
            <name>
              <surname>Evans</surname>
              <given-names>Richard</given-names>
            </name>
            <name>
              <surname>Green</surname>
              <given-names>Tim</given-names>
            </name>
            <name>
              <surname>Pritzel</surname>
              <given-names>Alexander</given-names>
            </name>
            <name>
              <surname>Ronneberger</surname>
              <given-names>Olaf</given-names>
            </name>
            <name>
              <surname>Willmore</surname>
              <given-names>Lindsay</given-names>
            </name>
            <name>
              <surname>Ballard</surname>
              <given-names>Andrew J.</given-names>
            </name>
            <name>
              <surname>Bambrick</surname>
              <given-names>Joshua</given-names>
            </name>
            <name>
              <surname>Bodenstein</surname>
              <given-names>Sebastian W.</given-names>
            </name>
            <name>
              <surname>Evans</surname>
              <given-names>David A.</given-names>
            </name>
            <name>
              <surname>Hung</surname>
              <given-names>Chia-Chun</given-names>
            </name>
            <name>
              <surname>O’Neill</surname>
              <given-names>Michael</given-names>
            </name>
            <name>
              <surname>Reiman</surname>
              <given-names>David</given-names>
            </name>
            <name>
              <surname>Tunyasuvunakool</surname>
              <given-names>Kathryn</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>Zachary</given-names>
            </name>
            <name>
              <surname>Žemgulytė</surname>
              <given-names>Akvilė</given-names>
            </name>
            <name>
              <surname>Arvaniti</surname>
              <given-names>Eirini</given-names>
            </name>
            <name>
              <surname>Beattie</surname>
              <given-names>Charles</given-names>
            </name>
            <name>
              <surname>Bertolli</surname>
              <given-names>Ottavia</given-names>
            </name>
            <name>
              <surname>Bridgland</surname>
              <given-names>Alex</given-names>
            </name>
            <name>
              <surname>Cherepanov</surname>
              <given-names>Alexey</given-names>
            </name>
            <name>
              <surname>Congreve</surname>
              <given-names>Miles</given-names>
            </name>
            <name>
              <surname>Cowen-Rivers</surname>
              <given-names>Alexander I.</given-names>
            </name>
            <name>
              <surname>Cowie</surname>
              <given-names>Andrew</given-names>
            </name>
            <name>
              <surname>Figurnov</surname>
              <given-names>Michael</given-names>
            </name>
            <name>
              <surname>Fuchs</surname>
              <given-names>Fabian B.</given-names>
            </name>
            <name>
              <surname>Gladman</surname>
              <given-names>Hannah</given-names>
            </name>
            <name>
              <surname>Jain</surname>
              <given-names>Rishub</given-names>
            </name>
            <name>
              <surname>Khan</surname>
              <given-names>Yousuf A.</given-names>
            </name>
            <name>
              <surname>Low</surname>
              <given-names>Caroline M. R.</given-names>
            </name>
            <name>
              <surname>Perlin</surname>
              <given-names>Kuba</given-names>
            </name>
            <name>
              <surname>Potapenko</surname>
              <given-names>Anna</given-names>
            </name>
            <name>
              <surname>Savy</surname>
              <given-names>Pascal</given-names>
            </name>
            <name>
              <surname>Singh</surname>
              <given-names>Sukhdeep</given-names>
            </name>
            <name>
              <surname>Stecula</surname>
              <given-names>Adrian</given-names>
            </name>
            <name>
              <surname>Thillaisundaram</surname>
              <given-names>Ashok</given-names>
            </name>
            <name>
              <surname>Tong</surname>
              <given-names>Catherine</given-names>
            </name>
            <name>
              <surname>Yakneen</surname>
              <given-names>Sergei</given-names>
            </name>
            <name>
              <surname>Zhong</surname>
              <given-names>Ellen D.</given-names>
            </name>
            <name>
              <surname>Zielinski</surname>
              <given-names>Michal</given-names>
            </name>
            <name>
              <surname>Žídek</surname>
              <given-names>Augustin</given-names>
            </name>
            <name>
              <surname>Bapst</surname>
              <given-names>Victor</given-names>
            </name>
            <name>
              <surname>Kohli</surname>
              <given-names>Pushmeet</given-names>
            </name>
            <name>
              <surname>Jaderberg</surname>
              <given-names>Max</given-names>
            </name>
            <name>
              <surname>Hassabis</surname>
              <given-names>Demis</given-names>
            </name>
            <name>
              <surname>Jumper</surname>
              <given-names>John M.</given-names>
            </name>
          </person-group>
          <year>2024</year>
          <month>5</month>
          <day>8</day>
          <article-title>Accurate structure prediction of biomolecular interactions with AlphaFold 3</article-title>
          <source>Nature</source>
          <volume>630</volume>
          <issue>8016</issue>
          <issn>0028-0836</issn>
          <fpage>493</fpage>
          <lpage>500</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-024-07487-w</pub-id>
        </element-citation>
      </ref>
      <ref id="R2">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bajar</surname>
              <given-names>Bryce</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Emily</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Shu</given-names>
            </name>
            <name>
              <surname>Lin</surname>
              <given-names>Michael</given-names>
            </name>
            <name>
              <surname>Chu</surname>
              <given-names>Jun</given-names>
            </name>
          </person-group>
          <year>2016</year>
          <month>9</month>
          <day>14</day>
          <article-title>A Guide to Fluorescent Protein FRET Pairs</article-title>
          <source>Sensors</source>
          <volume>16</volume>
          <issue>9</issue>
          <issn>1424-8220</issn>
          <fpage>1488</fpage>
          <lpage>1488</lpage>
          <pub-id pub-id-type="doi">10.3390/s16091488</pub-id>
        </element-citation>
      </ref>
      <ref id="R3">
        <mixed-citation>Bernett, Judith (2022). PPI prediction from sequence, gold standard dataset. figshare. Dataset. https://doi.org/10.6084/m9.figshare.21591618.v3</mixed-citation>
      </ref>
      <ref id="R4">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Berman</surname>
              <given-names>Helen M.</given-names>
            </name>
            <name>
              <surname>Bhat</surname>
              <given-names>T. N.</given-names>
            </name>
            <name>
              <surname>Bourne</surname>
              <given-names>Philip E.</given-names>
            </name>
            <name>
              <surname>Feng</surname>
              <given-names>Zukang</given-names>
            </name>
            <name>
              <surname>Gilliland</surname>
              <given-names>Gary</given-names>
            </name>
            <name>
              <surname>Weissig</surname>
              <given-names>Helge</given-names>
            </name>
            <name>
              <surname>Westbrook</surname>
              <given-names>John</given-names>
            </name>
          </person-group>
          <year>2000</year>
          <month>11</month>
          <day>1</day>
          <article-title>null</article-title>
          <source>Nature Structural Biology</source>
          <volume>7</volume>
          <issn>1072-8368</issn>
          <fpage>957</fpage>
          <lpage>959</lpage>
          <pub-id pub-id-type="doi">10.1038/80734</pub-id>
        </element-citation>
      </ref>
      <ref id="R5">
        <mixed-citation>
          Brody, S., Alon, U., &amp; Yahav, E.&amp;nbsp;(2021).&amp;nbsp;How Attentive are Graph Attention Networks?&amp;nbsp;
          <italic>ArXiv</italic>
          .&amp;nbsp;https://arxiv.org/abs/2105.14491
        </mixed-citation>
      </ref>
      <ref id="R6">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chatr-aryamontri</surname>
              <given-names>Andrew</given-names>
            </name>
            <name>
              <surname>Breitkreutz</surname>
              <given-names>Bobby-Joe</given-names>
            </name>
            <name>
              <surname>Oughtred</surname>
              <given-names>Rose</given-names>
            </name>
            <name>
              <surname>Boucher</surname>
              <given-names>Lorrie</given-names>
            </name>
            <name>
              <surname>Heinicke</surname>
              <given-names>Sven</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>Daici</given-names>
            </name>
            <name>
              <surname>Stark</surname>
              <given-names>Chris</given-names>
            </name>
            <name>
              <surname>Breitkreutz</surname>
              <given-names>Ashton</given-names>
            </name>
            <name>
              <surname>Kolas</surname>
              <given-names>Nadine</given-names>
            </name>
            <name>
              <surname>O'Donnell</surname>
              <given-names>Lara</given-names>
            </name>
            <name>
              <surname>Reguly</surname>
              <given-names>Teresa</given-names>
            </name>
            <name>
              <surname>Nixon</surname>
              <given-names>Julie</given-names>
            </name>
            <name>
              <surname>Ramage</surname>
              <given-names>Lindsay</given-names>
            </name>
            <name>
              <surname>Winter</surname>
              <given-names>Andrew</given-names>
            </name>
            <name>
              <surname>Sellam</surname>
              <given-names>Adnane</given-names>
            </name>
            <name>
              <surname>Chang</surname>
              <given-names>Christie</given-names>
            </name>
            <name>
              <surname>Hirschman</surname>
              <given-names>Jodi</given-names>
            </name>
            <name>
              <surname>Theesfeld</surname>
              <given-names>Chandra</given-names>
            </name>
            <name>
              <surname>Rust</surname>
              <given-names>Jennifer</given-names>
            </name>
            <name>
              <surname>Livstone</surname>
              <given-names>Michael S.</given-names>
            </name>
            <name>
              <surname>Dolinski</surname>
              <given-names>Kara</given-names>
            </name>
            <name>
              <surname>Tyers</surname>
              <given-names>Mike</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <month>11</month>
          <day>26</day>
          <article-title>The BioGRID interaction database: 2015 update</article-title>
          <source>Nucleic Acids Research</source>
          <volume>43</volume>
          <issue>D1</issue>
          <issn>1362-4962</issn>
          <fpage>D470</fpage>
          <lpage>D478</lpage>
          <pub-id pub-id-type="doi">10.1093/nar/gku1204</pub-id>
        </element-citation>
      </ref>
      <ref id="R7">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fields</surname>
              <given-names>Stanley</given-names>
            </name>
            <name>
              <surname>Song</surname>
              <given-names>Ok-kyu</given-names>
            </name>
          </person-group>
          <year>1989</year>
          <month>7</month>
          <day>1</day>
          <article-title>A novel genetic system to detect protein–protein interactions</article-title>
          <source>Nature</source>
          <volume>340</volume>
          <issue>6230</issue>
          <issn>0028-0836</issn>
          <fpage>245</fpage>
          <lpage>246</lpage>
          <pub-id pub-id-type="doi">10.1038/340245a0</pub-id>
        </element-citation>
      </ref>
      <ref id="R8">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gavin</surname>
              <given-names>Anne-Claude</given-names>
            </name>
            <name>
              <surname>Bösche</surname>
              <given-names>Markus</given-names>
            </name>
            <name>
              <surname>Krause</surname>
              <given-names>Roland</given-names>
            </name>
            <name>
              <surname>Grandi</surname>
              <given-names>Paola</given-names>
            </name>
            <name>
              <surname>Marzioch</surname>
              <given-names>Martina</given-names>
            </name>
            <name>
              <surname>Bauer</surname>
              <given-names>Andreas</given-names>
            </name>
            <name>
              <surname>Schultz</surname>
              <given-names>Jörg</given-names>
            </name>
            <name>
              <surname>Rick</surname>
              <given-names>Jens M.</given-names>
            </name>
            <name>
              <surname>Michon</surname>
              <given-names>Anne-Marie</given-names>
            </name>
            <name>
              <surname>Cruciat</surname>
              <given-names>Cristina-Maria</given-names>
            </name>
            <name>
              <surname>Remor</surname>
              <given-names>Marita</given-names>
            </name>
            <name>
              <surname>Höfert</surname>
              <given-names>Christian</given-names>
            </name>
            <name>
              <surname>Schelder</surname>
              <given-names>Malgorzata</given-names>
            </name>
            <name>
              <surname>Brajenovic</surname>
              <given-names>Miro</given-names>
            </name>
            <name>
              <surname>Ruffner</surname>
              <given-names>Heinz</given-names>
            </name>
            <name>
              <surname>Merino</surname>
              <given-names>Alejandro</given-names>
            </name>
            <name>
              <surname>Klein</surname>
              <given-names>Karin</given-names>
            </name>
            <name>
              <surname>Hudak</surname>
              <given-names>Manuela</given-names>
            </name>
            <name>
              <surname>Dickson</surname>
              <given-names>David</given-names>
            </name>
            <name>
              <surname>Rudi</surname>
              <given-names>Tatjana</given-names>
            </name>
            <name>
              <surname>Gnau</surname>
              <given-names>Volker</given-names>
            </name>
            <name>
              <surname>Bauch</surname>
              <given-names>Angela</given-names>
            </name>
            <name>
              <surname>Bastuck</surname>
              <given-names>Sonja</given-names>
            </name>
            <name>
              <surname>Huhse</surname>
              <given-names>Bettina</given-names>
            </name>
            <name>
              <surname>Leutwein</surname>
              <given-names>Christina</given-names>
            </name>
            <name>
              <surname>Heurtier</surname>
              <given-names>Marie-Anne</given-names>
            </name>
            <name>
              <surname>Copley</surname>
              <given-names>Richard R.</given-names>
            </name>
            <name>
              <surname>Edelmann</surname>
              <given-names>Angela</given-names>
            </name>
            <name>
              <surname>Querfurth</surname>
              <given-names>Erich</given-names>
            </name>
            <name>
              <surname>Rybin</surname>
              <given-names>Vladimir</given-names>
            </name>
            <name>
              <surname>Drewes</surname>
              <given-names>Gerard</given-names>
            </name>
            <name>
              <surname>Raida</surname>
              <given-names>Manfred</given-names>
            </name>
            <name>
              <surname>Bouwmeester</surname>
              <given-names>Tewis</given-names>
            </name>
            <name>
              <surname>Bork</surname>
              <given-names>Peer</given-names>
            </name>
            <name>
              <surname>Seraphin</surname>
              <given-names>Bertrand</given-names>
            </name>
            <name>
              <surname>Kuster</surname>
              <given-names>Bernhard</given-names>
            </name>
            <name>
              <surname>Neubauer</surname>
              <given-names>Gitte</given-names>
            </name>
            <name>
              <surname>Superti-Furga</surname>
              <given-names>Giulio</given-names>
            </name>
          </person-group>
          <year>2002</year>
          <month>1</month>
          <day>1</day>
          <article-title>Functional organization of the yeast proteome by systematic analysis of protein complexes</article-title>
          <source>Nature</source>
          <volume>415</volume>
          <issue>6868</issue>
          <issn>0028-0836</issn>
          <fpage>141</fpage>
          <lpage>147</lpage>
          <pub-id pub-id-type="doi">10.1038/415141a</pub-id>
        </element-citation>
      </ref>
      <ref id="R9">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Guo</surname>
              <given-names>Yanzhi</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>Lezheng</given-names>
            </name>
            <name>
              <surname>Wen</surname>
              <given-names>Zhining</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Menglong</given-names>
            </name>
          </person-group>
          <year>2008</year>
          <month>4</month>
          <day>4</day>
          <article-title>Using support vector machine combined with auto covariance to predict protein–protein interactions from protein sequences</article-title>
          <source>Nucleic Acids Research</source>
          <volume>36</volume>
          <issue>9</issue>
          <issn>1362-4962</issn>
          <fpage>3025</fpage>
          <lpage>3030</lpage>
          <pub-id pub-id-type="doi">10.1093/nar/gkn159</pub-id>
        </element-citation>
      </ref>
      <ref id="R10">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hashemifar</surname>
              <given-names>Somaye</given-names>
            </name>
            <name>
              <surname>Neyshabur</surname>
              <given-names>Behnam</given-names>
            </name>
            <name>
              <surname>Khan</surname>
              <given-names>Aly A</given-names>
            </name>
            <name>
              <surname>Xu</surname>
              <given-names>Jinbo</given-names>
            </name>
          </person-group>
          <year>2018</year>
          <month>9</month>
          <day>1</day>
          <article-title>Predicting protein–protein interactions through sequence-based deep learning</article-title>
          <source>Bioinformatics</source>
          <volume>34</volume>
          <issue>17</issue>
          <issn>1367-4803</issn>
          <fpage>i802</fpage>
          <lpage>i810</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/bty573</pub-id>
        </element-citation>
      </ref>
      <ref id="R11">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ho</surname>
              <given-names>Yuen</given-names>
            </name>
            <name>
              <surname>Gruhler</surname>
              <given-names>Albrecht</given-names>
            </name>
            <name>
              <surname>Heilbut</surname>
              <given-names>Adrian</given-names>
            </name>
            <name>
              <surname>Bader</surname>
              <given-names>Gary D.</given-names>
            </name>
            <name>
              <surname>Moore</surname>
              <given-names>Lynda</given-names>
            </name>
            <name>
              <surname>Adams</surname>
              <given-names>Sally-Lin</given-names>
            </name>
            <name>
              <surname>Millar</surname>
              <given-names>Anna</given-names>
            </name>
            <name>
              <surname>Taylor</surname>
              <given-names>Paul</given-names>
            </name>
            <name>
              <surname>Bennett</surname>
              <given-names>Keiryn</given-names>
            </name>
            <name>
              <surname>Boutilier</surname>
              <given-names>Kelly</given-names>
            </name>
            <name>
              <surname>Yang</surname>
              <given-names>Lingyun</given-names>
            </name>
            <name>
              <surname>Wolting</surname>
              <given-names>Cheryl</given-names>
            </name>
            <name>
              <surname>Donaldson</surname>
              <given-names>Ian</given-names>
            </name>
            <name>
              <surname>Schandorff</surname>
              <given-names>Søren</given-names>
            </name>
            <name>
              <surname>Shewnarane</surname>
              <given-names>Juanita</given-names>
            </name>
            <name>
              <surname>Vo</surname>
              <given-names>Mai</given-names>
            </name>
            <name>
              <surname>Taggart</surname>
              <given-names>Joanne</given-names>
            </name>
            <name>
              <surname>Goudreault</surname>
              <given-names>Marilyn</given-names>
            </name>
            <name>
              <surname>Muskat</surname>
              <given-names>Brenda</given-names>
            </name>
            <name>
              <surname>Alfarano</surname>
              <given-names>Cris</given-names>
            </name>
            <name>
              <surname>Dewar</surname>
              <given-names>Danielle</given-names>
            </name>
            <name>
              <surname>Lin</surname>
              <given-names>Zhen</given-names>
            </name>
            <name>
              <surname>Michalickova</surname>
              <given-names>Katerina</given-names>
            </name>
            <name>
              <surname>Willems</surname>
              <given-names>Andrew R.</given-names>
            </name>
            <name>
              <surname>Sassi</surname>
              <given-names>Holly</given-names>
            </name>
            <name>
              <surname>Nielsen</surname>
              <given-names>Peter A.</given-names>
            </name>
            <name>
              <surname>Rasmussen</surname>
              <given-names>Karina J.</given-names>
            </name>
            <name>
              <surname>Andersen</surname>
              <given-names>Jens R.</given-names>
            </name>
            <name>
              <surname>Johansen</surname>
              <given-names>Lene E.</given-names>
            </name>
            <name>
              <surname>Hansen</surname>
              <given-names>Lykke H.</given-names>
            </name>
            <name>
              <surname>Jespersen</surname>
              <given-names>Hans</given-names>
            </name>
            <name>
              <surname>Podtelejnikov</surname>
              <given-names>Alexandre</given-names>
            </name>
            <name>
              <surname>Nielsen</surname>
              <given-names>Eva</given-names>
            </name>
            <name>
              <surname>Crawford</surname>
              <given-names>Janne</given-names>
            </name>
            <name>
              <surname>Poulsen</surname>
              <given-names>Vibeke</given-names>
            </name>
            <name>
              <surname>Sørensen</surname>
              <given-names>Birgitte D.</given-names>
            </name>
            <name>
              <surname>Matthiesen</surname>
              <given-names>Jesper</given-names>
            </name>
            <name>
              <surname>Hendrickson</surname>
              <given-names>Ronald C.</given-names>
            </name>
            <name>
              <surname>Gleeson</surname>
              <given-names>Frank</given-names>
            </name>
            <name>
              <surname>Pawson</surname>
              <given-names>Tony</given-names>
            </name>
            <name>
              <surname>Moran</surname>
              <given-names>Michael F.</given-names>
            </name>
            <name>
              <surname>Durocher</surname>
              <given-names>Daniel</given-names>
            </name>
            <name>
              <surname>Mann</surname>
              <given-names>Matthias</given-names>
            </name>
            <name>
              <surname>Hogue</surname>
              <given-names>Christopher W. V.</given-names>
            </name>
            <name>
              <surname>Figeys</surname>
              <given-names>Daniel</given-names>
            </name>
            <name>
              <surname>Tyers</surname>
              <given-names>Mike</given-names>
            </name>
          </person-group>
          <year>2002</year>
          <month>1</month>
          <day>1</day>
          <article-title>Systematic identification of protein complexes in Saccharomyces cerevisiae by mass spectrometry</article-title>
          <source>Nature</source>
          <volume>415</volume>
          <issue>6868</issue>
          <issn>0028-0836</issn>
          <fpage>180</fpage>
          <lpage>183</lpage>
          <pub-id pub-id-type="doi">10.1038/415180a</pub-id>
        </element-citation>
      </ref>
      <ref id="R12">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ito</surname>
              <given-names>Takashi</given-names>
            </name>
            <name>
              <surname>Chiba</surname>
              <given-names>Tomoko</given-names>
            </name>
            <name>
              <surname>Ozawa</surname>
              <given-names>Ritsuko</given-names>
            </name>
            <name>
              <surname>Yoshida</surname>
              <given-names>Mikio</given-names>
            </name>
            <name>
              <surname>Hattori</surname>
              <given-names>Masahira</given-names>
            </name>
            <name>
              <surname>Sakaki</surname>
              <given-names>Yoshiyuki</given-names>
            </name>
          </person-group>
          <year>2001</year>
          <month>3</month>
          <day>13</day>
          <article-title>A comprehensive two-hybrid analysis to explore the yeast protein interactome</article-title>
          <source>Proceedings of the National Academy of Sciences</source>
          <volume>98</volume>
          <issue>8</issue>
          <issn>0027-8424</issn>
          <fpage>4569</fpage>
          <lpage>4574</lpage>
          <pub-id pub-id-type="doi">10.1073/pnas.061034498</pub-id>
        </element-citation>
      </ref>
      <ref id="R13">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Jumper</surname>
              <given-names>John</given-names>
            </name>
            <name>
              <surname>Evans</surname>
              <given-names>Richard</given-names>
            </name>
            <name>
              <surname>Pritzel</surname>
              <given-names>Alexander</given-names>
            </name>
            <name>
              <surname>Green</surname>
              <given-names>Tim</given-names>
            </name>
            <name>
              <surname>Figurnov</surname>
              <given-names>Michael</given-names>
            </name>
            <name>
              <surname>Ronneberger</surname>
              <given-names>Olaf</given-names>
            </name>
            <name>
              <surname>Tunyasuvunakool</surname>
              <given-names>Kathryn</given-names>
            </name>
            <name>
              <surname>Bates</surname>
              <given-names>Russ</given-names>
            </name>
            <name>
              <surname>Žídek</surname>
              <given-names>Augustin</given-names>
            </name>
            <name>
              <surname>Potapenko</surname>
              <given-names>Anna</given-names>
            </name>
            <name>
              <surname>Bridgland</surname>
              <given-names>Alex</given-names>
            </name>
            <name>
              <surname>Meyer</surname>
              <given-names>Clemens</given-names>
            </name>
            <name>
              <surname>Kohl</surname>
              <given-names>Simon A. A.</given-names>
            </name>
            <name>
              <surname>Ballard</surname>
              <given-names>Andrew J.</given-names>
            </name>
            <name>
              <surname>Cowie</surname>
              <given-names>Andrew</given-names>
            </name>
            <name>
              <surname>Romera-Paredes</surname>
              <given-names>Bernardino</given-names>
            </name>
            <name>
              <surname>Nikolov</surname>
              <given-names>Stanislav</given-names>
            </name>
            <name>
              <surname>Jain</surname>
              <given-names>Rishub</given-names>
            </name>
            <name>
              <surname>Adler</surname>
              <given-names>Jonas</given-names>
            </name>
            <name>
              <surname>Back</surname>
              <given-names>Trevor</given-names>
            </name>
            <name>
              <surname>Petersen</surname>
              <given-names>Stig</given-names>
            </name>
            <name>
              <surname>Reiman</surname>
              <given-names>David</given-names>
            </name>
            <name>
              <surname>Clancy</surname>
              <given-names>Ellen</given-names>
            </name>
            <name>
              <surname>Zielinski</surname>
              <given-names>Michal</given-names>
            </name>
            <name>
              <surname>Steinegger</surname>
              <given-names>Martin</given-names>
            </name>
            <name>
              <surname>Pacholska</surname>
              <given-names>Michalina</given-names>
            </name>
            <name>
              <surname>Berghammer</surname>
              <given-names>Tamas</given-names>
            </name>
            <name>
              <surname>Bodenstein</surname>
              <given-names>Sebastian</given-names>
            </name>
            <name>
              <surname>Silver</surname>
              <given-names>David</given-names>
            </name>
            <name>
              <surname>Vinyals</surname>
              <given-names>Oriol</given-names>
            </name>
            <name>
              <surname>Senior</surname>
              <given-names>Andrew W.</given-names>
            </name>
            <name>
              <surname>Kavukcuoglu</surname>
              <given-names>Koray</given-names>
            </name>
            <name>
              <surname>Kohli</surname>
              <given-names>Pushmeet</given-names>
            </name>
            <name>
              <surname>Hassabis</surname>
              <given-names>Demis</given-names>
            </name>
          </person-group>
          <year>2021</year>
          <month>7</month>
          <day>15</day>
          <article-title>Highly accurate protein structure prediction with AlphaFold</article-title>
          <source>Nature</source>
          <volume>596</volume>
          <issue>7873</issue>
          <issn>0028-0836</issn>
          <fpage>583</fpage>
          <lpage>589</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-021-03819-2</pub-id>
        </element-citation>
      </ref>
      <ref id="R14">
        <element-citation publication-type="Preprint">
          <person-group person-group-type="author">
            <name>
              <surname>Kipf</surname>
              <given-names>Thomas N.</given-names>
            </name>
            <name>
              <surname>Welling</surname>
              <given-names>Max</given-names>
            </name>
          </person-group>
          <year>2016</year>
          <article-title>Semi-Supervised Classification with Graph Convolutional Networks</article-title>
          <pub-id pub-id-type="doi">10.48550/arxiv.1609.02907</pub-id>
        </element-citation>
      </ref>
      <ref id="R15">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kyte</surname>
              <given-names>Jack</given-names>
            </name>
            <name>
              <surname>Doolittle</surname>
              <given-names>Russell F.</given-names>
            </name>
          </person-group>
          <year>1982</year>
          <month>5</month>
          <day>1</day>
          <article-title>A simple method for displaying the hydropathic character of a protein</article-title>
          <source>Journal of Molecular Biology</source>
          <volume>157</volume>
          <issue>1</issue>
          <issn>0022-2836</issn>
          <fpage>105</fpage>
          <lpage>132</lpage>
          <pub-id pub-id-type="doi">10.1016/0022-2836(82)90515-0</pub-id>
        </element-citation>
      </ref>
      <ref id="R16">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Lee</surname>
              <given-names>Minhyeok</given-names>
            </name>
          </person-group>
          <year>2023</year>
          <month>7</month>
          <day>2</day>
          <article-title>Recent Advances in Deep Learning for Protein-Protein Interaction Analysis: A Comprehensive Review</article-title>
          <source>Molecules</source>
          <volume>28</volume>
          <issue>13</issue>
          <issn>1420-3049</issn>
          <fpage>5169</fpage>
          <lpage>5169</lpage>
          <pub-id pub-id-type="doi">10.3390/molecules28135169</pub-id>
        </element-citation>
      </ref>
      <ref id="R17">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Low</surname>
              <given-names>Teck Yew</given-names>
            </name>
            <name>
              <surname>Syafruddin</surname>
              <given-names>Saiful Effendi</given-names>
            </name>
            <name>
              <surname>Mohtar</surname>
              <given-names>M. Aiman</given-names>
            </name>
            <name>
              <surname>Vellaichamy</surname>
              <given-names>Adaikkalam</given-names>
            </name>
            <name>
              <surname>A Rahman</surname>
              <given-names>Nisa Syakila</given-names>
            </name>
            <name>
              <surname>Pung</surname>
              <given-names>Yuh-Fen</given-names>
            </name>
            <name>
              <surname>Tan</surname>
              <given-names>Chris Soon Heng</given-names>
            </name>
          </person-group>
          <year>2021</year>
          <month>5</month>
          <day>27</day>
          <article-title>Recent progress in mass spectrometry-based strategies for elucidating protein–protein interactions</article-title>
          <source>Cellular and Molecular Life Sciences</source>
          <volume>78</volume>
          <issue>13</issue>
          <issn>1420-682X</issn>
          <fpage>5325</fpage>
          <lpage>5339</lpage>
          <pub-id pub-id-type="doi">10.1007/s00018-021-03856-0</pub-id>
        </element-citation>
      </ref>
      <ref id="R18">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Martin</surname>
              <given-names>Andrew C. R.</given-names>
            </name>
          </person-group>
          <year>2005</year>
          <month>9</month>
          <day>27</day>
          <article-title>Mapping PDB chains to UniProtKB entries</article-title>
          <source>Bioinformatics</source>
          <volume>21</volume>
          <issue>23</issue>
          <issn>1367-4803</issn>
          <fpage>4297</fpage>
          <lpage>4301</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/bti694</pub-id>
        </element-citation>
      </ref>
      <ref id="R19">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Miller</surname>
              <given-names>Kristi E.</given-names>
            </name>
            <name>
              <surname>Kim</surname>
              <given-names>Yeonsoo</given-names>
            </name>
            <name>
              <surname>Huh</surname>
              <given-names>Won-Ki</given-names>
            </name>
            <name>
              <surname>Park</surname>
              <given-names>Hay-Oak</given-names>
            </name>
          </person-group>
          <year>2015</year>
          <month>6</month>
          <day>1</day>
          <article-title>Bimolecular Fluorescence Complementation (BiFC) Analysis: Advances and Recent Applications for Genome-Wide Interaction Studies</article-title>
          <source>Journal of Molecular Biology</source>
          <volume>427</volume>
          <issue>11</issue>
          <issn>0022-2836</issn>
          <fpage>2039</fpage>
          <lpage>2055</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jmb.2015.03.005</pub-id>
        </element-citation>
      </ref>
      <ref id="R20">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mrowka</surname>
              <given-names>Ralf</given-names>
            </name>
            <name>
              <surname>Patzak</surname>
              <given-names>Andreas</given-names>
            </name>
            <name>
              <surname>Herzel</surname>
              <given-names>Hanspeter</given-names>
            </name>
          </person-group>
          <year>2001</year>
          <month>12</month>
          <day>1</day>
          <article-title>Is There a Bias in Proteome Research?</article-title>
          <source>Genome Research</source>
          <volume>11</volume>
          <issue>12</issue>
          <issn>1088-9051</issn>
          <fpage>1971</fpage>
          <lpage>1973</lpage>
          <pub-id pub-id-type="doi">10.1101/gr.206701</pub-id>
        </element-citation>
      </ref>
      <ref id="R21">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Oughtred</surname>
              <given-names>Rose</given-names>
            </name>
            <name>
              <surname>Rust</surname>
              <given-names>Jennifer</given-names>
            </name>
            <name>
              <surname>Chang</surname>
              <given-names>Christie</given-names>
            </name>
            <name>
              <surname>Breitkreutz</surname>
              <given-names>Bobby‐Joe</given-names>
            </name>
            <name>
              <surname>Stark</surname>
              <given-names>Chris</given-names>
            </name>
            <name>
              <surname>Willems</surname>
              <given-names>Andrew</given-names>
            </name>
            <name>
              <surname>Boucher</surname>
              <given-names>Lorrie</given-names>
            </name>
            <name>
              <surname>Leung</surname>
              <given-names>Genie</given-names>
            </name>
            <name>
              <surname>Kolas</surname>
              <given-names>Nadine</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Frederick</given-names>
            </name>
            <name>
              <surname>Dolma</surname>
              <given-names>Sonam</given-names>
            </name>
            <name>
              <surname>Coulombe‐Huntington</surname>
              <given-names>Jasmin</given-names>
            </name>
            <name>
              <surname>Chatr‐aryamontri</surname>
              <given-names>Andrew</given-names>
            </name>
            <name>
              <surname>Dolinski</surname>
              <given-names>Kara</given-names>
            </name>
            <name>
              <surname>Tyers</surname>
              <given-names>Mike</given-names>
            </name>
          </person-group>
          <year>2020</year>
          <month>11</month>
          <day>23</day>
          <article-title>
            The 
            <scp>BioGRID</scp>
             database: A comprehensive biomedical resource of curated protein, genetic, and chemical interactions
          </article-title>
          <source>Protein Science</source>
          <volume>30</volume>
          <issue>1</issue>
          <issn>0961-8368</issn>
          <fpage>187</fpage>
          <lpage>200</lpage>
          <pub-id pub-id-type="doi">10.1002/pro.3978</pub-id>
        </element-citation>
      </ref>
      <ref id="R22">
        <element-citation publication-type="posted-content">
          <person-group person-group-type="author">
            <name>
              <surname>Réau</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Renaud</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Xue</surname>
              <given-names>L. C.</given-names>
            </name>
            <name>
              <surname>Bonvin</surname>
              <given-names>A. M. J. J.</given-names>
            </name>
          </person-group>
          <year>2021</year>
          <month>12</month>
          <day>10</day>
          <article-title>DeepRank-GNN: A Graph Neural Network Framework to Learn Patterns in Protein-Protein Interfaces</article-title>
          <pub-id pub-id-type="doi">10.1101/2021.12.08.471762</pub-id>
        </element-citation>
      </ref>
      <ref id="R23">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Shen</surname>
              <given-names>Juwen</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>Jian</given-names>
            </name>
            <name>
              <surname>Luo</surname>
              <given-names>Xiaomin</given-names>
            </name>
            <name>
              <surname>Zhu</surname>
              <given-names>Weiliang</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>Kunqian</given-names>
            </name>
            <name>
              <surname>Chen</surname>
              <given-names>Kaixian</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Yixue</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>Hualiang</given-names>
            </name>
          </person-group>
          <year>2007</year>
          <month>3</month>
          <day>13</day>
          <article-title>Predicting protein–protein interactions based only on sequences information</article-title>
          <source>Proceedings of the National Academy of Sciences</source>
          <volume>104</volume>
          <issue>11</issue>
          <issn>0027-8424</issn>
          <fpage>4337</fpage>
          <lpage>4341</lpage>
          <pub-id pub-id-type="doi">10.1073/pnas.0607879104</pub-id>
        </element-citation>
      </ref>
      <ref id="R24">
        <mixed-citation>Shervashidze N, Schweitzer P, Van Leeuwen EJ, Mehlhorn K, Borgwardt KM. 2011. Weisfeiler-lehman graph kernels. Journal of Machine Learning. 12(9).</mixed-citation>
      </ref>
      <ref id="R25">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Stelzl</surname>
              <given-names>Ulrich</given-names>
            </name>
            <name>
              <surname>Worm</surname>
              <given-names>Uwe</given-names>
            </name>
            <name>
              <surname>Lalowski</surname>
              <given-names>Maciej</given-names>
            </name>
            <name>
              <surname>Haenig</surname>
              <given-names>Christian</given-names>
            </name>
            <name>
              <surname>Brembeck</surname>
              <given-names>Felix H.</given-names>
            </name>
            <name>
              <surname>Goehler</surname>
              <given-names>Heike</given-names>
            </name>
            <name>
              <surname>Stroedicke</surname>
              <given-names>Martin</given-names>
            </name>
            <name>
              <surname>Zenkner</surname>
              <given-names>Martina</given-names>
            </name>
            <name>
              <surname>Schoenherr</surname>
              <given-names>Anke</given-names>
            </name>
            <name>
              <surname>Koeppen</surname>
              <given-names>Susanne</given-names>
            </name>
            <name>
              <surname>Timm</surname>
              <given-names>Jan</given-names>
            </name>
            <name>
              <surname>Mintzlaff</surname>
              <given-names>Sascha</given-names>
            </name>
            <name>
              <surname>Abraham</surname>
              <given-names>Claudia</given-names>
            </name>
            <name>
              <surname>Bock</surname>
              <given-names>Nicole</given-names>
            </name>
            <name>
              <surname>Kietzmann</surname>
              <given-names>Silvia</given-names>
            </name>
            <name>
              <surname>Goedde</surname>
              <given-names>Astrid</given-names>
            </name>
            <name>
              <surname>Toksöz</surname>
              <given-names>Engin</given-names>
            </name>
            <name>
              <surname>Droege</surname>
              <given-names>Anja</given-names>
            </name>
            <name>
              <surname>Krobitsch</surname>
              <given-names>Sylvia</given-names>
            </name>
            <name>
              <surname>Korn</surname>
              <given-names>Bernhard</given-names>
            </name>
            <name>
              <surname>Birchmeier</surname>
              <given-names>Walter</given-names>
            </name>
            <name>
              <surname>Lehrach</surname>
              <given-names>Hans</given-names>
            </name>
            <name>
              <surname>Wanker</surname>
              <given-names>Erich E.</given-names>
            </name>
          </person-group>
          <year>2005</year>
          <month>9</month>
          <day>1</day>
          <article-title>A Human Protein-Protein Interaction Network: A Resource for Annotating the Proteome</article-title>
          <source>Cell</source>
          <volume>122</volume>
          <issue>6</issue>
          <issn>0092-8674</issn>
          <fpage>957</fpage>
          <lpage>968</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cell.2005.08.029</pub-id>
        </element-citation>
      </ref>
      <ref id="R26">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Sun</surname>
              <given-names>Tanlin</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>Bo</given-names>
            </name>
            <name>
              <surname>Lai</surname>
              <given-names>Luhua</given-names>
            </name>
            <name>
              <surname>Pei</surname>
              <given-names>Jianfeng</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <month>5</month>
          <day>25</day>
          <article-title>Sequence-based prediction of protein protein interaction using a deep-learning algorithm</article-title>
          <source>BMC Bioinformatics</source>
          <volume>18</volume>
          <issue>1</issue>
          <issn>1471-2105</issn>
          <pub-id pub-id-type="doi">10.1186/s12859-017-1700-2</pub-id>
        </element-citation>
      </ref>
      <ref id="R27">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Szklarczyk</surname>
              <given-names>Damian</given-names>
            </name>
            <name>
              <surname>Gable</surname>
              <given-names>Annika L</given-names>
            </name>
            <name>
              <surname>Lyon</surname>
              <given-names>David</given-names>
            </name>
            <name>
              <surname>Junge</surname>
              <given-names>Alexander</given-names>
            </name>
            <name>
              <surname>Wyder</surname>
              <given-names>Stefan</given-names>
            </name>
            <name>
              <surname>Huerta-Cepas</surname>
              <given-names>Jaime</given-names>
            </name>
            <name>
              <surname>Simonovic</surname>
              <given-names>Milan</given-names>
            </name>
            <name>
              <surname>Doncheva</surname>
              <given-names>Nadezhda T</given-names>
            </name>
            <name>
              <surname>Morris</surname>
              <given-names>John H</given-names>
            </name>
            <name>
              <surname>Bork</surname>
              <given-names>Peer</given-names>
            </name>
            <name>
              <surname>Jensen</surname>
              <given-names>Lars J</given-names>
            </name>
            <name>
              <surname>Mering</surname>
              <given-names>Christian von</given-names>
            </name>
          </person-group>
          <year>2018</year>
          <month>11</month>
          <day>22</day>
          <article-title>STRING v11: protein–protein association networks with increased coverage, supporting functional discovery in genome-wide experimental datasets</article-title>
          <source>Nucleic Acids Research</source>
          <volume>47</volume>
          <issue>D1</issue>
          <issn>0305-1048</issn>
          <fpage>D607</fpage>
          <lpage>D613</lpage>
          <pub-id pub-id-type="doi">10.1093/nar/gky1131</pub-id>
        </element-citation>
      </ref>
      <ref id="R28">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Trabuco</surname>
              <given-names>Leonardo G.</given-names>
            </name>
            <name>
              <surname>Betts</surname>
              <given-names>Matthew J.</given-names>
            </name>
            <name>
              <surname>Russell</surname>
              <given-names>Robert B.</given-names>
            </name>
          </person-group>
          <year>2012</year>
          <month>12</month>
          <day>1</day>
          <article-title>Negative protein–protein interaction datasets derived from large-scale two-hybrid experiments</article-title>
          <source>Methods</source>
          <volume>58</volume>
          <issue>4</issue>
          <issn>1046-2023</issn>
          <fpage>343</fpage>
          <lpage>348</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ymeth.2012.07.028</pub-id>
        </element-citation>
      </ref>
      <ref id="R29">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Varadi</surname>
              <given-names>Mihaly</given-names>
            </name>
            <name>
              <surname>Anyango</surname>
              <given-names>Stephen</given-names>
            </name>
            <name>
              <surname>Deshpande</surname>
              <given-names>Mandar</given-names>
            </name>
            <name>
              <surname>Nair</surname>
              <given-names>Sreenath</given-names>
            </name>
            <name>
              <surname>Natassia</surname>
              <given-names>Cindy</given-names>
            </name>
            <name>
              <surname>Yordanova</surname>
              <given-names>Galabina</given-names>
            </name>
            <name>
              <surname>Yuan</surname>
              <given-names>David</given-names>
            </name>
            <name>
              <surname>Stroe</surname>
              <given-names>Oana</given-names>
            </name>
            <name>
              <surname>Wood</surname>
              <given-names>Gemma</given-names>
            </name>
            <name>
              <surname>Laydon</surname>
              <given-names>Agata</given-names>
            </name>
            <name>
              <surname>Žídek</surname>
              <given-names>Augustin</given-names>
            </name>
            <name>
              <surname>Green</surname>
              <given-names>Tim</given-names>
            </name>
            <name>
              <surname>Tunyasuvunakool</surname>
              <given-names>Kathryn</given-names>
            </name>
            <name>
              <surname>Petersen</surname>
              <given-names>Stig</given-names>
            </name>
            <name>
              <surname>Jumper</surname>
              <given-names>John</given-names>
            </name>
            <name>
              <surname>Clancy</surname>
              <given-names>Ellen</given-names>
            </name>
            <name>
              <surname>Green</surname>
              <given-names>Richard</given-names>
            </name>
            <name>
              <surname>Vora</surname>
              <given-names>Ankur</given-names>
            </name>
            <name>
              <surname>Lutfi</surname>
              <given-names>Mira</given-names>
            </name>
            <name>
              <surname>Figurnov</surname>
              <given-names>Michael</given-names>
            </name>
            <name>
              <surname>Cowie</surname>
              <given-names>Andrew</given-names>
            </name>
            <name>
              <surname>Hobbs</surname>
              <given-names>Nicole</given-names>
            </name>
            <name>
              <surname>Kohli</surname>
              <given-names>Pushmeet</given-names>
            </name>
            <name>
              <surname>Kleywegt</surname>
              <given-names>Gerard</given-names>
            </name>
            <name>
              <surname>Birney</surname>
              <given-names>Ewan</given-names>
            </name>
            <name>
              <surname>Hassabis</surname>
              <given-names>Demis</given-names>
            </name>
            <name>
              <surname>Velankar</surname>
              <given-names>Sameer</given-names>
            </name>
          </person-group>
          <year>2021</year>
          <month>11</month>
          <day>17</day>
          <article-title>AlphaFold Protein Structure Database: massively expanding the structural coverage of protein-sequence space with high-accuracy models</article-title>
          <source>Nucleic Acids Research</source>
          <volume>50</volume>
          <issue>D1</issue>
          <issn>0305-1048</issn>
          <fpage>D439</fpage>
          <lpage>D444</lpage>
          <pub-id pub-id-type="doi">10.1093/nar/gkab1061</pub-id>
        </element-citation>
      </ref>
      <ref id="R30">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>You</surname>
              <given-names>Zhu-Hong</given-names>
            </name>
            <name>
              <surname>Chan</surname>
              <given-names>Keith C. C.</given-names>
            </name>
            <name>
              <surname>Hu</surname>
              <given-names>Pengwei</given-names>
            </name>
          </person-group>
          <year>2015</year>
          <month>5</month>
          <day>6</day>
          <article-title>Predicting Protein-Protein Interactions from Primary Protein Sequences Using a Novel Multi-Scale Local Feature Representation Scheme and the Random Forest</article-title>
          <source>PLOS ONE</source>
          <volume>10</volume>
          <issue>5</issue>
          <issn>1932-6203</issn>
          <fpage>e0125811</fpage>
          <lpage>e0125811</lpage>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0125811</pub-id>
        </element-citation>
      </ref>
      <ref id="R31">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>You</surname>
              <given-names>Zhu-Hong</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>Jian-Zhong</given-names>
            </name>
            <name>
              <surname>Zhu</surname>
              <given-names>Lin</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>Shuai</given-names>
            </name>
            <name>
              <surname>Wen</surname>
              <given-names>Zhen-Kun</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <month>12</month>
          <day>1</day>
          <article-title>A MapReduce based parallel SVM for large-scale predicting protein–protein interactions</article-title>
          <source>Neurocomputing</source>
          <volume>145</volume>
          <issn>0925-2312</issn>
          <fpage>37</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2014.05.072</pub-id>
        </element-citation>
      </ref>
      <ref id="R32">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhou</surname>
              <given-names>Hang</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Weikun</given-names>
            </name>
            <name>
              <surname>Jin</surname>
              <given-names>Jiayun</given-names>
            </name>
            <name>
              <surname>Zheng</surname>
              <given-names>Zengwei</given-names>
            </name>
            <name>
              <surname>Zhou</surname>
              <given-names>Binbin</given-names>
            </name>
          </person-group>
          <year>2022</year>
          <month>9</month>
          <day>19</day>
          <article-title>Graph Neural Network for Protein–Protein Interaction Prediction: A Comparative Study</article-title>
          <source>Molecules</source>
          <volume>27</volume>
          <issue>18</issue>
          <issn>1420-3049</issn>
          <fpage>6135</fpage>
          <lpage>6135</lpage>
          <pub-id pub-id-type="doi">10.3390/molecules27186135</pub-id>
        </element-citation>
      </ref>
    </ref-list>
  </back>
</article>