PMC:7111504 / 3442-16550 JSONTXT

Annnotations TAB JSON ListView MergeView

    LitCovid-PubTator

    {"project":"LitCovid-PubTator","denotations":[{"id":"57","span":{"begin":47,"end":55},"obj":"Species"},{"id":"64","span":{"begin":631,"end":636},"obj":"Gene"},{"id":"65","span":{"begin":698,"end":701},"obj":"Gene"},{"id":"66","span":{"begin":707,"end":710},"obj":"Gene"},{"id":"67","span":{"begin":222,"end":227},"obj":"Species"},{"id":"68","span":{"begin":301,"end":310},"obj":"Species"},{"id":"69","span":{"begin":496,"end":504},"obj":"Species"},{"id":"84","span":{"begin":929,"end":934},"obj":"Gene"},{"id":"85","span":{"begin":1765,"end":1770},"obj":"Gene"},{"id":"86","span":{"begin":1811,"end":1816},"obj":"Gene"},{"id":"87","span":{"begin":1975,"end":1980},"obj":"Gene"},{"id":"88","span":{"begin":2037,"end":2045},"obj":"Gene"},{"id":"89","span":{"begin":2105,"end":2110},"obj":"Gene"},{"id":"90","span":{"begin":2151,"end":2156},"obj":"Gene"},{"id":"91","span":{"begin":2216,"end":2221},"obj":"Gene"},{"id":"92","span":{"begin":2276,"end":2283},"obj":"Gene"},{"id":"93","span":{"begin":2291,"end":2295},"obj":"Gene"},{"id":"94","span":{"begin":2350,"end":2358},"obj":"Gene"},{"id":"95","span":{"begin":2417,"end":2425},"obj":"Gene"},{"id":"96","span":{"begin":837,"end":846},"obj":"Species"},{"id":"97","span":{"begin":942,"end":983},"obj":"Disease"},{"id":"100","span":{"begin":747,"end":756},"obj":"Species"},{"id":"101","span":{"begin":804,"end":812},"obj":"Species"},{"id":"103","span":{"begin":2434,"end":2442},"obj":"Species"},{"id":"105","span":{"begin":2512,"end":2521},"obj":"Species"},{"id":"108","span":{"begin":2653,"end":2661},"obj":"Species"},{"id":"109","span":{"begin":2745,"end":2754},"obj":"Species"},{"id":"111","span":{"begin":2921,"end":2930},"obj":"Species"},{"id":"115","span":{"begin":3373,"end":3382},"obj":"Species"},{"id":"116","span":{"begin":3708,"end":3716},"obj":"Species"},{"id":"117","span":{"begin":3803,"end":3815},"obj":"Species"},{"id":"119","span":{"begin":3896,"end":3905},"obj":"Species"},{"id":"123","span":{"begin":4229,"end":4238},"obj":"Species"},{"id":"124","span":{"begin":4469,"end":4478},"obj":"Species"},{"id":"125","span":{"begin":4614,"end":4623},"obj":"Species"},{"id":"127","span":{"begin":4871,"end":4880},"obj":"Species"},{"id":"129","span":{"begin":4763,"end":4772},"obj":"Species"},{"id":"131","span":{"begin":6031,"end":6040},"obj":"Species"},{"id":"133","span":{"begin":6051,"end":6060},"obj":"Species"},{"id":"135","span":{"begin":6764,"end":6773},"obj":"Species"},{"id":"145","span":{"begin":7286,"end":7291},"obj":"Gene"},{"id":"146","span":{"begin":7299,"end":7304},"obj":"Gene"},{"id":"147","span":{"begin":7312,"end":7317},"obj":"Gene"},{"id":"148","span":{"begin":7325,"end":7330},"obj":"Gene"},{"id":"149","span":{"begin":7341,"end":7346},"obj":"Gene"},{"id":"150","span":{"begin":7108,"end":7111},"obj":"Gene"},{"id":"151","span":{"begin":6889,"end":6898},"obj":"Species"},{"id":"152","span":{"begin":6941,"end":6950},"obj":"Species"},{"id":"153","span":{"begin":7150,"end":7159},"obj":"Chemical"},{"id":"155","span":{"begin":7388,"end":7391},"obj":"Gene"},{"id":"158","span":{"begin":7783,"end":7792},"obj":"Species"},{"id":"159","span":{"begin":7853,"end":7862},"obj":"Chemical"},{"id":"162","span":{"begin":8702,"end":8705},"obj":"Gene"},{"id":"163","span":{"begin":8678,"end":8687},"obj":"Species"},{"id":"171","span":{"begin":8753,"end":8756},"obj":"Gene"},{"id":"172","span":{"begin":8783,"end":8788},"obj":"Gene"},{"id":"173","span":{"begin":8796,"end":8801},"obj":"Gene"},{"id":"174","span":{"begin":8809,"end":8814},"obj":"Gene"},{"id":"175","span":{"begin":8822,"end":8827},"obj":"Gene"},{"id":"176","span":{"begin":8838,"end":8843},"obj":"Gene"},{"id":"177","span":{"begin":8861,"end":8870},"obj":"Chemical"},{"id":"181","span":{"begin":8963,"end":8966},"obj":"Gene"},{"id":"182","span":{"begin":8968,"end":8971},"obj":"Gene"},{"id":"183","span":{"begin":8937,"end":8946},"obj":"Species"},{"id":"185","span":{"begin":9237,"end":9240},"obj":"Gene"},{"id":"192","span":{"begin":9450,"end":9453},"obj":"Gene"},{"id":"193","span":{"begin":9525,"end":9530},"obj":"Gene"},{"id":"194","span":{"begin":9670,"end":9673},"obj":"Gene"},{"id":"195","span":{"begin":9455,"end":9458},"obj":"Gene"},{"id":"196","span":{"begin":9681,"end":9690},"obj":"Species"},{"id":"197","span":{"begin":9325,"end":9330},"obj":"Disease"},{"id":"203","span":{"begin":10293,"end":10298},"obj":"Gene"},{"id":"204","span":{"begin":9737,"end":9746},"obj":"Species"},{"id":"205","span":{"begin":10173,"end":10182},"obj":"Species"},{"id":"206","span":{"begin":10219,"end":10227},"obj":"Chemical"},{"id":"207","span":{"begin":10327,"end":10336},"obj":"Chemical"},{"id":"210","span":{"begin":10395,"end":10398},"obj":"Gene"},{"id":"211","span":{"begin":10435,"end":10444},"obj":"Species"},{"id":"214","span":{"begin":10580,"end":10583},"obj":"Gene"},{"id":"215","span":{"begin":10541,"end":10550},"obj":"Species"},{"id":"221","span":{"begin":10735,"end":10740},"obj":"Gene"},{"id":"222","span":{"begin":10675,"end":10678},"obj":"Gene"},{"id":"223","span":{"begin":10617,"end":10626},"obj":"Species"},{"id":"224","span":{"begin":10750,"end":10759},"obj":"Chemical"},{"id":"225","span":{"begin":10772,"end":10781},"obj":"Chemical"},{"id":"235","span":{"begin":11728,"end":11731},"obj":"Gene"},{"id":"236","span":{"begin":12319,"end":12322},"obj":"Gene"},{"id":"237","span":{"begin":12137,"end":12146},"obj":"Species"},{"id":"238","span":{"begin":11806,"end":11815},"obj":"Chemical"},{"id":"239","span":{"begin":11833,"end":11840},"obj":"Chemical"},{"id":"240","span":{"begin":11842,"end":11843},"obj":"Chemical"},{"id":"241","span":{"begin":11849,"end":11855},"obj":"Chemical"},{"id":"242","span":{"begin":12005,"end":12012},"obj":"Chemical"},{"id":"243","span":{"begin":12023,"end":12029},"obj":"Chemical"},{"id":"246","span":{"begin":12385,"end":12394},"obj":"Species"},{"id":"247","span":{"begin":12417,"end":12424},"obj":"Chemical"},{"id":"252","span":{"begin":12597,"end":12602},"obj":"Gene"},{"id":"253","span":{"begin":12541,"end":12544},"obj":"Gene"},{"id":"254","span":{"begin":12620,"end":12629},"obj":"Chemical"},{"id":"255","span":{"begin":12642,"end":12651},"obj":"Chemical"}],"attributes":[{"id":"A57","pred":"tao:has_database_id","subj":"57","obj":"Tax:694009"},{"id":"A64","pred":"tao:has_database_id","subj":"64","obj":"Gene:3105"},{"id":"A65","pred":"tao:has_database_id","subj":"65","obj":"Gene:925"},{"id":"A66","pred":"tao:has_database_id","subj":"66","obj":"Gene:920"},{"id":"A67","pred":"tao:has_database_id","subj":"67","obj":"Tax:9606"},{"id":"A68","pred":"tao:has_database_id","subj":"68","obj":"Tax:2697049"},{"id":"A69","pred":"tao:has_database_id","subj":"69","obj":"Tax:694009"},{"id":"A84","pred":"tao:has_database_id","subj":"84","obj":"Gene:3105"},{"id":"A85","pred":"tao:has_database_id","subj":"85","obj":"Gene:3106"},{"id":"A86","pred":"tao:has_database_id","subj":"86","obj":"Gene:3105"},{"id":"A87","pred":"tao:has_database_id","subj":"87","obj":"Gene:3105"},{"id":"A88","pred":"tao:has_database_id","subj":"88","obj":"Gene:3123"},{"id":"A89","pred":"tao:has_database_id","subj":"89","obj":"Gene:3105"},{"id":"A90","pred":"tao:has_database_id","subj":"90","obj":"Gene:3105"},{"id":"A91","pred":"tao:has_database_id","subj":"91","obj":"Gene:3105"},{"id":"A92","pred":"tao:has_database_id","subj":"92","obj":"Gene:3122"},{"id":"A93","pred":"tao:has_database_id","subj":"93","obj":"Gene:3123"},{"id":"A94","pred":"tao:has_database_id","subj":"94","obj":"Gene:3123"},{"id":"A95","pred":"tao:has_database_id","subj":"95","obj":"Gene:3123"},{"id":"A96","pred":"tao:has_database_id","subj":"96","obj":"Tax:2697049"},{"id":"A97","pred":"tao:has_database_id","subj":"97","obj":"MESH:C536108"},{"id":"A100","pred":"tao:has_database_id","subj":"100","obj":"Tax:2697049"},{"id":"A101","pred":"tao:has_database_id","subj":"101","obj":"Tax:694009"},{"id":"A103","pred":"tao:has_database_id","subj":"103","obj":"Tax:694009"},{"id":"A105","pred":"tao:has_database_id","subj":"105","obj":"Tax:2697049"},{"id":"A108","pred":"tao:has_database_id","subj":"108","obj":"Tax:694009"},{"id":"A109","pred":"tao:has_database_id","subj":"109","obj":"Tax:2697049"},{"id":"A111","pred":"tao:has_database_id","subj":"111","obj":"Tax:2697049"},{"id":"A115","pred":"tao:has_database_id","subj":"115","obj":"Tax:2697049"},{"id":"A116","pred":"tao:has_database_id","subj":"116","obj":"Tax:694009"},{"id":"A117","pred":"tao:has_database_id","subj":"117","obj":"Tax:9606"},{"id":"A119","pred":"tao:has_database_id","subj":"119","obj":"Tax:2697049"},{"id":"A123","pred":"tao:has_database_id","subj":"123","obj":"Tax:2697049"},{"id":"A124","pred":"tao:has_database_id","subj":"124","obj":"Tax:2697049"},{"id":"A125","pred":"tao:has_database_id","subj":"125","obj":"Tax:2697049"},{"id":"A127","pred":"tao:has_database_id","subj":"127","obj":"Tax:2697049"},{"id":"A129","pred":"tao:has_database_id","subj":"129","obj":"Tax:2697049"},{"id":"A131","pred":"tao:has_database_id","subj":"131","obj":"Tax:2697049"},{"id":"A133","pred":"tao:has_database_id","subj":"133","obj":"Tax:2697049"},{"id":"A135","pred":"tao:has_database_id","subj":"135","obj":"Tax:2697049"},{"id":"A145","pred":"tao:has_database_id","subj":"145","obj":"Gene:3105"},{"id":"A146","pred":"tao:has_database_id","subj":"146","obj":"Gene:3105"},{"id":"A147","pred":"tao:has_database_id","subj":"147","obj":"Gene:3106"},{"id":"A148","pred":"tao:has_database_id","subj":"148","obj":"Gene:3106"},{"id":"A149","pred":"tao:has_database_id","subj":"149","obj":"Gene:3107"},{"id":"A150","pred":"tao:has_database_id","subj":"150","obj":"Gene:3107"},{"id":"A151","pred":"tao:has_database_id","subj":"151","obj":"Tax:2697049"},{"id":"A152","pred":"tao:has_database_id","subj":"152","obj":"Tax:2697049"},{"id":"A155","pred":"tao:has_database_id","subj":"155","obj":"Gene:3107"},{"id":"A158","pred":"tao:has_database_id","subj":"158","obj":"Tax:2697049"},{"id":"A162","pred":"tao:has_database_id","subj":"162","obj":"Gene:3107"},{"id":"A163","pred":"tao:has_database_id","subj":"163","obj":"Tax:2697049"},{"id":"A171","pred":"tao:has_database_id","subj":"171","obj":"Gene:3107"},{"id":"A172","pred":"tao:has_database_id","subj":"172","obj":"Gene:3105"},{"id":"A173","pred":"tao:has_database_id","subj":"173","obj":"Gene:3105"},{"id":"A174","pred":"tao:has_database_id","subj":"174","obj":"Gene:3106"},{"id":"A175","pred":"tao:has_database_id","subj":"175","obj":"Gene:3106"},{"id":"A176","pred":"tao:has_database_id","subj":"176","obj":"Gene:3107"},{"id":"A181","pred":"tao:has_database_id","subj":"181","obj":"Gene:925"},{"id":"A182","pred":"tao:has_database_id","subj":"182","obj":"Gene:6962"},{"id":"A183","pred":"tao:has_database_id","subj":"183","obj":"Tax:2697049"},{"id":"A185","pred":"tao:has_database_id","subj":"185","obj":"Gene:6962"},{"id":"A192","pred":"tao:has_database_id","subj":"192","obj":"Gene:925"},{"id":"A193","pred":"tao:has_database_id","subj":"193","obj":"Gene:3105"},{"id":"A194","pred":"tao:has_database_id","subj":"194","obj":"Gene:6962"},{"id":"A195","pred":"tao:has_database_id","subj":"195","obj":"Gene:6962"},{"id":"A196","pred":"tao:has_database_id","subj":"196","obj":"Tax:2697049"},{"id":"A197","pred":"tao:has_database_id","subj":"197","obj":"MESH:D009369"},{"id":"A203","pred":"tao:has_database_id","subj":"203","obj":"Gene:3105"},{"id":"A204","pred":"tao:has_database_id","subj":"204","obj":"Tax:2697049"},{"id":"A205","pred":"tao:has_database_id","subj":"205","obj":"Tax:2697049"},{"id":"A206","pred":"tao:has_database_id","subj":"206","obj":"MESH:D010455"},{"id":"A210","pred":"tao:has_database_id","subj":"210","obj":"Gene:6962"},{"id":"A211","pred":"tao:has_database_id","subj":"211","obj":"Tax:2697049"},{"id":"A214","pred":"tao:has_database_id","subj":"214","obj":"Gene:6962"},{"id":"A215","pred":"tao:has_database_id","subj":"215","obj":"Tax:2697049"},{"id":"A221","pred":"tao:has_database_id","subj":"221","obj":"Gene:3105"},{"id":"A222","pred":"tao:has_database_id","subj":"222","obj":"Gene:6962"},{"id":"A223","pred":"tao:has_database_id","subj":"223","obj":"Tax:2697049"},{"id":"A235","pred":"tao:has_database_id","subj":"235","obj":"Gene:3107"},{"id":"A236","pred":"tao:has_database_id","subj":"236","obj":"Gene:6962"},{"id":"A237","pred":"tao:has_database_id","subj":"237","obj":"Tax:2697049"},{"id":"A239","pred":"tao:has_database_id","subj":"239","obj":"MESH:D007930"},{"id":"A240","pred":"tao:has_database_id","subj":"240","obj":"MESH:D007930"},{"id":"A241","pred":"tao:has_database_id","subj":"241","obj":"MESH:D014633"},{"id":"A242","pred":"tao:has_database_id","subj":"242","obj":"MESH:D007930"},{"id":"A243","pred":"tao:has_database_id","subj":"243","obj":"MESH:D014633"},{"id":"A246","pred":"tao:has_database_id","subj":"246","obj":"Tax:2697049"},{"id":"A247","pred":"tao:has_database_id","subj":"247","obj":"MESH:D007930"},{"id":"A252","pred":"tao:has_database_id","subj":"252","obj":"Gene:3105"},{"id":"A253","pred":"tao:has_database_id","subj":"253","obj":"Gene:6962"}],"namespaces":[{"prefix":"Tax","uri":"https://www.ncbi.nlm.nih.gov/taxonomy/"},{"prefix":"MESH","uri":"https://id.nlm.nih.gov/mesh/"},{"prefix":"Gene","uri":"https://www.ncbi.nlm.nih.gov/gene/"},{"prefix":"CVCL","uri":"https://web.expasy.org/cellosaurus/CVCL_"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-PMC-OGER-BB

    {"project":"LitCovid-PMC-OGER-BB","denotations":[{"id":"T49","span":{"begin":47,"end":55},"obj":"SP_10"},{"id":"T50","span":{"begin":56,"end":67},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T51","span":{"begin":94,"end":102},"obj":"BV_9"},{"id":"T52","span":{"begin":199,"end":205},"obj":"CL:0000084;BV_23"},{"id":"T53","span":{"begin":206,"end":212},"obj":"BV_23"},{"id":"T54","span":{"begin":222,"end":227},"obj":"SP_6;NCBITaxon:9606"},{"id":"T55","span":{"begin":240,"end":248},"obj":"NCBITaxon:1"},{"id":"T56","span":{"begin":301,"end":310},"obj":"SP_7"},{"id":"T57","span":{"begin":311,"end":330},"obj":"SO:0000236"},{"id":"T58","span":{"begin":332,"end":336},"obj":"SO:0000236"},{"id":"T59","span":{"begin":496,"end":504},"obj":"SP_10"},{"id":"T60","span":{"begin":584,"end":591},"obj":"SO:0001023"},{"id":"T61","span":{"begin":631,"end":636},"obj":"PR:000002009"},{"id":"T62","span":{"begin":707,"end":710},"obj":"PR:000001004"},{"id":"T63","span":{"begin":712,"end":719},"obj":"CL:0000084"},{"id":"T64","span":{"begin":747,"end":756},"obj":"SP_7"},{"id":"T65","span":{"begin":792,"end":803},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T66","span":{"begin":804,"end":812},"obj":"SP_10"},{"id":"T67","span":{"begin":2434,"end":2442},"obj":"SP_10"},{"id":"T68","span":{"begin":2444,"end":2456},"obj":"SP_10"},{"id":"T69","span":{"begin":2457,"end":2468},"obj":"SP_10;UBERON:0001004"},{"id":"T70","span":{"begin":2469,"end":2489},"obj":"SP_10"},{"id":"T71","span":{"begin":2512,"end":2521},"obj":"SP_7"},{"id":"T72","span":{"begin":2585,"end":2596},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T73","span":{"begin":2597,"end":2602},"obj":"NCBITaxon:10239"},{"id":"T74","span":{"begin":2653,"end":2661},"obj":"SP_10"},{"id":"T75","span":{"begin":2682,"end":2686},"obj":"UBERON:0002415"},{"id":"T76","span":{"begin":2745,"end":2754},"obj":"SP_7"},{"id":"T77","span":{"begin":2755,"end":2759},"obj":"SO:0000236"},{"id":"T78","span":{"begin":2921,"end":2930},"obj":"SP_7"},{"id":"T79","span":{"begin":2973,"end":2984},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T80","span":{"begin":3156,"end":3164},"obj":"NCBITaxon:1"},{"id":"T81","span":{"begin":3219,"end":3227},"obj":"BV_9"},{"id":"T82","span":{"begin":3373,"end":3382},"obj":"SP_7"},{"id":"T83","span":{"begin":3708,"end":3716},"obj":"SP_10"},{"id":"T84","span":{"begin":3803,"end":3815},"obj":"SP_6;NCBITaxon:9606"},{"id":"T85","span":{"begin":3896,"end":3905},"obj":"SP_7"},{"id":"T86","span":{"begin":3949,"end":3963},"obj":"BV_15"},{"id":"T87","span":{"begin":4016,"end":4030},"obj":"BV_15"},{"id":"T88","span":{"begin":4066,"end":4080},"obj":"BV_15"},{"id":"T89","span":{"begin":4182,"end":4196},"obj":"BV_15"},{"id":"T90","span":{"begin":4229,"end":4238},"obj":"SP_7"},{"id":"T91","span":{"begin":4279,"end":4293},"obj":"BV_15"},{"id":"T92","span":{"begin":4401,"end":4415},"obj":"BV_15"},{"id":"T93","span":{"begin":4469,"end":4478},"obj":"SP_7"},{"id":"T94","span":{"begin":4568,"end":4579},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T95","span":{"begin":4614,"end":4623},"obj":"SP_7"},{"id":"T96","span":{"begin":4703,"end":4717},"obj":"BV_15"},{"id":"T97","span":{"begin":4763,"end":4772},"obj":"SP_7"},{"id":"T98","span":{"begin":4808,"end":4822},"obj":"BV_15"},{"id":"T99","span":{"begin":5991,"end":6005},"obj":"BV_15"},{"id":"T100","span":{"begin":6015,"end":6026},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T101","span":{"begin":6031,"end":6040},"obj":"SP_7"},{"id":"T102","span":{"begin":6051,"end":6060},"obj":"SP_7"},{"id":"T103","span":{"begin":6107,"end":6118},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T104","span":{"begin":6170,"end":6184},"obj":"BV_15"},{"id":"T105","span":{"begin":6261,"end":6275},"obj":"BV_15"},{"id":"T106","span":{"begin":6386,"end":6400},"obj":"BV_15"},{"id":"T107","span":{"begin":6505,"end":6516},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T108","span":{"begin":6582,"end":6593},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T109","span":{"begin":6601,"end":6612},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T110","span":{"begin":6685,"end":6699},"obj":"BV_15"},{"id":"T111","span":{"begin":6740,"end":6751},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T112","span":{"begin":6764,"end":6773},"obj":"SP_7"},{"id":"T113","span":{"begin":6856,"end":6867},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T114","span":{"begin":6889,"end":6898},"obj":"SP_7"},{"id":"T115","span":{"begin":6931,"end":6935},"obj":"SP_9"},{"id":"T116","span":{"begin":6941,"end":6950},"obj":"SP_7"},{"id":"T117","span":{"begin":7044,"end":7058},"obj":"BV_15"},{"id":"T118","span":{"begin":7108,"end":7111},"obj":"GO:0042611"},{"id":"T119","span":{"begin":7217,"end":7227},"obj":"SO:0001024"},{"id":"T120","span":{"begin":7286,"end":7291},"obj":"PR:000002009"},{"id":"T121","span":{"begin":7299,"end":7304},"obj":"PR:000002009"},{"id":"T122","span":{"begin":7312,"end":7317},"obj":"PR:000002010"},{"id":"T123","span":{"begin":7325,"end":7330},"obj":"PR:000002010"},{"id":"T124","span":{"begin":7341,"end":7346},"obj":"PR:000002011"},{"id":"T125","span":{"begin":7353,"end":7360},"obj":"SO:0001023"},{"id":"T126","span":{"begin":7388,"end":7391},"obj":"GO:0042611"},{"id":"T127","span":{"begin":7409,"end":7423},"obj":"BV_15"},{"id":"T128","span":{"begin":7493,"end":7500},"obj":"SO:0001023"},{"id":"T129","span":{"begin":7523,"end":7537},"obj":"BV_15"},{"id":"T130","span":{"begin":7619,"end":7633},"obj":"BV_15"},{"id":"T131","span":{"begin":7713,"end":7724},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T132","span":{"begin":7783,"end":7792},"obj":"SP_7"},{"id":"T133","span":{"begin":7842,"end":7849},"obj":"SO:0001023"},{"id":"T134","span":{"begin":7904,"end":7911},"obj":"SO:0001023"},{"id":"T135","span":{"begin":7916,"end":7930},"obj":"BV_15"},{"id":"T136","span":{"begin":7967,"end":7974},"obj":"SO:0001023"},{"id":"T137","span":{"begin":8047,"end":8053},"obj":"SO:0001023"},{"id":"T138","span":{"begin":8678,"end":8687},"obj":"SP_7"},{"id":"T139","span":{"begin":8702,"end":8705},"obj":"GO:0042611"},{"id":"T140","span":{"begin":8723,"end":8737},"obj":"BV_15"},{"id":"T141","span":{"begin":8753,"end":8756},"obj":"GO:0042611"},{"id":"T142","span":{"begin":8783,"end":8788},"obj":"PR:000002009"},{"id":"T143","span":{"begin":8796,"end":8801},"obj":"PR:000002009"},{"id":"T144","span":{"begin":8809,"end":8814},"obj":"PR:000002010"},{"id":"T145","span":{"begin":8822,"end":8827},"obj":"PR:000002010"},{"id":"T146","span":{"begin":8838,"end":8843},"obj":"PR:000002011"},{"id":"T147","span":{"begin":8850,"end":8857},"obj":"SO:0001023"},{"id":"T148","span":{"begin":8879,"end":8893},"obj":"BV_15"},{"id":"T149","span":{"begin":8919,"end":8933},"obj":"BV_15"},{"id":"T150","span":{"begin":8937,"end":8946},"obj":"SP_7"},{"id":"T151","span":{"begin":8972,"end":8980},"obj":"CHEBI:36357;CHEBI:36357"},{"id":"T152","span":{"begin":9118,"end":9124},"obj":"CL:0000084"},{"id":"T153","span":{"begin":9242,"end":9248},"obj":"CL:0000084"},{"id":"T154","span":{"begin":9296,"end":9302},"obj":"CL:0000084"},{"id":"T155","span":{"begin":9331,"end":9339},"obj":"CHEBI:59132;CHEBI:59132"},{"id":"T156","span":{"begin":9392,"end":9399},"obj":"CL:0000084"},{"id":"T157","span":{"begin":9525,"end":9530},"obj":"PR:000002009"},{"id":"T158","span":{"begin":9681,"end":9690},"obj":"SP_7"},{"id":"T159","span":{"begin":9723,"end":9727},"obj":"SP_9"},{"id":"T160","span":{"begin":9737,"end":9746},"obj":"SP_7"},{"id":"T161","span":{"begin":9954,"end":9968},"obj":"BV_15"},{"id":"T162","span":{"begin":10173,"end":10182},"obj":"SP_7"},{"id":"T163","span":{"begin":10293,"end":10298},"obj":"PR:000002009"},{"id":"T164","span":{"begin":10435,"end":10444},"obj":"SP_7"},{"id":"T165","span":{"begin":10518,"end":10522},"obj":"SP_9"},{"id":"T166","span":{"begin":10541,"end":10550},"obj":"SP_7"},{"id":"T167","span":{"begin":10551,"end":10555},"obj":"SO:0000236"},{"id":"T168","span":{"begin":10617,"end":10626},"obj":"SP_7"},{"id":"T169","span":{"begin":10735,"end":10740},"obj":"PR:000002009"},{"id":"T170","span":{"begin":11728,"end":11731},"obj":"GO:0042611"},{"id":"T171","span":{"begin":11949,"end":11952},"obj":"GO:0042611"},{"id":"T172","span":{"begin":11955,"end":11962},"obj":"PR:000002009"},{"id":"T173","span":{"begin":12079,"end":12086},"obj":"PR:000002009"},{"id":"T174","span":{"begin":12137,"end":12146},"obj":"SP_7"},{"id":"T175","span":{"begin":12180,"end":12194},"obj":"BV_15"},{"id":"T176","span":{"begin":12353,"end":12360},"obj":"PR:000002009"},{"id":"T177","span":{"begin":12364,"end":12373},"obj":"SO:0001024"},{"id":"T178","span":{"begin":12385,"end":12394},"obj":"SP_7"},{"id":"T179","span":{"begin":12597,"end":12602},"obj":"PR:000002009"},{"id":"T90647","span":{"begin":47,"end":55},"obj":"SP_10"},{"id":"T91789","span":{"begin":56,"end":67},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T36642","span":{"begin":94,"end":102},"obj":"BV_9"},{"id":"T61606","span":{"begin":199,"end":205},"obj":"CL:0000084;BV_23"},{"id":"T92404","span":{"begin":206,"end":212},"obj":"BV_23"},{"id":"T59646","span":{"begin":222,"end":227},"obj":"SP_6;NCBITaxon:9606"},{"id":"T46254","span":{"begin":240,"end":248},"obj":"NCBITaxon:1"},{"id":"T44920","span":{"begin":301,"end":310},"obj":"SP_7"},{"id":"T21846","span":{"begin":311,"end":330},"obj":"SO:0000236"},{"id":"T65235","span":{"begin":332,"end":336},"obj":"SO:0000236"},{"id":"T32217","span":{"begin":496,"end":504},"obj":"SP_10"},{"id":"T71600","span":{"begin":584,"end":591},"obj":"SO:0001023"},{"id":"T25480","span":{"begin":631,"end":636},"obj":"PR:000002009"},{"id":"T8945","span":{"begin":707,"end":710},"obj":"PR:000001004"},{"id":"T43204","span":{"begin":712,"end":719},"obj":"CL:0000084"},{"id":"T24098","span":{"begin":747,"end":756},"obj":"SP_7"},{"id":"T68353","span":{"begin":792,"end":803},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T10691","span":{"begin":804,"end":812},"obj":"SP_10"},{"id":"T43844","span":{"begin":2434,"end":2442},"obj":"SP_10"},{"id":"T38738","span":{"begin":2444,"end":2456},"obj":"SP_10"},{"id":"T69357","span":{"begin":2457,"end":2468},"obj":"SP_10;UBERON:0001004"},{"id":"T49984","span":{"begin":2469,"end":2489},"obj":"SP_10"},{"id":"T77904","span":{"begin":2512,"end":2521},"obj":"SP_7"},{"id":"T67615","span":{"begin":2585,"end":2596},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T6301","span":{"begin":2597,"end":2602},"obj":"NCBITaxon:10239"},{"id":"T83775","span":{"begin":2653,"end":2661},"obj":"SP_10"},{"id":"T79489","span":{"begin":2682,"end":2686},"obj":"UBERON:0002415"},{"id":"T30840","span":{"begin":2745,"end":2754},"obj":"SP_7"},{"id":"T18704","span":{"begin":2755,"end":2759},"obj":"SO:0000236"},{"id":"T25028","span":{"begin":2921,"end":2930},"obj":"SP_7"},{"id":"T38195","span":{"begin":2973,"end":2984},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T91224","span":{"begin":3156,"end":3164},"obj":"NCBITaxon:1"},{"id":"T26522","span":{"begin":3219,"end":3227},"obj":"BV_9"},{"id":"T51283","span":{"begin":3373,"end":3382},"obj":"SP_7"},{"id":"T83402","span":{"begin":3708,"end":3716},"obj":"SP_10"},{"id":"T38460","span":{"begin":3803,"end":3815},"obj":"SP_6;NCBITaxon:9606"},{"id":"T18430","span":{"begin":3896,"end":3905},"obj":"SP_7"},{"id":"T78372","span":{"begin":3949,"end":3963},"obj":"BV_15"},{"id":"T32405","span":{"begin":4016,"end":4030},"obj":"BV_15"},{"id":"T57245","span":{"begin":4066,"end":4080},"obj":"BV_15"},{"id":"T4440","span":{"begin":4182,"end":4196},"obj":"BV_15"},{"id":"T13636","span":{"begin":4229,"end":4238},"obj":"SP_7"},{"id":"T61633","span":{"begin":4279,"end":4293},"obj":"BV_15"},{"id":"T19852","span":{"begin":4401,"end":4415},"obj":"BV_15"},{"id":"T63857","span":{"begin":4469,"end":4478},"obj":"SP_7"},{"id":"T42242","span":{"begin":4568,"end":4579},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T74171","span":{"begin":4614,"end":4623},"obj":"SP_7"},{"id":"T89996","span":{"begin":4703,"end":4717},"obj":"BV_15"},{"id":"T99846","span":{"begin":4763,"end":4772},"obj":"SP_7"},{"id":"T22698","span":{"begin":4808,"end":4822},"obj":"BV_15"},{"id":"T23450","span":{"begin":5991,"end":6005},"obj":"BV_15"},{"id":"T46975","span":{"begin":6015,"end":6026},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T97466","span":{"begin":6031,"end":6040},"obj":"SP_7"},{"id":"T87936","span":{"begin":6051,"end":6060},"obj":"SP_7"},{"id":"T30689","span":{"begin":6107,"end":6118},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T76745","span":{"begin":6170,"end":6184},"obj":"BV_15"},{"id":"T34290","span":{"begin":6261,"end":6275},"obj":"BV_15"},{"id":"T17780","span":{"begin":6386,"end":6400},"obj":"BV_15"},{"id":"T91242","span":{"begin":6505,"end":6516},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T28529","span":{"begin":6582,"end":6593},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T28382","span":{"begin":6601,"end":6612},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T58994","span":{"begin":6685,"end":6699},"obj":"BV_15"},{"id":"T62473","span":{"begin":6740,"end":6751},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T49303","span":{"begin":6764,"end":6773},"obj":"SP_7"},{"id":"T4279","span":{"begin":6856,"end":6867},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T6626","span":{"begin":6889,"end":6898},"obj":"SP_7"},{"id":"T90148","span":{"begin":6931,"end":6935},"obj":"SP_9"},{"id":"T85766","span":{"begin":6941,"end":6950},"obj":"SP_7"},{"id":"T90107","span":{"begin":7044,"end":7058},"obj":"BV_15"},{"id":"T45797","span":{"begin":7108,"end":7111},"obj":"GO:0042611"},{"id":"T63293","span":{"begin":7217,"end":7227},"obj":"SO:0001024"},{"id":"T59388","span":{"begin":7286,"end":7291},"obj":"PR:000002009"},{"id":"T64753","span":{"begin":7299,"end":7304},"obj":"PR:000002009"},{"id":"T67356","span":{"begin":7312,"end":7317},"obj":"PR:000002010"},{"id":"T99742","span":{"begin":7325,"end":7330},"obj":"PR:000002010"},{"id":"T8696","span":{"begin":7341,"end":7346},"obj":"PR:000002011"},{"id":"T3771","span":{"begin":7353,"end":7360},"obj":"SO:0001023"},{"id":"T81007","span":{"begin":7388,"end":7391},"obj":"GO:0042611"},{"id":"T71652","span":{"begin":7409,"end":7423},"obj":"BV_15"},{"id":"T43291","span":{"begin":7493,"end":7500},"obj":"SO:0001023"},{"id":"T65127","span":{"begin":7523,"end":7537},"obj":"BV_15"},{"id":"T76335","span":{"begin":7619,"end":7633},"obj":"BV_15"},{"id":"T29057","span":{"begin":7713,"end":7724},"obj":"CHEBI:60816;CHEBI:60816"},{"id":"T69709","span":{"begin":7783,"end":7792},"obj":"SP_7"},{"id":"T97652","span":{"begin":7842,"end":7849},"obj":"SO:0001023"},{"id":"T30189","span":{"begin":7904,"end":7911},"obj":"SO:0001023"},{"id":"T17570","span":{"begin":7916,"end":7930},"obj":"BV_15"},{"id":"T56623","span":{"begin":7967,"end":7974},"obj":"SO:0001023"},{"id":"T32084","span":{"begin":8047,"end":8053},"obj":"SO:0001023"},{"id":"T12377","span":{"begin":8678,"end":8687},"obj":"SP_7"},{"id":"T98397","span":{"begin":8702,"end":8705},"obj":"GO:0042611"},{"id":"T94145","span":{"begin":8723,"end":8737},"obj":"BV_15"},{"id":"T75496","span":{"begin":8753,"end":8756},"obj":"GO:0042611"},{"id":"T7224","span":{"begin":8783,"end":8788},"obj":"PR:000002009"},{"id":"T38753","span":{"begin":8796,"end":8801},"obj":"PR:000002009"},{"id":"T92877","span":{"begin":8809,"end":8814},"obj":"PR:000002010"},{"id":"T36156","span":{"begin":8822,"end":8827},"obj":"PR:000002010"},{"id":"T68789","span":{"begin":8838,"end":8843},"obj":"PR:000002011"},{"id":"T46318","span":{"begin":8850,"end":8857},"obj":"SO:0001023"},{"id":"T4457","span":{"begin":8879,"end":8893},"obj":"BV_15"},{"id":"T59205","span":{"begin":8919,"end":8933},"obj":"BV_15"},{"id":"T33056","span":{"begin":8937,"end":8946},"obj":"SP_7"},{"id":"T536","span":{"begin":8972,"end":8980},"obj":"CHEBI:36357;CHEBI:36357"},{"id":"T9906","span":{"begin":9118,"end":9124},"obj":"CL:0000084"},{"id":"T69209","span":{"begin":9242,"end":9248},"obj":"CL:0000084"},{"id":"T36975","span":{"begin":9296,"end":9302},"obj":"CL:0000084"},{"id":"T33303","span":{"begin":9331,"end":9339},"obj":"CHEBI:59132;CHEBI:59132"},{"id":"T36223","span":{"begin":9392,"end":9399},"obj":"CL:0000084"},{"id":"T80986","span":{"begin":9525,"end":9530},"obj":"PR:000002009"},{"id":"T35114","span":{"begin":9681,"end":9690},"obj":"SP_7"},{"id":"T99554","span":{"begin":9723,"end":9727},"obj":"SP_9"},{"id":"T68802","span":{"begin":9737,"end":9746},"obj":"SP_7"},{"id":"T66664","span":{"begin":9954,"end":9968},"obj":"BV_15"},{"id":"T22144","span":{"begin":10173,"end":10182},"obj":"SP_7"},{"id":"T48296","span":{"begin":10293,"end":10298},"obj":"PR:000002009"},{"id":"T18213","span":{"begin":10435,"end":10444},"obj":"SP_7"},{"id":"T15461","span":{"begin":10518,"end":10522},"obj":"SP_9"},{"id":"T62919","span":{"begin":10541,"end":10550},"obj":"SP_7"},{"id":"T15838","span":{"begin":10551,"end":10555},"obj":"SO:0000236"},{"id":"T241","span":{"begin":10617,"end":10626},"obj":"SP_7"},{"id":"T1071","span":{"begin":10735,"end":10740},"obj":"PR:000002009"},{"id":"T4757","span":{"begin":11728,"end":11731},"obj":"GO:0042611"},{"id":"T28172","span":{"begin":11949,"end":11952},"obj":"GO:0042611"},{"id":"T77140","span":{"begin":11955,"end":11962},"obj":"PR:000002009"},{"id":"T91368","span":{"begin":12079,"end":12086},"obj":"PR:000002009"},{"id":"T69195","span":{"begin":12137,"end":12146},"obj":"SP_7"},{"id":"T26868","span":{"begin":12180,"end":12194},"obj":"BV_15"},{"id":"T24626","span":{"begin":12353,"end":12360},"obj":"PR:000002009"},{"id":"T89323","span":{"begin":12364,"end":12373},"obj":"SO:0001024"},{"id":"T65632","span":{"begin":12385,"end":12394},"obj":"SP_7"},{"id":"T76744","span":{"begin":12597,"end":12602},"obj":"PR:000002009"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-PD-FMA-UBERON

    {"project":"LitCovid-PD-FMA-UBERON","denotations":[{"id":"T6","span":{"begin":201,"end":205},"obj":"Body_part"},{"id":"T7","span":{"begin":580,"end":583},"obj":"Body_part"},{"id":"T8","span":{"begin":631,"end":634},"obj":"Body_part"},{"id":"T9","span":{"begin":714,"end":719},"obj":"Body_part"},{"id":"T10","span":{"begin":915,"end":927},"obj":"Body_part"},{"id":"T11","span":{"begin":929,"end":932},"obj":"Body_part"},{"id":"T12","span":{"begin":984,"end":991},"obj":"Body_part"},{"id":"T13","span":{"begin":1029,"end":1032},"obj":"Body_part"},{"id":"T14","span":{"begin":1089,"end":1096},"obj":"Body_part"},{"id":"T15","span":{"begin":1098,"end":1101},"obj":"Body_part"},{"id":"T16","span":{"begin":1153,"end":1160},"obj":"Body_part"},{"id":"T17","span":{"begin":1198,"end":1201},"obj":"Body_part"},{"id":"T18","span":{"begin":1248,"end":1251},"obj":"Body_part"},{"id":"T19","span":{"begin":1301,"end":1308},"obj":"Body_part"},{"id":"T20","span":{"begin":1349,"end":1356},"obj":"Body_part"},{"id":"T21","span":{"begin":1394,"end":1397},"obj":"Body_part"},{"id":"T22","span":{"begin":1444,"end":1447},"obj":"Body_part"},{"id":"T23","span":{"begin":1499,"end":1506},"obj":"Body_part"},{"id":"T24","span":{"begin":1544,"end":1547},"obj":"Body_part"},{"id":"T25","span":{"begin":1604,"end":1611},"obj":"Body_part"},{"id":"T26","span":{"begin":1613,"end":1616},"obj":"Body_part"},{"id":"T27","span":{"begin":1663,"end":1670},"obj":"Body_part"},{"id":"T28","span":{"begin":1706,"end":1709},"obj":"Body_part"},{"id":"T29","span":{"begin":1756,"end":1763},"obj":"Body_part"},{"id":"T30","span":{"begin":1765,"end":1768},"obj":"Body_part"},{"id":"T31","span":{"begin":1802,"end":1809},"obj":"Body_part"},{"id":"T32","span":{"begin":1811,"end":1814},"obj":"Body_part"},{"id":"T33","span":{"begin":1852,"end":1864},"obj":"Body_part"},{"id":"T34","span":{"begin":1876,"end":1879},"obj":"Body_part"},{"id":"T35","span":{"begin":1880,"end":1882},"obj":"Body_part"},{"id":"T36","span":{"begin":1911,"end":1923},"obj":"Body_part"},{"id":"T37","span":{"begin":1935,"end":1938},"obj":"Body_part"},{"id":"T38","span":{"begin":1939,"end":1941},"obj":"Body_part"},{"id":"T39","span":{"begin":1966,"end":1973},"obj":"Body_part"},{"id":"T40","span":{"begin":1975,"end":1978},"obj":"Body_part"},{"id":"T41","span":{"begin":2028,"end":2035},"obj":"Body_part"},{"id":"T42","span":{"begin":2037,"end":2040},"obj":"Body_part"},{"id":"T43","span":{"begin":2081,"end":2093},"obj":"Body_part"},{"id":"T44","span":{"begin":2105,"end":2108},"obj":"Body_part"},{"id":"T45","span":{"begin":2142,"end":2149},"obj":"Body_part"},{"id":"T46","span":{"begin":2151,"end":2154},"obj":"Body_part"},{"id":"T47","span":{"begin":2192,"end":2204},"obj":"Body_part"},{"id":"T48","span":{"begin":2216,"end":2219},"obj":"Body_part"},{"id":"T49","span":{"begin":2267,"end":2274},"obj":"Body_part"},{"id":"T50","span":{"begin":2276,"end":2279},"obj":"Body_part"},{"id":"T51","span":{"begin":2341,"end":2348},"obj":"Body_part"},{"id":"T52","span":{"begin":2350,"end":2353},"obj":"Body_part"},{"id":"T53","span":{"begin":2408,"end":2415},"obj":"Body_part"},{"id":"T54","span":{"begin":2417,"end":2420},"obj":"Body_part"},{"id":"T55","span":{"begin":6979,"end":6990},"obj":"Body_part"},{"id":"T56","span":{"begin":7012,"end":7022},"obj":"Body_part"},{"id":"T57","span":{"begin":7108,"end":7111},"obj":"Body_part"},{"id":"T58","span":{"begin":7178,"end":7181},"obj":"Body_part"},{"id":"T59","span":{"begin":7286,"end":7289},"obj":"Body_part"},{"id":"T60","span":{"begin":7299,"end":7302},"obj":"Body_part"},{"id":"T61","span":{"begin":7312,"end":7315},"obj":"Body_part"},{"id":"T62","span":{"begin":7325,"end":7328},"obj":"Body_part"},{"id":"T63","span":{"begin":7341,"end":7344},"obj":"Body_part"},{"id":"T64","span":{"begin":7388,"end":7391},"obj":"Body_part"},{"id":"T65","span":{"begin":7489,"end":7492},"obj":"Body_part"},{"id":"T66","span":{"begin":7601,"end":7604},"obj":"Body_part"},{"id":"T67","span":{"begin":7838,"end":7841},"obj":"Body_part"},{"id":"T68","span":{"begin":7900,"end":7903},"obj":"Body_part"},{"id":"T69","span":{"begin":8043,"end":8046},"obj":"Body_part"},{"id":"T70","span":{"begin":8146,"end":8149},"obj":"Body_part"},{"id":"T71","span":{"begin":8702,"end":8705},"obj":"Body_part"},{"id":"T72","span":{"begin":8753,"end":8756},"obj":"Body_part"},{"id":"T73","span":{"begin":8783,"end":8786},"obj":"Body_part"},{"id":"T74","span":{"begin":8796,"end":8799},"obj":"Body_part"},{"id":"T75","span":{"begin":8809,"end":8812},"obj":"Body_part"},{"id":"T76","span":{"begin":8822,"end":8825},"obj":"Body_part"},{"id":"T77","span":{"begin":8838,"end":8841},"obj":"Body_part"},{"id":"T78","span":{"begin":9120,"end":9124},"obj":"Body_part"},{"id":"T79","span":{"begin":9244,"end":9248},"obj":"Body_part"},{"id":"T80","span":{"begin":9298,"end":9302},"obj":"Body_part"},{"id":"T81","span":{"begin":9394,"end":9399},"obj":"Body_part"},{"id":"T82","span":{"begin":9525,"end":9528},"obj":"Body_part"},{"id":"T83","span":{"begin":10293,"end":10296},"obj":"Body_part"},{"id":"T84","span":{"begin":10735,"end":10738},"obj":"Body_part"},{"id":"T85","span":{"begin":11728,"end":11731},"obj":"Body_part"},{"id":"T86","span":{"begin":11833,"end":11840},"obj":"Body_part"},{"id":"T87","span":{"begin":11849,"end":11855},"obj":"Body_part"},{"id":"T88","span":{"begin":11949,"end":11952},"obj":"Body_part"},{"id":"T89","span":{"begin":11955,"end":11958},"obj":"Body_part"},{"id":"T90","span":{"begin":12005,"end":12012},"obj":"Body_part"},{"id":"T91","span":{"begin":12023,"end":12029},"obj":"Body_part"},{"id":"T92","span":{"begin":12079,"end":12082},"obj":"Body_part"},{"id":"T93","span":{"begin":12353,"end":12356},"obj":"Body_part"},{"id":"T94","span":{"begin":12417,"end":12424},"obj":"Body_part"},{"id":"T95","span":{"begin":12425,"end":12431},"obj":"Body_part"},{"id":"T96","span":{"begin":12597,"end":12600},"obj":"Body_part"}],"attributes":[{"id":"A6","pred":"fma_id","subj":"T6","obj":"http://purl.org/sig/ont/fma/fma68646"},{"id":"A7","pred":"fma_id","subj":"T7","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A8","pred":"fma_id","subj":"T8","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A9","pred":"fma_id","subj":"T9","obj":"http://purl.org/sig/ont/fma/fma68646"},{"id":"A10","pred":"fma_id","subj":"T10","obj":"http://purl.org/sig/ont/fma/fma62925"},{"id":"A11","pred":"fma_id","subj":"T11","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A12","pred":"fma_id","subj":"T12","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A13","pred":"fma_id","subj":"T13","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A14","pred":"fma_id","subj":"T14","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A15","pred":"fma_id","subj":"T15","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A16","pred":"fma_id","subj":"T16","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A17","pred":"fma_id","subj":"T17","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A18","pred":"fma_id","subj":"T18","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A19","pred":"fma_id","subj":"T19","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A20","pred":"fma_id","subj":"T20","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A21","pred":"fma_id","subj":"T21","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A22","pred":"fma_id","subj":"T22","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A23","pred":"fma_id","subj":"T23","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A24","pred":"fma_id","subj":"T24","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A25","pred":"fma_id","subj":"T25","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A26","pred":"fma_id","subj":"T26","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A27","pred":"fma_id","subj":"T27","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A28","pred":"fma_id","subj":"T28","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A29","pred":"fma_id","subj":"T29","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A30","pred":"fma_id","subj":"T30","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A31","pred":"fma_id","subj":"T31","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A32","pred":"fma_id","subj":"T32","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A33","pred":"fma_id","subj":"T33","obj":"http://purl.org/sig/ont/fma/fma62925"},{"id":"A34","pred":"fma_id","subj":"T34","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A35","pred":"fma_id","subj":"T35","obj":"http://purl.org/sig/ont/fma/fma66595"},{"id":"A36","pred":"fma_id","subj":"T36","obj":"http://purl.org/sig/ont/fma/fma62925"},{"id":"A37","pred":"fma_id","subj":"T37","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A38","pred":"fma_id","subj":"T38","obj":"http://purl.org/sig/ont/fma/fma66595"},{"id":"A39","pred":"fma_id","subj":"T39","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A40","pred":"fma_id","subj":"T40","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A41","pred":"fma_id","subj":"T41","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A42","pred":"fma_id","subj":"T42","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A43","pred":"fma_id","subj":"T43","obj":"http://purl.org/sig/ont/fma/fma62925"},{"id":"A44","pred":"fma_id","subj":"T44","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A45","pred":"fma_id","subj":"T45","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A46","pred":"fma_id","subj":"T46","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A47","pred":"fma_id","subj":"T47","obj":"http://purl.org/sig/ont/fma/fma62925"},{"id":"A48","pred":"fma_id","subj":"T48","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A49","pred":"fma_id","subj":"T49","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A50","pred":"fma_id","subj":"T50","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A51","pred":"fma_id","subj":"T51","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A52","pred":"fma_id","subj":"T52","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A53","pred":"fma_id","subj":"T53","obj":"http://purl.org/sig/ont/fma/fma67257"},{"id":"A54","pred":"fma_id","subj":"T54","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A55","pred":"fma_id","subj":"T55","obj":"http://purl.org/sig/ont/fma/fma82739"},{"id":"A56","pred":"fma_id","subj":"T56","obj":"http://purl.org/sig/ont/fma/fma82739"},{"id":"A57","pred":"fma_id","subj":"T57","obj":"http://purl.org/sig/ont/fma/fma84079"},{"id":"A58","pred":"fma_id","subj":"T58","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A59","pred":"fma_id","subj":"T59","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A60","pred":"fma_id","subj":"T60","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A61","pred":"fma_id","subj":"T61","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A62","pred":"fma_id","subj":"T62","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A63","pred":"fma_id","subj":"T63","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A64","pred":"fma_id","subj":"T64","obj":"http://purl.org/sig/ont/fma/fma84079"},{"id":"A65","pred":"fma_id","subj":"T65","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A66","pred":"fma_id","subj":"T66","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A67","pred":"fma_id","subj":"T67","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A68","pred":"fma_id","subj":"T68","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A69","pred":"fma_id","subj":"T69","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A70","pred":"fma_id","subj":"T70","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A71","pred":"fma_id","subj":"T71","obj":"http://purl.org/sig/ont/fma/fma84079"},{"id":"A72","pred":"fma_id","subj":"T72","obj":"http://purl.org/sig/ont/fma/fma84079"},{"id":"A73","pred":"fma_id","subj":"T73","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A74","pred":"fma_id","subj":"T74","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A75","pred":"fma_id","subj":"T75","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A76","pred":"fma_id","subj":"T76","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A77","pred":"fma_id","subj":"T77","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A78","pred":"fma_id","subj":"T78","obj":"http://purl.org/sig/ont/fma/fma68646"},{"id":"A79","pred":"fma_id","subj":"T79","obj":"http://purl.org/sig/ont/fma/fma68646"},{"id":"A80","pred":"fma_id","subj":"T80","obj":"http://purl.org/sig/ont/fma/fma68646"},{"id":"A81","pred":"fma_id","subj":"T81","obj":"http://purl.org/sig/ont/fma/fma68646"},{"id":"A82","pred":"fma_id","subj":"T82","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A83","pred":"fma_id","subj":"T83","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A84","pred":"fma_id","subj":"T84","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A85","pred":"fma_id","subj":"T85","obj":"http://purl.org/sig/ont/fma/fma84079"},{"id":"A86","pred":"fma_id","subj":"T86","obj":"http://purl.org/sig/ont/fma/fma82757"},{"id":"A87","pred":"fma_id","subj":"T87","obj":"http://purl.org/sig/ont/fma/fma82766"},{"id":"A88","pred":"fma_id","subj":"T88","obj":"http://purl.org/sig/ont/fma/fma84079"},{"id":"A89","pred":"fma_id","subj":"T89","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A90","pred":"fma_id","subj":"T90","obj":"http://purl.org/sig/ont/fma/fma82757"},{"id":"A91","pred":"fma_id","subj":"T91","obj":"http://purl.org/sig/ont/fma/fma82766"},{"id":"A92","pred":"fma_id","subj":"T92","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A93","pred":"fma_id","subj":"T93","obj":"http://purl.org/sig/ont/fma/fma84795"},{"id":"A94","pred":"fma_id","subj":"T94","obj":"http://purl.org/sig/ont/fma/fma82757"},{"id":"A95","pred":"fma_id","subj":"T95","obj":"http://purl.org/sig/ont/fma/fma82766"},{"id":"A96","pred":"fma_id","subj":"T96","obj":"http://purl.org/sig/ont/fma/fma84795"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-PD-UBERON

    {"project":"LitCovid-PD-UBERON","denotations":[{"id":"T1","span":{"begin":2682,"end":2686},"obj":"Body_part"}],"attributes":[{"id":"A1","pred":"uberon_id","subj":"T1","obj":"http://purl.obolibrary.org/obo/UBERON_0002415"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-PD-MONDO

    {"project":"LitCovid-PD-MONDO","denotations":[{"id":"T6","span":{"begin":47,"end":51},"obj":"Disease"},{"id":"T7","span":{"begin":496,"end":504},"obj":"Disease"},{"id":"T8","span":{"begin":804,"end":812},"obj":"Disease"},{"id":"T9","span":{"begin":2280,"end":2283},"obj":"Disease"},{"id":"T10","span":{"begin":2434,"end":2442},"obj":"Disease"},{"id":"T11","span":{"begin":2444,"end":2477},"obj":"Disease"},{"id":"T12","span":{"begin":2653,"end":2657},"obj":"Disease"},{"id":"T13","span":{"begin":3708,"end":3712},"obj":"Disease"},{"id":"T14","span":{"begin":8088,"end":8090},"obj":"Disease"},{"id":"T15","span":{"begin":8098,"end":8100},"obj":"Disease"},{"id":"T16","span":{"begin":8108,"end":8110},"obj":"Disease"},{"id":"T17","span":{"begin":8118,"end":8120},"obj":"Disease"},{"id":"T18","span":{"begin":8128,"end":8130},"obj":"Disease"},{"id":"T19","span":{"begin":9325,"end":9330},"obj":"Disease"}],"attributes":[{"id":"A6","pred":"mondo_id","subj":"T6","obj":"http://purl.obolibrary.org/obo/MONDO_0005091"},{"id":"A7","pred":"mondo_id","subj":"T7","obj":"http://purl.obolibrary.org/obo/MONDO_0005091"},{"id":"A8","pred":"mondo_id","subj":"T8","obj":"http://purl.obolibrary.org/obo/MONDO_0005091"},{"id":"A9","pred":"mondo_id","subj":"T9","obj":"http://purl.obolibrary.org/obo/MONDO_0019440"},{"id":"A10","pred":"mondo_id","subj":"T10","obj":"http://purl.obolibrary.org/obo/MONDO_0005091"},{"id":"A11","pred":"mondo_id","subj":"T11","obj":"http://purl.obolibrary.org/obo/MONDO_0005091"},{"id":"A12","pred":"mondo_id","subj":"T12","obj":"http://purl.obolibrary.org/obo/MONDO_0005091"},{"id":"A13","pred":"mondo_id","subj":"T13","obj":"http://purl.obolibrary.org/obo/MONDO_0005091"},{"id":"A14","pred":"mondo_id","subj":"T14","obj":"http://purl.obolibrary.org/obo/MONDO_0005072"},{"id":"A15","pred":"mondo_id","subj":"T15","obj":"http://purl.obolibrary.org/obo/MONDO_0005072"},{"id":"A16","pred":"mondo_id","subj":"T16","obj":"http://purl.obolibrary.org/obo/MONDO_0005072"},{"id":"A17","pred":"mondo_id","subj":"T17","obj":"http://purl.obolibrary.org/obo/MONDO_0005072"},{"id":"A18","pred":"mondo_id","subj":"T18","obj":"http://purl.obolibrary.org/obo/MONDO_0005072"},{"id":"A19","pred":"mondo_id","subj":"T19","obj":"http://purl.obolibrary.org/obo/MONDO_0005070"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-PD-CLO

    {"project":"LitCovid-PD-CLO","denotations":[{"id":"T49","span":{"begin":68,"end":76},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T50","span":{"begin":138,"end":146},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T51","span":{"begin":199,"end":205},"obj":"http://purl.obolibrary.org/obo/CL_0000084"},{"id":"T52","span":{"begin":222,"end":230},"obj":"http://purl.obolibrary.org/obo/NCBITaxon_9606"},{"id":"T53","span":{"begin":240,"end":248},"obj":"http://purl.obolibrary.org/obo/OBI_0100026"},{"id":"T54","span":{"begin":240,"end":248},"obj":"http://purl.obolibrary.org/obo/UBERON_0000468"},{"id":"T55","span":{"begin":268,"end":269},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T56","span":{"begin":358,"end":366},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T57","span":{"begin":438,"end":446},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T58","span":{"begin":539,"end":547},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T59","span":{"begin":635,"end":636},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T60","span":{"begin":698,"end":701},"obj":"http://purl.obolibrary.org/obo/CLO_0053438"},{"id":"T61","span":{"begin":707,"end":710},"obj":"http://purl.obolibrary.org/obo/PR_000001004"},{"id":"T62","span":{"begin":712,"end":719},"obj":"http://purl.obolibrary.org/obo/CL_0000084"},{"id":"T63","span":{"begin":757,"end":765},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T64","span":{"begin":813,"end":821},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T65","span":{"begin":906,"end":914},"obj":"http://purl.obolibrary.org/obo/UBERON_0000158"},{"id":"T66","span":{"begin":933,"end":934},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T67","span":{"begin":1033,"end":1034},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T68","span":{"begin":1202,"end":1203},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T69","span":{"begin":1252,"end":1253},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T70","span":{"begin":1398,"end":1399},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T71","span":{"begin":1448,"end":1449},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T72","span":{"begin":1548,"end":1549},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T73","span":{"begin":1710,"end":1711},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T74","span":{"begin":1769,"end":1770},"obj":"http://purl.obolibrary.org/obo/CLO_0001021"},{"id":"T75","span":{"begin":1815,"end":1816},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T76","span":{"begin":1880,"end":1882},"obj":"http://purl.obolibrary.org/obo/CLO_0001562"},{"id":"T77","span":{"begin":1939,"end":1941},"obj":"http://purl.obolibrary.org/obo/CLO_0001562"},{"id":"T78","span":{"begin":1979,"end":1980},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T79","span":{"begin":2109,"end":2110},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T80","span":{"begin":2155,"end":2156},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T81","span":{"begin":2220,"end":2221},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T82","span":{"begin":2509,"end":2511},"obj":"http://purl.obolibrary.org/obo/CLO_0050507"},{"id":"T83","span":{"begin":2522,"end":2530},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T84","span":{"begin":2603,"end":2611},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T85","span":{"begin":2675,"end":2676},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T86","span":{"begin":2682,"end":2686},"obj":"http://purl.obolibrary.org/obo/UBERON_0002415"},{"id":"T87","span":{"begin":2776,"end":2784},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T88","span":{"begin":2931,"end":2939},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T89","span":{"begin":2985,"end":2993},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T90","span":{"begin":3003,"end":3004},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T91","span":{"begin":3060,"end":3068},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T92","span":{"begin":3103,"end":3104},"obj":"http://purl.obolibrary.org/obo/CLO_0001021"},{"id":"T93","span":{"begin":3123,"end":3131},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T94","span":{"begin":3156,"end":3164},"obj":"http://purl.obolibrary.org/obo/OBI_0100026"},{"id":"T95","span":{"begin":3156,"end":3164},"obj":"http://purl.obolibrary.org/obo/UBERON_0000468"},{"id":"T96","span":{"begin":3170,"end":3178},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T97","span":{"begin":3347,"end":3348},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T98","span":{"begin":3383,"end":3391},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T99","span":{"begin":3469,"end":3471},"obj":"http://purl.obolibrary.org/obo/CLO_0053799"},{"id":"T100","span":{"begin":3476,"end":3478},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T101","span":{"begin":3479,"end":3487},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T102","span":{"begin":3578,"end":3586},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T103","span":{"begin":3648,"end":3649},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T104","span":{"begin":3656,"end":3658},"obj":"http://purl.obolibrary.org/obo/CLO_0001313"},{"id":"T105","span":{"begin":3659,"end":3667},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T106","span":{"begin":3803,"end":3815},"obj":"http://purl.obolibrary.org/obo/NCBITaxon_9606"},{"id":"T107","span":{"begin":3925,"end":3933},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T108","span":{"begin":3978,"end":3986},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T109","span":{"begin":3995,"end":3996},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T110","span":{"begin":4111,"end":4119},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T111","span":{"begin":4151,"end":4152},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T112","span":{"begin":4208,"end":4209},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T113","span":{"begin":4239,"end":4247},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T114","span":{"begin":4324,"end":4326},"obj":"http://purl.obolibrary.org/obo/CLO_0001382"},{"id":"T115","span":{"begin":4432,"end":4440},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T116","span":{"begin":4456,"end":4458},"obj":"http://purl.obolibrary.org/obo/CLO_0050507"},{"id":"T117","span":{"begin":4466,"end":4468},"obj":"http://purl.obolibrary.org/obo/CLO_0001382"},{"id":"T118","span":{"begin":4479,"end":4487},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T119","span":{"begin":4624,"end":4632},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T120","span":{"begin":4638,"end":4639},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T121","span":{"begin":4675,"end":4677},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T122","span":{"begin":4695,"end":4696},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T123","span":{"begin":4760,"end":4762},"obj":"http://purl.obolibrary.org/obo/CLO_0050507"},{"id":"T124","span":{"begin":4773,"end":4781},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T125","span":{"begin":4789,"end":4790},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T126","span":{"begin":4847,"end":4855},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T127","span":{"begin":6041,"end":6049},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T128","span":{"begin":6061,"end":6069},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T129","span":{"begin":6077,"end":6078},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T130","span":{"begin":6119,"end":6127},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T131","span":{"begin":6285,"end":6286},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T132","span":{"begin":6287,"end":6294},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T133","span":{"begin":6318,"end":6319},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T134","span":{"begin":6476,"end":6477},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T135","span":{"begin":6517,"end":6525},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T136","span":{"begin":6630,"end":6633},"obj":"http://purl.obolibrary.org/obo/CLO_0001755"},{"id":"T137","span":{"begin":6752,"end":6760},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T138","span":{"begin":6786,"end":6787},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T139","span":{"begin":6836,"end":6837},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T140","span":{"begin":6868,"end":6876},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T141","span":{"begin":6965,"end":6966},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T142","span":{"begin":7068,"end":7076},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T143","span":{"begin":7206,"end":7213},"obj":"http://purl.obolibrary.org/obo/CLO_0009985"},{"id":"T144","span":{"begin":7290,"end":7291},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T145","span":{"begin":7303,"end":7304},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T146","span":{"begin":7316,"end":7317},"obj":"http://purl.obolibrary.org/obo/CLO_0001021"},{"id":"T147","span":{"begin":7329,"end":7330},"obj":"http://purl.obolibrary.org/obo/CLO_0001021"},{"id":"T148","span":{"begin":7373,"end":7376},"obj":"http://purl.obolibrary.org/obo/CLO_0001302"},{"id":"T149","span":{"begin":7450,"end":7458},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T150","span":{"begin":7695,"end":7696},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T151","span":{"begin":7799,"end":7807},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T152","span":{"begin":8174,"end":8178},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T153","span":{"begin":8180,"end":8187},"obj":"http://purl.obolibrary.org/obo/CLO_0053001"},{"id":"T154","span":{"begin":8212,"end":8216},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T155","span":{"begin":8218,"end":8225},"obj":"http://purl.obolibrary.org/obo/CLO_0053001"},{"id":"T156","span":{"begin":8247,"end":8251},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T157","span":{"begin":8285,"end":8289},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T158","span":{"begin":8322,"end":8326},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T159","span":{"begin":8407,"end":8411},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T160","span":{"begin":8512,"end":8516},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T161","span":{"begin":8550,"end":8554},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T162","span":{"begin":8591,"end":8595},"obj":"http://purl.obolibrary.org/obo/CLO_0053733"},{"id":"T163","span":{"begin":8688,"end":8696},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T164","span":{"begin":8787,"end":8788},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T165","span":{"begin":8800,"end":8801},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T166","span":{"begin":8813,"end":8814},"obj":"http://purl.obolibrary.org/obo/CLO_0001021"},{"id":"T167","span":{"begin":8826,"end":8827},"obj":"http://purl.obolibrary.org/obo/CLO_0001021"},{"id":"T168","span":{"begin":8947,"end":8955},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T169","span":{"begin":8963,"end":8966},"obj":"http://purl.obolibrary.org/obo/CLO_0053438"},{"id":"T170","span":{"begin":9118,"end":9124},"obj":"http://purl.obolibrary.org/obo/CL_0000084"},{"id":"T171","span":{"begin":9242,"end":9248},"obj":"http://purl.obolibrary.org/obo/CL_0000084"},{"id":"T172","span":{"begin":9266,"end":9269},"obj":"http://purl.obolibrary.org/obo/CLO_0051582"},{"id":"T173","span":{"begin":9275,"end":9287},"obj":"http://purl.obolibrary.org/obo/OBI_0000968"},{"id":"T174","span":{"begin":9296,"end":9302},"obj":"http://purl.obolibrary.org/obo/CL_0000084"},{"id":"T175","span":{"begin":9380,"end":9381},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T176","span":{"begin":9392,"end":9399},"obj":"http://purl.obolibrary.org/obo/CL_0000084"},{"id":"T177","span":{"begin":9450,"end":9453},"obj":"http://purl.obolibrary.org/obo/CLO_0053438"},{"id":"T178","span":{"begin":9504,"end":9511},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T179","span":{"begin":9529,"end":9530},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T180","span":{"begin":9585,"end":9586},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T181","span":{"begin":9691,"end":9698},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T182","span":{"begin":9762,"end":9770},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T183","span":{"begin":9786,"end":9796},"obj":"http://purl.obolibrary.org/obo/CLO_0001658"},{"id":"T184","span":{"begin":9884,"end":9891},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T185","span":{"begin":9941,"end":9942},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T186","span":{"begin":10017,"end":10027},"obj":"http://purl.obolibrary.org/obo/CLO_0001658"},{"id":"T187","span":{"begin":10183,"end":10191},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T188","span":{"begin":10197,"end":10198},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T189","span":{"begin":10219,"end":10227},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T190","span":{"begin":10245,"end":10253},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T191","span":{"begin":10297,"end":10298},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T192","span":{"begin":10445,"end":10453},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T193","span":{"begin":10633,"end":10641},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T194","span":{"begin":10739,"end":10740},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T195","span":{"begin":10789,"end":10796},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T196","span":{"begin":10813,"end":10823},"obj":"http://purl.obolibrary.org/obo/CLO_0001658"},{"id":"T197","span":{"begin":11766,"end":11774},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T198","span":{"begin":11883,"end":11885},"obj":"http://purl.obolibrary.org/obo/CLO_0008307"},{"id":"T199","span":{"begin":11894,"end":11896},"obj":"http://purl.obolibrary.org/obo/CLO_0008343"},{"id":"T200","span":{"begin":11975,"end":11983},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T201","span":{"begin":11991,"end":11999},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T202","span":{"begin":12016,"end":12018},"obj":"http://purl.obolibrary.org/obo/CLO_0008307"},{"id":"T203","span":{"begin":12033,"end":12035},"obj":"http://purl.obolibrary.org/obo/CLO_0008343"},{"id":"T204","span":{"begin":12111,"end":12118},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T205","span":{"begin":12147,"end":12155},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T206","span":{"begin":12167,"end":12175},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T207","span":{"begin":12214,"end":12222},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T208","span":{"begin":12275,"end":12283},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T209","span":{"begin":12401,"end":12409},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T210","span":{"begin":12453,"end":12461},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T211","span":{"begin":12601,"end":12602},"obj":"http://purl.obolibrary.org/obo/CLO_0001020"},{"id":"T212","span":{"begin":12659,"end":12666},"obj":"http://purl.obolibrary.org/obo/PR_000018263"},{"id":"T213","span":{"begin":12683,"end":12693},"obj":"http://purl.obolibrary.org/obo/CLO_0001658"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-PD-CHEBI

    {"project":"LitCovid-PD-CHEBI","denotations":[{"id":"T17","span":{"begin":68,"end":76},"obj":"Chemical"},{"id":"T18","span":{"begin":138,"end":146},"obj":"Chemical"},{"id":"T19","span":{"begin":358,"end":366},"obj":"Chemical"},{"id":"T20","span":{"begin":438,"end":446},"obj":"Chemical"},{"id":"T21","span":{"begin":539,"end":547},"obj":"Chemical"},{"id":"T22","span":{"begin":672,"end":674},"obj":"Chemical"},{"id":"T23","span":{"begin":757,"end":765},"obj":"Chemical"},{"id":"T24","span":{"begin":813,"end":821},"obj":"Chemical"},{"id":"T25","span":{"begin":915,"end":927},"obj":"Chemical"},{"id":"T26","span":{"begin":984,"end":991},"obj":"Chemical"},{"id":"T27","span":{"begin":1089,"end":1096},"obj":"Chemical"},{"id":"T28","span":{"begin":1108,"end":1110},"obj":"Chemical"},{"id":"T29","span":{"begin":1153,"end":1160},"obj":"Chemical"},{"id":"T30","span":{"begin":1301,"end":1308},"obj":"Chemical"},{"id":"T31","span":{"begin":1349,"end":1356},"obj":"Chemical"},{"id":"T32","span":{"begin":1499,"end":1506},"obj":"Chemical"},{"id":"T33","span":{"begin":1604,"end":1611},"obj":"Chemical"},{"id":"T34","span":{"begin":1663,"end":1670},"obj":"Chemical"},{"id":"T35","span":{"begin":1756,"end":1763},"obj":"Chemical"},{"id":"T36","span":{"begin":1802,"end":1809},"obj":"Chemical"},{"id":"T37","span":{"begin":1852,"end":1864},"obj":"Chemical"},{"id":"T38","span":{"begin":1911,"end":1923},"obj":"Chemical"},{"id":"T39","span":{"begin":1966,"end":1973},"obj":"Chemical"},{"id":"T40","span":{"begin":2028,"end":2035},"obj":"Chemical"},{"id":"T41","span":{"begin":2081,"end":2093},"obj":"Chemical"},{"id":"T42","span":{"begin":2142,"end":2149},"obj":"Chemical"},{"id":"T43","span":{"begin":2192,"end":2204},"obj":"Chemical"},{"id":"T44","span":{"begin":2267,"end":2274},"obj":"Chemical"},{"id":"T45","span":{"begin":2341,"end":2348},"obj":"Chemical"},{"id":"T46","span":{"begin":2408,"end":2415},"obj":"Chemical"},{"id":"T47","span":{"begin":2522,"end":2530},"obj":"Chemical"},{"id":"T48","span":{"begin":2603,"end":2611},"obj":"Chemical"},{"id":"T49","span":{"begin":2776,"end":2784},"obj":"Chemical"},{"id":"T50","span":{"begin":2931,"end":2939},"obj":"Chemical"},{"id":"T51","span":{"begin":2985,"end":2993},"obj":"Chemical"},{"id":"T52","span":{"begin":3060,"end":3068},"obj":"Chemical"},{"id":"T53","span":{"begin":3123,"end":3131},"obj":"Chemical"},{"id":"T54","span":{"begin":3170,"end":3178},"obj":"Chemical"},{"id":"T55","span":{"begin":3383,"end":3391},"obj":"Chemical"},{"id":"T56","span":{"begin":3479,"end":3487},"obj":"Chemical"},{"id":"T57","span":{"begin":3578,"end":3586},"obj":"Chemical"},{"id":"T58","span":{"begin":3659,"end":3667},"obj":"Chemical"},{"id":"T59","span":{"begin":3925,"end":3933},"obj":"Chemical"},{"id":"T60","span":{"begin":3978,"end":3986},"obj":"Chemical"},{"id":"T61","span":{"begin":4111,"end":4119},"obj":"Chemical"},{"id":"T62","span":{"begin":4239,"end":4247},"obj":"Chemical"},{"id":"T63","span":{"begin":4432,"end":4440},"obj":"Chemical"},{"id":"T64","span":{"begin":4479,"end":4487},"obj":"Chemical"},{"id":"T65","span":{"begin":4624,"end":4632},"obj":"Chemical"},{"id":"T66","span":{"begin":4773,"end":4781},"obj":"Chemical"},{"id":"T67","span":{"begin":4847,"end":4855},"obj":"Chemical"},{"id":"T68","span":{"begin":5367,"end":5369},"obj":"Chemical"},{"id":"T69","span":{"begin":6041,"end":6049},"obj":"Chemical"},{"id":"T70","span":{"begin":6061,"end":6069},"obj":"Chemical"},{"id":"T71","span":{"begin":6119,"end":6127},"obj":"Chemical"},{"id":"T72","span":{"begin":6287,"end":6294},"obj":"Chemical"},{"id":"T73","span":{"begin":6517,"end":6525},"obj":"Chemical"},{"id":"T74","span":{"begin":6752,"end":6760},"obj":"Chemical"},{"id":"T75","span":{"begin":6868,"end":6876},"obj":"Chemical"},{"id":"T76","span":{"begin":6979,"end":6990},"obj":"Chemical"},{"id":"T77","span":{"begin":6979,"end":6984},"obj":"Chemical"},{"id":"T78","span":{"begin":6985,"end":6990},"obj":"Chemical"},{"id":"T79","span":{"begin":7012,"end":7022},"obj":"Chemical"},{"id":"T80","span":{"begin":7012,"end":7017},"obj":"Chemical"},{"id":"T81","span":{"begin":7018,"end":7022},"obj":"Chemical"},{"id":"T82","span":{"begin":7068,"end":7076},"obj":"Chemical"},{"id":"T83","span":{"begin":7450,"end":7458},"obj":"Chemical"},{"id":"T84","span":{"begin":7799,"end":7807},"obj":"Chemical"},{"id":"T85","span":{"begin":8688,"end":8696},"obj":"Chemical"},{"id":"T86","span":{"begin":8947,"end":8955},"obj":"Chemical"},{"id":"T87","span":{"begin":8972,"end":8980},"obj":"Chemical"},{"id":"T88","span":{"begin":9331,"end":9339},"obj":"Chemical"},{"id":"T89","span":{"begin":9504,"end":9511},"obj":"Chemical"},{"id":"T90","span":{"begin":9691,"end":9698},"obj":"Chemical"},{"id":"T91","span":{"begin":9762,"end":9770},"obj":"Chemical"},{"id":"T92","span":{"begin":9884,"end":9891},"obj":"Chemical"},{"id":"T93","span":{"begin":10183,"end":10191},"obj":"Chemical"},{"id":"T94","span":{"begin":10219,"end":10227},"obj":"Chemical"},{"id":"T95","span":{"begin":10245,"end":10253},"obj":"Chemical"},{"id":"T96","span":{"begin":10445,"end":10453},"obj":"Chemical"},{"id":"T97","span":{"begin":10633,"end":10641},"obj":"Chemical"},{"id":"T98","span":{"begin":10789,"end":10796},"obj":"Chemical"},{"id":"T99","span":{"begin":11766,"end":11774},"obj":"Chemical"},{"id":"T100","span":{"begin":11833,"end":11840},"obj":"Chemical"},{"id":"T101","span":{"begin":11849,"end":11855},"obj":"Chemical"},{"id":"T102","span":{"begin":11883,"end":11885},"obj":"Chemical"},{"id":"T103","span":{"begin":11975,"end":11983},"obj":"Chemical"},{"id":"T104","span":{"begin":11991,"end":11999},"obj":"Chemical"},{"id":"T105","span":{"begin":12005,"end":12012},"obj":"Chemical"},{"id":"T106","span":{"begin":12016,"end":12018},"obj":"Chemical"},{"id":"T107","span":{"begin":12023,"end":12029},"obj":"Chemical"},{"id":"T108","span":{"begin":12108,"end":12110},"obj":"Chemical"},{"id":"T109","span":{"begin":12111,"end":12118},"obj":"Chemical"},{"id":"T110","span":{"begin":12147,"end":12155},"obj":"Chemical"},{"id":"T111","span":{"begin":12167,"end":12175},"obj":"Chemical"},{"id":"T112","span":{"begin":12214,"end":12222},"obj":"Chemical"},{"id":"T113","span":{"begin":12275,"end":12283},"obj":"Chemical"},{"id":"T114","span":{"begin":12401,"end":12409},"obj":"Chemical"},{"id":"T115","span":{"begin":12417,"end":12424},"obj":"Chemical"},{"id":"T116","span":{"begin":12425,"end":12431},"obj":"Chemical"},{"id":"T117","span":{"begin":12659,"end":12666},"obj":"Chemical"}],"attributes":[{"id":"A17","pred":"chebi_id","subj":"T17","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A18","pred":"chebi_id","subj":"T18","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A19","pred":"chebi_id","subj":"T19","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A20","pred":"chebi_id","subj":"T20","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A21","pred":"chebi_id","subj":"T21","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A22","pred":"chebi_id","subj":"T22","obj":"http://purl.obolibrary.org/obo/CHEBI_74067"},{"id":"A23","pred":"chebi_id","subj":"T23","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A24","pred":"chebi_id","subj":"T24","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A25","pred":"chebi_id","subj":"T25","obj":"http://purl.obolibrary.org/obo/CHEBI_17089"},{"id":"A26","pred":"chebi_id","subj":"T26","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A27","pred":"chebi_id","subj":"T27","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A28","pred":"chebi_id","subj":"T28","obj":"http://purl.obolibrary.org/obo/CHEBI_74067"},{"id":"A29","pred":"chebi_id","subj":"T29","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A30","pred":"chebi_id","subj":"T30","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A31","pred":"chebi_id","subj":"T31","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A32","pred":"chebi_id","subj":"T32","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A33","pred":"chebi_id","subj":"T33","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A34","pred":"chebi_id","subj":"T34","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A35","pred":"chebi_id","subj":"T35","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A36","pred":"chebi_id","subj":"T36","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A37","pred":"chebi_id","subj":"T37","obj":"http://purl.obolibrary.org/obo/CHEBI_17089"},{"id":"A38","pred":"chebi_id","subj":"T38","obj":"http://purl.obolibrary.org/obo/CHEBI_17089"},{"id":"A39","pred":"chebi_id","subj":"T39","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A40","pred":"chebi_id","subj":"T40","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A41","pred":"chebi_id","subj":"T41","obj":"http://purl.obolibrary.org/obo/CHEBI_17089"},{"id":"A42","pred":"chebi_id","subj":"T42","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A43","pred":"chebi_id","subj":"T43","obj":"http://purl.obolibrary.org/obo/CHEBI_17089"},{"id":"A44","pred":"chebi_id","subj":"T44","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A45","pred":"chebi_id","subj":"T45","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A46","pred":"chebi_id","subj":"T46","obj":"http://purl.obolibrary.org/obo/CHEBI_36080"},{"id":"A47","pred":"chebi_id","subj":"T47","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A48","pred":"chebi_id","subj":"T48","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A49","pred":"chebi_id","subj":"T49","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A50","pred":"chebi_id","subj":"T50","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A51","pred":"chebi_id","subj":"T51","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A52","pred":"chebi_id","subj":"T52","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A53","pred":"chebi_id","subj":"T53","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A54","pred":"chebi_id","subj":"T54","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A55","pred":"chebi_id","subj":"T55","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A56","pred":"chebi_id","subj":"T56","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A57","pred":"chebi_id","subj":"T57","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A58","pred":"chebi_id","subj":"T58","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A59","pred":"chebi_id","subj":"T59","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A60","pred":"chebi_id","subj":"T60","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A61","pred":"chebi_id","subj":"T61","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A62","pred":"chebi_id","subj":"T62","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A63","pred":"chebi_id","subj":"T63","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A64","pred":"chebi_id","subj":"T64","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A65","pred":"chebi_id","subj":"T65","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A66","pred":"chebi_id","subj":"T66","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A67","pred":"chebi_id","subj":"T67","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A68","pred":"chebi_id","subj":"T68","obj":"http://purl.obolibrary.org/obo/CHEBI_141447"},{"id":"A69","pred":"chebi_id","subj":"T69","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A70","pred":"chebi_id","subj":"T70","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A71","pred":"chebi_id","subj":"T71","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A72","pred":"chebi_id","subj":"T72","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A73","pred":"chebi_id","subj":"T73","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A74","pred":"chebi_id","subj":"T74","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A75","pred":"chebi_id","subj":"T75","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A76","pred":"chebi_id","subj":"T76","obj":"http://purl.obolibrary.org/obo/CHEBI_33709"},{"id":"A77","pred":"chebi_id","subj":"T77","obj":"http://purl.obolibrary.org/obo/CHEBI_46882"},{"id":"A78","pred":"chebi_id","subj":"T78","obj":"http://purl.obolibrary.org/obo/CHEBI_37527"},{"id":"A79","pred":"chebi_id","subj":"T79","obj":"http://purl.obolibrary.org/obo/CHEBI_33709"},{"id":"A80","pred":"chebi_id","subj":"T80","obj":"http://purl.obolibrary.org/obo/CHEBI_46882"},{"id":"A81","pred":"chebi_id","subj":"T81","obj":"http://purl.obolibrary.org/obo/CHEBI_37527"},{"id":"A82","pred":"chebi_id","subj":"T82","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A83","pred":"chebi_id","subj":"T83","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A84","pred":"chebi_id","subj":"T84","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A85","pred":"chebi_id","subj":"T85","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A86","pred":"chebi_id","subj":"T86","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A87","pred":"chebi_id","subj":"T87","obj":"http://purl.obolibrary.org/obo/CHEBI_25367"},{"id":"A88","pred":"chebi_id","subj":"T88","obj":"http://purl.obolibrary.org/obo/CHEBI_59132"},{"id":"A89","pred":"chebi_id","subj":"T89","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A90","pred":"chebi_id","subj":"T90","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A91","pred":"chebi_id","subj":"T91","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A92","pred":"chebi_id","subj":"T92","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A93","pred":"chebi_id","subj":"T93","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A94","pred":"chebi_id","subj":"T94","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A95","pred":"chebi_id","subj":"T95","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A96","pred":"chebi_id","subj":"T96","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A97","pred":"chebi_id","subj":"T97","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A98","pred":"chebi_id","subj":"T98","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A99","pred":"chebi_id","subj":"T99","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A100","pred":"chebi_id","subj":"T100","obj":"http://purl.obolibrary.org/obo/CHEBI_25017"},{"id":"A101","pred":"chebi_id","subj":"T101","obj":"http://purl.obolibrary.org/obo/CHEBI_27266"},{"id":"A102","pred":"chebi_id","subj":"T102","obj":"http://purl.obolibrary.org/obo/CHEBI_33472"},{"id":"A103","pred":"chebi_id","subj":"T103","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A104","pred":"chebi_id","subj":"T104","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A105","pred":"chebi_id","subj":"T105","obj":"http://purl.obolibrary.org/obo/CHEBI_25017"},{"id":"A106","pred":"chebi_id","subj":"T106","obj":"http://purl.obolibrary.org/obo/CHEBI_33472"},{"id":"A107","pred":"chebi_id","subj":"T107","obj":"http://purl.obolibrary.org/obo/CHEBI_27266"},{"id":"A108","pred":"chebi_id","subj":"T108","obj":"http://purl.obolibrary.org/obo/CHEBI_73579"},{"id":"A109","pred":"chebi_id","subj":"T109","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A110","pred":"chebi_id","subj":"T110","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A111","pred":"chebi_id","subj":"T111","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A112","pred":"chebi_id","subj":"T112","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A113","pred":"chebi_id","subj":"T113","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A114","pred":"chebi_id","subj":"T114","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"},{"id":"A115","pred":"chebi_id","subj":"T115","obj":"http://purl.obolibrary.org/obo/CHEBI_25017"},{"id":"A116","pred":"chebi_id","subj":"T116","obj":"http://purl.obolibrary.org/obo/CHEBI_27266"},{"id":"A117","pred":"chebi_id","subj":"T117","obj":"http://purl.obolibrary.org/obo/CHEBI_16670"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-PD-HP

    {"project":"LitCovid-PD-HP","denotations":[{"id":"T1","span":{"begin":9325,"end":9330},"obj":"Phenotype"}],"attributes":[{"id":"A1","pred":"hp_id","subj":"T1","obj":"http://purl.obolibrary.org/obo/HP_0002664"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    LitCovid-sentences

    {"project":"LitCovid-sentences","denotations":[{"id":"T26","span":{"begin":0,"end":7},"obj":"Sentence"},{"id":"T27","span":{"begin":9,"end":120},"obj":"Sentence"},{"id":"T28","span":{"begin":121,"end":249},"obj":"Sentence"},{"id":"T29","span":{"begin":250,"end":395},"obj":"Sentence"},{"id":"T30","span":{"begin":396,"end":532},"obj":"Sentence"},{"id":"T31","span":{"begin":533,"end":733},"obj":"Sentence"},{"id":"T32","span":{"begin":734,"end":742},"obj":"Sentence"},{"id":"T33","span":{"begin":744,"end":822},"obj":"Sentence"},{"id":"T34","span":{"begin":823,"end":881},"obj":"Sentence"},{"id":"T35","span":{"begin":882,"end":941},"obj":"Sentence"},{"id":"T36","span":{"begin":942,"end":991},"obj":"Sentence"},{"id":"T37","span":{"begin":992,"end":1041},"obj":"Sentence"},{"id":"T38","span":{"begin":1042,"end":1110},"obj":"Sentence"},{"id":"T39","span":{"begin":1111,"end":1160},"obj":"Sentence"},{"id":"T40","span":{"begin":1161,"end":1210},"obj":"Sentence"},{"id":"T41","span":{"begin":1211,"end":1260},"obj":"Sentence"},{"id":"T42","span":{"begin":1261,"end":1308},"obj":"Sentence"},{"id":"T43","span":{"begin":1309,"end":1356},"obj":"Sentence"},{"id":"T44","span":{"begin":1357,"end":1406},"obj":"Sentence"},{"id":"T45","span":{"begin":1407,"end":1456},"obj":"Sentence"},{"id":"T46","span":{"begin":1457,"end":1506},"obj":"Sentence"},{"id":"T47","span":{"begin":1507,"end":1556},"obj":"Sentence"},{"id":"T48","span":{"begin":1557,"end":1624},"obj":"Sentence"},{"id":"T49","span":{"begin":1625,"end":1670},"obj":"Sentence"},{"id":"T50","span":{"begin":1671,"end":1718},"obj":"Sentence"},{"id":"T51","span":{"begin":1719,"end":1777},"obj":"Sentence"},{"id":"T52","span":{"begin":1778,"end":1823},"obj":"Sentence"},{"id":"T53","span":{"begin":1824,"end":1882},"obj":"Sentence"},{"id":"T54","span":{"begin":1883,"end":1941},"obj":"Sentence"},{"id":"T55","span":{"begin":1942,"end":1987},"obj":"Sentence"},{"id":"T56","span":{"begin":1988,"end":2052},"obj":"Sentence"},{"id":"T57","span":{"begin":2053,"end":2117},"obj":"Sentence"},{"id":"T58","span":{"begin":2118,"end":2163},"obj":"Sentence"},{"id":"T59","span":{"begin":2164,"end":2228},"obj":"Sentence"},{"id":"T60","span":{"begin":2229,"end":2302},"obj":"Sentence"},{"id":"T61","span":{"begin":2303,"end":2365},"obj":"Sentence"},{"id":"T62","span":{"begin":2366,"end":2432},"obj":"Sentence"},{"id":"T63","span":{"begin":2433,"end":2443},"obj":"Sentence"},{"id":"T64","span":{"begin":2444,"end":2489},"obj":"Sentence"},{"id":"T65","span":{"begin":2491,"end":2611},"obj":"Sentence"},{"id":"T66","span":{"begin":2612,"end":2807},"obj":"Sentence"},{"id":"T67","span":{"begin":2808,"end":2909},"obj":"Sentence"},{"id":"T68","span":{"begin":2910,"end":2919},"obj":"Sentence"},{"id":"T69","span":{"begin":2921,"end":3002},"obj":"Sentence"},{"id":"T70","span":{"begin":3003,"end":3005},"obj":"Sentence"},{"id":"T71","span":{"begin":3006,"end":3102},"obj":"Sentence"},{"id":"T72","span":{"begin":3103,"end":3105},"obj":"Sentence"},{"id":"T73","span":{"begin":3106,"end":3165},"obj":"Sentence"},{"id":"T74","span":{"begin":3166,"end":3288},"obj":"Sentence"},{"id":"T75","span":{"begin":3289,"end":3427},"obj":"Sentence"},{"id":"T76","span":{"begin":3428,"end":3566},"obj":"Sentence"},{"id":"T77","span":{"begin":3567,"end":3717},"obj":"Sentence"},{"id":"T78","span":{"begin":3718,"end":3816},"obj":"Sentence"},{"id":"T79","span":{"begin":3817,"end":4137},"obj":"Sentence"},{"id":"T80","span":{"begin":4138,"end":4313},"obj":"Sentence"},{"id":"T81","span":{"begin":4314,"end":4441},"obj":"Sentence"},{"id":"T82","span":{"begin":4442,"end":4591},"obj":"Sentence"},{"id":"T83","span":{"begin":4592,"end":4741},"obj":"Sentence"},{"id":"T84","span":{"begin":4742,"end":4750},"obj":"Sentence"},{"id":"T85","span":{"begin":4752,"end":4856},"obj":"Sentence"},{"id":"T86","span":{"begin":4857,"end":4910},"obj":"Sentence"},{"id":"T87","span":{"begin":4911,"end":4948},"obj":"Sentence"},{"id":"T88","span":{"begin":4949,"end":4989},"obj":"Sentence"},{"id":"T89","span":{"begin":4990,"end":5029},"obj":"Sentence"},{"id":"T90","span":{"begin":5030,"end":5102},"obj":"Sentence"},{"id":"T91","span":{"begin":5103,"end":5154},"obj":"Sentence"},{"id":"T92","span":{"begin":5155,"end":5207},"obj":"Sentence"},{"id":"T93","span":{"begin":5208,"end":5260},"obj":"Sentence"},{"id":"T94","span":{"begin":5261,"end":5301},"obj":"Sentence"},{"id":"T95","span":{"begin":5302,"end":5354},"obj":"Sentence"},{"id":"T96","span":{"begin":5355,"end":5389},"obj":"Sentence"},{"id":"T97","span":{"begin":5390,"end":5447},"obj":"Sentence"},{"id":"T98","span":{"begin":5448,"end":5506},"obj":"Sentence"},{"id":"T99","span":{"begin":5507,"end":5559},"obj":"Sentence"},{"id":"T100","span":{"begin":5560,"end":5594},"obj":"Sentence"},{"id":"T101","span":{"begin":5595,"end":5629},"obj":"Sentence"},{"id":"T102","span":{"begin":5630,"end":5687},"obj":"Sentence"},{"id":"T103","span":{"begin":5688,"end":5721},"obj":"Sentence"},{"id":"T104","span":{"begin":5722,"end":5774},"obj":"Sentence"},{"id":"T105","span":{"begin":5775,"end":5814},"obj":"Sentence"},{"id":"T106","span":{"begin":5815,"end":5857},"obj":"Sentence"},{"id":"T107","span":{"begin":5858,"end":5916},"obj":"Sentence"},{"id":"T108","span":{"begin":5917,"end":5969},"obj":"Sentence"},{"id":"T109","span":{"begin":5970,"end":5979},"obj":"Sentence"},{"id":"T110","span":{"begin":5981,"end":6050},"obj":"Sentence"},{"id":"T111","span":{"begin":6051,"end":6214},"obj":"Sentence"},{"id":"T112","span":{"begin":6215,"end":6448},"obj":"Sentence"},{"id":"T113","span":{"begin":6449,"end":6614},"obj":"Sentence"},{"id":"T114","span":{"begin":6615,"end":6720},"obj":"Sentence"},{"id":"T115","span":{"begin":6722,"end":6782},"obj":"Sentence"},{"id":"T116","span":{"begin":6783,"end":6917},"obj":"Sentence"},{"id":"T117","span":{"begin":6918,"end":7039},"obj":"Sentence"},{"id":"T118","span":{"begin":7040,"end":7188},"obj":"Sentence"},{"id":"T119","span":{"begin":7189,"end":7378},"obj":"Sentence"},{"id":"T120","span":{"begin":7379,"end":7557},"obj":"Sentence"},{"id":"T121","span":{"begin":7558,"end":7658},"obj":"Sentence"},{"id":"T122","span":{"begin":7659,"end":7772},"obj":"Sentence"},{"id":"T123","span":{"begin":7773,"end":7781},"obj":"Sentence"},{"id":"T124","span":{"begin":7783,"end":7952},"obj":"Sentence"},{"id":"T125","span":{"begin":7953,"end":8054},"obj":"Sentence"},{"id":"T126","span":{"begin":8055,"end":8149},"obj":"Sentence"},{"id":"T127","span":{"begin":8150,"end":8187},"obj":"Sentence"},{"id":"T128","span":{"begin":8188,"end":8225},"obj":"Sentence"},{"id":"T129","span":{"begin":8226,"end":8263},"obj":"Sentence"},{"id":"T130","span":{"begin":8264,"end":8301},"obj":"Sentence"},{"id":"T131","span":{"begin":8302,"end":8338},"obj":"Sentence"},{"id":"T132","span":{"begin":8339,"end":8376},"obj":"Sentence"},{"id":"T133","span":{"begin":8377,"end":8414},"obj":"Sentence"},{"id":"T134","span":{"begin":8415,"end":8452},"obj":"Sentence"},{"id":"T135","span":{"begin":8453,"end":8490},"obj":"Sentence"},{"id":"T136","span":{"begin":8491,"end":8528},"obj":"Sentence"},{"id":"T137","span":{"begin":8529,"end":8566},"obj":"Sentence"},{"id":"T138","span":{"begin":8567,"end":8604},"obj":"Sentence"},{"id":"T139","span":{"begin":8605,"end":8642},"obj":"Sentence"},{"id":"T140","span":{"begin":8643,"end":8652},"obj":"Sentence"},{"id":"T141","span":{"begin":8654,"end":8748},"obj":"Sentence"},{"id":"T142","span":{"begin":8749,"end":8917},"obj":"Sentence"},{"id":"T143","span":{"begin":8919,"end":8980},"obj":"Sentence"},{"id":"T144","span":{"begin":8981,"end":9142},"obj":"Sentence"},{"id":"T145","span":{"begin":9143,"end":9241},"obj":"Sentence"},{"id":"T146","span":{"begin":9242,"end":9363},"obj":"Sentence"},{"id":"T147","span":{"begin":9364,"end":9537},"obj":"Sentence"},{"id":"T148","span":{"begin":9538,"end":9699},"obj":"Sentence"},{"id":"T149","span":{"begin":9700,"end":9986},"obj":"Sentence"},{"id":"T150","span":{"begin":9987,"end":10132},"obj":"Sentence"},{"id":"T151","span":{"begin":10133,"end":10234},"obj":"Sentence"},{"id":"T152","span":{"begin":10235,"end":10363},"obj":"Sentence"},{"id":"T153","span":{"begin":10364,"end":10373},"obj":"Sentence"},{"id":"T154","span":{"begin":10375,"end":10454},"obj":"Sentence"},{"id":"T155","span":{"begin":10455,"end":10606},"obj":"Sentence"},{"id":"T156","span":{"begin":10607,"end":10615},"obj":"Sentence"},{"id":"T157","span":{"begin":10617,"end":10788},"obj":"Sentence"},{"id":"T158","span":{"begin":10789,"end":10867},"obj":"Sentence"},{"id":"T159","span":{"begin":10868,"end":10932},"obj":"Sentence"},{"id":"T160","span":{"begin":10933,"end":10996},"obj":"Sentence"},{"id":"T161","span":{"begin":10997,"end":11059},"obj":"Sentence"},{"id":"T162","span":{"begin":11060,"end":11124},"obj":"Sentence"},{"id":"T163","span":{"begin":11125,"end":11188},"obj":"Sentence"},{"id":"T164","span":{"begin":11189,"end":11253},"obj":"Sentence"},{"id":"T165","span":{"begin":11254,"end":11318},"obj":"Sentence"},{"id":"T166","span":{"begin":11319,"end":11383},"obj":"Sentence"},{"id":"T167","span":{"begin":11384,"end":11447},"obj":"Sentence"},{"id":"T168","span":{"begin":11448,"end":11512},"obj":"Sentence"},{"id":"T169","span":{"begin":11513,"end":11575},"obj":"Sentence"},{"id":"T170","span":{"begin":11576,"end":11639},"obj":"Sentence"},{"id":"T171","span":{"begin":11640,"end":11911},"obj":"Sentence"},{"id":"T172","span":{"begin":11912,"end":12092},"obj":"Sentence"},{"id":"T173","span":{"begin":12093,"end":12240},"obj":"Sentence"},{"id":"T174","span":{"begin":12241,"end":12374},"obj":"Sentence"},{"id":"T175","span":{"begin":12375,"end":12383},"obj":"Sentence"},{"id":"T176","span":{"begin":12385,"end":12452},"obj":"Sentence"},{"id":"T177","span":{"begin":12453,"end":12658},"obj":"Sentence"},{"id":"T178","span":{"begin":12659,"end":12737},"obj":"Sentence"},{"id":"T179","span":{"begin":12738,"end":12799},"obj":"Sentence"},{"id":"T180","span":{"begin":12800,"end":12861},"obj":"Sentence"},{"id":"T181","span":{"begin":12862,"end":12922},"obj":"Sentence"},{"id":"T182","span":{"begin":12923,"end":12984},"obj":"Sentence"},{"id":"T183","span":{"begin":12985,"end":13046},"obj":"Sentence"},{"id":"T184","span":{"begin":13047,"end":13108},"obj":"Sentence"}],"namespaces":[{"prefix":"_base","uri":"http://pubannotation.org/ontology/tao.owl#"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    MyTest

    {"project":"MyTest","denotations":[{"id":"32269766-30357391-30420970","span":{"begin":157,"end":158},"obj":"30357391"},{"id":"32269766-30144804-30420971","span":{"begin":4037,"end":4039},"obj":"30144804"},{"id":"32269766-28978689-30420972","span":{"begin":7164,"end":7166},"obj":"28978689"},{"id":"32269766-31695703-30420973","span":{"begin":9612,"end":9614},"obj":"31695703"},{"id":"32269766-31695703-30420974","span":{"begin":10505,"end":10507},"obj":"31695703"},{"id":"32269766-1709722-30420975","span":{"begin":12090,"end":12091},"obj":"1709722"}],"namespaces":[{"prefix":"_base","uri":"https://www.uniprot.org/uniprot/testbase"},{"prefix":"UniProtKB","uri":"https://www.uniprot.org/uniprot/"},{"prefix":"uniprot","uri":"https://www.uniprot.org/uniprotkb/"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}

    2_test

    {"project":"2_test","denotations":[{"id":"32269766-30357391-30420970","span":{"begin":157,"end":158},"obj":"30357391"},{"id":"32269766-30144804-30420971","span":{"begin":4037,"end":4038},"obj":"30144804"},{"id":"32269766-28978689-30420972","span":{"begin":7164,"end":7165},"obj":"28978689"},{"id":"32269766-31695703-30420973","span":{"begin":9612,"end":9613},"obj":"31695703"},{"id":"32269766-31695703-30420974","span":{"begin":10505,"end":10506},"obj":"31695703"},{"id":"32269766-1709722-30420975","span":{"begin":12090,"end":12091},"obj":"1709722"}],"text":"Results\n\nIdentification of 28 exact matches to SARS CoV immunogenic peptides by screening all epitopes deposited in IEDB\nWe collected all peptides in IEDB ( 3, as of 13-02-2020) reported positive in T cell assays and have human as the host organism. We then conducted a local sequence alignment of 10 2019-nCoV open reading frames (ORFs) against 35,225 IEDB peptides, and found 28 exact matches. Surprisingly, all identical hits (against peptides having sequence length greater than 3) were from SARS-CoV ( Table 1, Data Table 1 4). These peptides have been shown to bind various HLA alleles, although with higher tendency towards HLA-A:02:01, from both class I and class II, and can be target for CD8+ and CD4+ T cells respectively.\nTable 1. 28 2019-nCoV peptides having exact matches with immunogenic SARS-CoV peptides.\nIEDB.peptide 2019-nCoV.pattern Antigen.Name Allele.Name\nTLACFVLAAV TLACFVLAAV Membrane glycoprotein HLA-A *02:01\nAFFGMSRIGMEVTPSGTW AFFGMSRIGMEVTPSGTW N protein\nALNTPKDHI ALNTPKDHI Nucleoprotein HLA-A *02:01\nAQFAPSASAFFGMSR AQFAPSASAFFGMSR nucleocapsid protein HLA class II\nAQFAPSASAFFGMSRIGM AQFAPSASAFFGMSRIGM N protein\nGMSRIGMEV GMSRIGMEV Nucleoprotein HLA-A *02:01\nILLNKHIDA ILLNKHIDA Nucleoprotein HLA-A *02:01\nIRQGTDYKHWPQIAQFA IRQGTDYKHWPQIAQFA N protein\nKHWPQIAQFAPSASAFF KHWPQIAQFAPSASAFF N protein\nLALLLLDRL LALLLLDRL Nucleoprotein HLA-A *02:01\nLLLDRLNQL LLLDRLNQL Nucleoprotein HLA-A *02:01\nLLNKHIDAYKTFPPTEPK LLNKHIDAYKTFPPTEPK N protein\nLQLPQGTTL LQLPQGTTL Nucleoprotein HLA-A *02:01\nRRPQGLPNNTASWFT RRPQGLPNNTASWFT nucleocapsid protein HLA class I\nYKTFPPTEPKKDKKKK YKTFPPTEPKKDKKKK N protein\nILLNKHID ILLNKHID Nucleoprotein HLA-A *02:01\nMEVTPSGTWL MEVTPSGTWL nucleocapsid protein HLA-B *40:01\nALNTLVKQL ALNTLVKQL S protein HLA-A *02:01\nFIAGLIAIV FIAGLIAIV Spike glycoprotein precursor HLA-A2\nLITGRLQSL LITGRLQSL Spike glycoprotein precursor HLA-A2\nNLNESLIDL NLNESLIDL S protein HLA-A *02:01\nQALNTLVKQLSSNFGAI QALNTLVKQLSSNFGAI S protein HLA-DRB1 *04:01\nRLNEVAKNL RLNEVAKNL Spike glycoprotein precursor HLA-A *02:01\nVLNDILSRL VLNDILSRL S protein HLA-A *02:01\nVVFLHVTYV VVFLHVTYV Spike glycoprotein precursor HLA-A *02:01\nGAALQIPFAMQMAYRF GAALQIPFAMQMAYRF S protein HLA-DRA *01:01/DRB1 *07:01\nMAYRFNGIGVTQNVLY MAYRFNGIGVTQNVLY S protein HLA-DRB1 *04:01\nQLIRAAEIRASANLAATK QLIRAAEIRASANLAATK S protein HLA-DRB1 *04:01\n*SARS-CoV: Severe acute respiratory syndrome coronavirus\n\nIdentification of 22 2019-nCoV peptides with high degree of similarity to previously reported immunogenic viral peptides\nIn addition to 28 identical hits against SARS CoV, we observed a long tail in distribution of normalized alignment scores between 10 2019-nCoV ORFs and 35,225 IEDB peptides ( Figure 1A, Methods). We therefore set out to further investigate potential vaccine targets among highly similar sequences.\nFigure 1. 2019-nCoV peptides with high sequence similarity to immunogenic peptides in IEDB.\nA. Comparison of normalized sequence alignment score for peptides with exact and non-exact matches. B. Number of target peptides grouped by their source organism. The peptides having an exact sequence alignment with epitopes in IEDB had normalized alignment scores ranging from 4 to 6. Taking the normalized alignment score of exact matches as a reference, we extracted 2019-nCoV peptides having score greater or equal to 4. As illustrated in Figure 1A, we observed 45 and 11 peptides having normalized alignment score ≥ 4 and ≥ 5 respectively ( Figure 1A inset). The target peptides were originated from 10 different sources ( Figure 1B) where a total 36 peptides were derived from strains associated to SARS CoV. Of interest, we also observed 7 hits having high sequence similarity to targets from Homo sapiens.\nIn order to investigate the extent to which the difference between the source (2019-nCoV) and target (IEDB) peptides influences the immunogenicity of the source peptides we used a recently published immunogenicity model 5 to predict and compare the immunogenicity between the source and target peptides (Data Table 2 4).\nWe could see a similar (close to identical) immunogenicity scores for a number of IEDB and 2019-nCov peptides especially for those with high immunogenicity scores ( Figure 2). While all 48 can be potential targets, of particular interest were those having higher immunogenicity score than IEDB peptides. Here, we list 22 out of 48 2019-nCoV peptides that scored higher compared to their targets that have been characterized to be immunogenic ( Table 2). In this list 15 (68%) 2019-nCov peptides have a score higher than 0.5 whereas only 11(50%) of IEDB get a score immunogenicity score greater than 0.5.\nTable 2. List of 22 2019-nCoV peptides having a higher predicted immunogenicity score than their target peptides.\nIEDB.peptide 2019-nCoV.pattern IEDB.prob nCol.prob\nWYMWLGARY WYIWLG 0.999249 0.999441\nGLMWLSYFV GLMWLSYFI 0.995073 0.998216\nGLVFLCLQY GIVFMCVEY 0.98123 0.984127\nTWLTYHGAIKLDDKDPQFKDNVILL TWLTYTGAIKLDDKDPNFKDQVILL 0.925862 0.975242\nIGMEVTPSGTWLTYH IGMEVTPSGTWLTY 0.903518 0.919184\nGETALALLLLDRLNQ GDAALALLLLDRLNQ 0.853114 0.900655\nTPSGTWLTYHGAIKL TPSGTWLTYTGAIKL 0.620894 0.662417\nSIVAYTMSL SIIAYTMSL 0.589694 0.693763\nRRPQGLPNNIASWFT RRPQGLPNNTASWFT 0.533253 0.584355\nYNLKWN YNL-WN 0.520244 0.765309\nAGCLIGAEHVDTSYECDI AGCLIGAEHVNNSYECDI 0.503905 0.56813\nGFMKQYGECLGDINARDL GFIKQYGDCLGDIAARDL 0.471939 0.506817\nANKEGIVWVATEGAL ANKDGIIWVATEGAL 0.367723 0.404796\nWNPDDY WNADLY 0.355018 0.584726\nPDDYGG PDDFTG 0.334887 0.527287\nTWLTYHGAIKLDDKDPQF TWLTYTGAIKLDDKDPNF 0.27017 0.529675\nDEVNQI DEVRQI 0.18504 0.187797\nSSKRFQPFQQFGRDV SNKKFLPFQQFGRDI 0.098384 0.119472\nNHDSPDAEL NHTSPDVDL 0.067808 0.17889\nTKQYNVTQAF TKAYNVTQAF 0.054818 0.171488\nVKQMYKTPTLKYFGGFNF VKQIYKTPPIKDFGGFNF 0.018685 0.135681\nQKRTATKQYNVTQAF QKRTATKAYNVTQAF 0.004891 0.037776\nFigure 2. Predicted immunogenicity for IEDB immunogenic vs. 2019-nCoV peptides.\n2019-nCoV peptides having a high sequence similarity to immunogenic peptides and their targets were analysed for their immunogenicity potential by iPred algorithm. It is worth noting that in general predicting immunogenicity of given a peptide is challenging and not a fully solved problem, and therefore current models for predicting immunogenicity are suboptimal. iPred is also not an exception. In fact, we could see that a substantial number of IEDB immunogenic peptides were scored \u003c 0.5 (the threshold score used to classify immunogenic vs non-immunogenic). This led us to ask whether we can gather any other evidence of either immunogenicity or cross-reactivity.\n\nDe novo search of immunogenic peptides in 2019-nCoV proteome\nAs a complementary reciprocal approach, we conducted a de novo search of immunogenic peptides against the 2019-nCov proteome sequence. We scanned 9-mers from 2019-nCoV proteome with a window of 9 amino acids and step length of 1 amino acid (9613 in total). The immunogenicity of 9-mer peptides were predicted using iPred and MHC presentation scores were gauged using NetMHCpan 4.0 6 for various HLA types. In this task, we focused on haplotypes common in Chinese and European populations, which include HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles (Data Table 3 4).\nBased on MHC presentation and immunogenicity prediction, we detected 5 peptides predicted to bind 4 different HLA alleles of which 2 had strong immunogenicity scores ( Figure 3). For those 65 strong binders to 3 different HLA types, 39 had immunogenicity scores ≥ 0.5 ( Table 3). Collectively this analysis suggests a number of 9-mer immunogenic candidates for further experimental validation.\nTable 3. 2019-nCoV 9-mer peptides predicted to bind 4 different HLA alleles by NetMHCpan 4.0, and those predicted to bind ≥ 3 HLA alleles and immunogenicity score ≥ 0.9 by iPred.\nFor different alleles, 0 denotes non-binding and 1 denotes binding predicted for specific HLA allele.\nAntigen.epitope Imm.prob A0101.NB A0201.NB B0702.NB B4001.NB C0702.NB Total binding HLA\nVQMAPISAM 0.893938 0 1 1 1 1 4\nAMYTPHTVL 0.862427 0 1 1 1 1 4\nTLDSKTQSL 0.254998 1 1 1 0 1 4\nKVDGVVQQL 0.191786 1 1 1 0 1 4\nKVDGVDVEL 0.18632 1 1 1 0 1 4\nMADQAMTQM 0.991227 1 0 1 0 1 3\nLEAPFLYLY 0.983072 1 0 0 1 1 3\nRTAPHGHVM 0.972153 1 0 1 0 1 3\nIPFAMQMAY 0.961569 1 0 1 0 1 3\nFLTENLLLY 0.951715 1 1 0 0 1 3\nYLQPRTFLL 0.947743 1 1 0 0 1 3\nMMISAGFSL 0.941318 0 1 1 0 1 3\nATLPKGIMM 0.926603 1 0 1 0 1 3\nFigure 3. De novo search of 9-mer 2019-nCoV peptides with MHC presentation and immunogenicity potential.\nThe MHC binding was predicted for HLA-A*02:01, HLA-A*01:01, HLA-B*07:02, HLA-B*40:01 and HLA-C*07:02 alleles by NetMHCpan 4.0 and immunogenicity was predicted by iPred.\n\nImmunogenicity of 2019-nCoV peptides to 1G4 CD8+ TCR molecule\nWhile our de novo candidates are appealing shortlisted targets for experimental validation, it does not provide information about target T cell receptors (TCRs). We therefore set out to interrogate the possibility of cross reactivity with one well-studied TCR.\nT cell cross-reactivity has been instrumental for the T cell immunity against both tumor antigens and external pathogens. In that regard, a number of T cells have been extensively characterized including 1G4 CD8+ TCR, which is known to recognize the ‘SLLMWITQC’ peptide presented by HLA-A*02:01. We therefore set out to leverage the data from a recently published study 7 and exploit the possibility of cross reactivity of this TCR to any 2019-nCoV peptide.\nHere, we scanned all 9-mers from the 2019-nCoV proteome (9613 peptides) with Binding, Activating and Killing Position Weight Matrices (PWM, see the method section) and associated each peptide with the geometric mean of these three assays as a measure of immunogenicity (Data Table 4 4). The distributions of binding, activation and killing scores along with their multiplicative score and geometric mean are illustrated in Figure 4. Based on geometric mean, we observed 20 2019-nCoV peptides with a score \u003e 0.8 and 516 peptides \u003e 0.7. The 9-mer peptides with geometric mean \u003e 0.7 and positive HLA-A*02:01 binding prediction by NetMHCpan 4.0 are listed in Table 4.\nFigure 4. Distribution of 1G4 TCR positional weight matrix scores for 2019-nCoV peptides.\nThe positional weight matrices were obtained from 7 and 9613 9-mers generated from 10 2019-nCoV ORFs were computed for their TCR recognition potential.\nTable 4. 2019-nCoV 9-mer peptides with geometric mean ≥ 0.7 by 1G4 TCR positional weight matrix and predicted positive to bind HLA-A*02:01 by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nRIMTWLDMV 0.866377428 0.853995 0.776303 0.831249 0.3481 SB\nALNTLVKQL 0.802453741 0.75073 0.785957 0.779413 0.6159 WB\nLLLDRLNQL 0.809895414 0.7752 0.741096 0.774888 0.0423 SB\nMIAQYTSAL 0.766262499 0.789511 0.749477 0.768242 0.9238 WB\nVLSTFISAA 0.799672451 0.756117 0.687278 0.746239 0.536 WB\nNVLAWLYAA 0.761297552 0.686117 0.739944 0.728423 1.4457 WB\nRLANECAQV 0.783161706 0.719705 0.680504 0.726572 0.2049 SB\nKLLKSIAAT 0.748896679 0.708996 0.697463 0.718118 1.0923 WB\nQLSLPVLQV 0.70128376 0.715259 0.708405 0.708293 0.4768 SB\nVQMAPISAM 0.729320768 0.698514 0.689612 0.705612 1.4677 WB\nLLLTILTSL 0.7131709 0.715194 0.680064 0.702623 0.2712 SB\nSVLLFLAFV 0.736972762 0.690855 0.679534 0.70202 1.1449 WB\nLMWLIINLV 0.727847374 0.681119 0.694007 0.700717 1.304 WB We further analysed the MHC binding propensities and gathered peptides not only predicted positive by NetMHCpan but also to have leucine (L) and valine (V) in anchor positions 2 (P2) and 9 (P9) respectively. Previous studies have shown that for MHC-I HLA-A02:01 specific peptides, 9-mer peptides with leucine at P2 and valine at P9 are preferably presented on the surface of HLA-A02:01 8. Looking at the LV peptide, we identified 44 2019-nCoV peptides of which 2 peptides had immunogenicity score \u003e 0.7 and 12 peptides \u003e 0.6 ( Table 5). Thus, here we provide the list of peptides that are potential targets for 1G4 TCR recognition for subjects with HLA-A02:01 haplotype.\nTable 5. 2019-nCoV 9-mer peptides having leucine-valine in anchor positions.\nPeptides have geometric mean ≥ 0.6 and ≤ 0.7 (for those ≥ 0.7, refer to Table 4) by 1G4 TCR positional weight matrix and predicted positive for HLA-A*02:01 binding by NetMHCpan 4.0 (Rank = NetMHCpan rank).\nPeptide Binding score Activation score Killing score geoMean Rank Binder\nTLMNVLTLV 0.723687 0.658986 0.652178 0.677534 0.0444 SB\nQLEMELTPV 0.711291 0.651003 0.608605 0.655625 1.6769 WB\nMLAKALRKV 0.668756 0.610664 0.65968 0.645854 0.3524 SB\nGLFKDCSKV 0.675952 0.632375 0.594753 0.633494 0.2677 SB\nALSKGVHFV 0.652549 0.604952 0.586236 0.613954 0.0425 SB\nYLNTLTLAV 0.624147 0.610826 0.575445 0.603119 0.0453 SB"}