import pandas as pd
import numpy as np
import re
import sys
import operator
import collections
import os
# Read the tab-delimited UniProt proteome export into a DataFrame.
# NOTE(review): the variable is called `bioplex_interactions`, but the file it
# loads is 'Uniprot_Proteome.tsv' -- the name is kept because later cells
# refer to it; confirm whether a rename is wanted.
bioplex_interactions = pd.read_csv(
    filepath_or_buffer='Uniprot_Proteome.tsv',
    delimiter='\t',
)
# Bare expression: lets an interactive session / notebook echo the frame.
bioplex_interactions
Entry | Entry name | Status | Protein names | Gene names | Organism | Length | |
---|---|---|---|---|---|---|---|
0 | P78410 | BT3A2_HUMAN | reviewed | Butyrophilin subfamily 3 member A2 | BTN3A2 BT3.2 BTF3 BTF4 | Homo sapiens (Human) | 334 |
1 | Q8TDQ1 | CLM1_HUMAN | reviewed | CMRF35-like molecule 1 (CLM-1) (CD300 antigen-... | CD300LF CD300F CLM1 IGSF13 IREM1 NKIR UNQ3105/... | Homo sapiens (Human) | 290 |
2 | Q7Z624 | CMKMT_HUMAN | reviewed | Calmodulin-lysine N-methyltransferase (CLNMT) ... | CAMKMT C2orf34 CLNMT | Homo sapiens (Human) | 323 |
3 | O75208 | COQ9_HUMAN | reviewed | Ubiquinone biosynthesis protein COQ9, mitochon... | COQ9 C16orf49 HSPC326 PSEC0129 | Homo sapiens (Human) | 318 |
4 | Q8NEV1 | CSK23_HUMAN | reviewed | Casein kinase II subunit alpha 3 (CK II alpha ... | CSNK2A3 CSNK2A1P | Homo sapiens (Human) | 391 |
5 | P33681 | CD80_HUMAN | reviewed | T-lymphocyte activation antigen CD80 (Activati... | CD80 CD28LG CD28LG1 LAB7 | Homo sapiens (Human) | 288 |
6 | P02511 | CRYAB_HUMAN | reviewed | Alpha-crystallin B chain (Alpha(B)-crystallin)... | CRYAB CRYA2 HSPB5 | Homo sapiens (Human) | 175 |
7 | Q8N4T0 | CBPA6_HUMAN | reviewed | Carboxypeptidase A6 (EC 3.4.17.-) | CPA6 CPAH | Homo sapiens (Human) | 437 |
8 | P20933 | ASPG_HUMAN | reviewed | N(4)-(beta-N-acetylglucosaminyl)-L-asparaginas... | AGA | Homo sapiens (Human) | 346 |
9 | Q86VB7 | C163A_HUMAN | reviewed | Scavenger receptor cysteine-rich type 1 protei... | CD163 M130 | Homo sapiens (Human) | 1156 |
10 | P53420 | CO4A4_HUMAN | reviewed | Collagen alpha-4(IV) chain | COL4A4 | Homo sapiens (Human) | 1690 |
11 | A2IDD5 | CCD78_HUMAN | reviewed | Coiled-coil domain-containing protein 78 (hsCC... | CCDC78 C16orf25 JFP10 | Homo sapiens (Human) | 438 |
12 | Q02952 | AKA12_HUMAN | reviewed | A-kinase anchor protein 12 (AKAP-12) (A-kinase... | AKAP12 AKAP250 | Homo sapiens (Human) | 1782 |
13 | O15194 | CTDSL_HUMAN | reviewed | CTD small phosphatase-like protein (CTDSP-like... | CTDSPL C3orf8 NIF1 NIFL SCP3 YA22 | Homo sapiens (Human) | 276 |
14 | O14613 | BORG1_HUMAN | reviewed | Cdc42 effector protein 2 (Binder of Rho GTPase... | CDC42EP2 BORG1 CEP2 | Homo sapiens (Human) | 210 |
15 | P30260 | CDC27_HUMAN | reviewed | Cell division cycle protein 27 homolog (Anapha... | CDC27 ANAPC3 D0S1430E D17S978E | Homo sapiens (Human) | 824 |
16 | O75175 | CNOT3_HUMAN | reviewed | CCR4-NOT transcription complex subunit 3 (CCR4... | CNOT3 KIAA0691 LENG2 NOT3 | Homo sapiens (Human) | 753 |
17 | Q16611 | BAK_HUMAN | reviewed | Bcl-2 homologous antagonist/killer (Apoptosis ... | BAK1 BAK BCL2L7 CDN1 | Homo sapiens (Human) | 211 |
18 | Q07065 | CKAP4_HUMAN | reviewed | Cytoskeleton-associated protein 4 (63-kDa cyto... | CKAP4 | Homo sapiens (Human) | 602 |
19 | Q96B67 | ARRD3_HUMAN | reviewed | Arrestin domain-containing protein 3 (TBP-2-li... | ARRDC3 KIAA1376 | Homo sapiens (Human) | 414 |
20 | Q15327 | ANKR1_HUMAN | reviewed | Ankyrin repeat domain-containing protein 1 (Ca... | ANKRD1 C193 CARP HA1A2 | Homo sapiens (Human) | 319 |
21 | Q99653 | CHP1_HUMAN | reviewed | Calcineurin B homologous protein 1 (Calcineuri... | CHP1 CHP | Homo sapiens (Human) | 195 |
22 | P0CG37 | CFC1_HUMAN | reviewed | Cryptic protein (Cryptic family protein 1) | CFC1 | Homo sapiens (Human) | 223 |
23 | P17544 | ATF7_HUMAN | reviewed | Cyclic AMP-dependent transcription factor ATF-... | ATF7 ATFA | Homo sapiens (Human) | 494 |
24 | Q8N5B7 | CERS5_HUMAN | reviewed | Ceramide synthase 5 (CerS5) (EC 2.3.1.-) (LAG1... | CERS5 LASS5 | Homo sapiens (Human) | 392 |
25 | Q6ZMG9 | CERS6_HUMAN | reviewed | Ceramide synthase 6 (CerS6) (EC 2.3.1.-) (LAG1... | CERS6 LASS6 | Homo sapiens (Human) | 384 |
26 | A0A1B0GW15 | A0A1B0GW15_HUMAN | unreviewed | Uncharacterized protein | NaN | Homo sapiens (Human) | 77 |
27 | A0A0A0MRX4 | A0A0A0MRX4_HUMAN | unreviewed | Ral guanine nucleotide dissociation stimulator... | RGL3 | Homo sapiens (Human) | 710 |
28 | F5H052 | F5H052_HUMAN | unreviewed | Armadillo repeat-containing protein 6 (Fragment) | ARMC6 | Homo sapiens (Human) | 103 |
29 | B1AMT0 | B1AMT0_HUMAN | unreviewed | Cohesin subunit SA-2 (Fragment) | STAG2 | Homo sapiens (Human) | 115 |
... | ... | ... | ... | ... | ... | ... | ... |
74004 | O14775 | GNB5_HUMAN | reviewed | Guanine nucleotide-binding protein subunit bet... | GNB5 | Homo sapiens (Human) | 395 |
74005 | O43716 | GATC_HUMAN | reviewed | Glutamyl-tRNA(Gln) amidotransferase subunit C,... | GATC 15E1.2 | Homo sapiens (Human) | 136 |
74006 | P03372 | ESR1_HUMAN | reviewed | Estrogen receptor (ER) (ER-alpha) (Estradiol r... | ESR1 ESR NR3A1 | Homo sapiens (Human) | 595 |
74007 | Q6NT32 | EST5A_HUMAN | reviewed | Carboxylesterase 5A (EC 3.1.1.1) (Carboxyleste... | CES5A CES7 | Homo sapiens (Human) | 575 |
74008 | P30793 | GCH1_HUMAN | reviewed | GTP cyclohydrolase 1 (EC 3.5.4.16) (GTP cycloh... | GCH1 DYT5 GCH | Homo sapiens (Human) | 250 |
74009 | Q9HAH7 | FBRS_HUMAN | reviewed | Probable fibrosin-1 | FBRS FBS FBS1 | Homo sapiens (Human) | 460 |
74010 | O00461 | GOLI4_HUMAN | reviewed | Golgi integral membrane protein 4 (Golgi integ... | GOLIM4 GIMPC GOLPH4 GPP130 | Homo sapiens (Human) | 696 |
74011 | Q9UI32 | GLSL_HUMAN | reviewed | Glutaminase liver isoform, mitochondrial (GLS)... | GLS2 GA | Homo sapiens (Human) | 602 |
74012 | Q9UBI6 | GBG12_HUMAN | reviewed | Guanine nucleotide-binding protein G(I)/G(S)/G... | GNG12 | Homo sapiens (Human) | 72 |
74013 | P63215 | GBG3_HUMAN | reviewed | Guanine nucleotide-binding protein G(I)/G(S)/G... | GNG3 GNGT3 | Homo sapiens (Human) | 75 |
74014 | Q8WUU5 | GATD1_HUMAN | reviewed | GATA zinc finger domain-containing protein 1 (... | GATAD1 ODAG | Homo sapiens (Human) | 269 |
74015 | Q8NBI3 | DRAXI_HUMAN | reviewed | Draxin (Dorsal inhibitory axon guidance protei... | DRAXIN C1orf187 PSEC0258 UNQ3119/PRO10268 | Homo sapiens (Human) | 349 |
74016 | Q8IUC8 | GLT13_HUMAN | reviewed | Polypeptide N-acetylgalactosaminyltransferase ... | GALNT13 KIAA1918 | Homo sapiens (Human) | 556 |
74017 | Q7Z2K6 | ERMP1_HUMAN | reviewed | Endoplasmic reticulum metallopeptidase 1 (EC 3... | ERMP1 FXNA KIAA1815 | Homo sapiens (Human) | 904 |
74018 | Q9UM22 | EPDR1_HUMAN | reviewed | Mammalian ependymin-related protein 1 (MERP-1)... | EPDR1 MERP1 UCC1 | Homo sapiens (Human) | 224 |
74019 | P05160 | F13B_HUMAN | reviewed | Coagulation factor XIII B chain (Fibrin-stabil... | F13B | Homo sapiens (Human) | 661 |
74020 | P37059 | DHB2_HUMAN | reviewed | Estradiol 17-beta-dehydrogenase 2 (EC 1.1.1.62... | HSD17B2 EDH17B2 SDR9C2 | Homo sapiens (Human) | 387 |
74021 | A8K855 | EFCB7_HUMAN | reviewed | EF-hand calcium-binding domain-containing prot... | EFCAB7 KIAA1799 | Homo sapiens (Human) | 629 |
74022 | Q16099 | GRIK4_HUMAN | reviewed | Glutamate receptor ionotropic, kainate 4 (GluK... | GRIK4 GRIK | Homo sapiens (Human) | 956 |
74023 | P0DPD8 | EFCE2_HUMAN | reviewed | EEF1AKMT4-ECE2 readthrough transcript protein ... | EEF1AKMT4-ECE2 | Homo sapiens (Human) | 883 |
74024 | P56937 | DHB7_HUMAN | reviewed | 3-keto-steroid reductase (EC 1.1.1.270) (17-be... | HSD17B7 SDR37C1 UNQ2563/PRO6243 | Homo sapiens (Human) | 341 |
74025 | Q9NYF3 | FA53C_HUMAN | reviewed | Protein FAM53C | FAM53C C5orf6 | Homo sapiens (Human) | 392 |
74026 | Q6UY11 | DLK2_HUMAN | reviewed | Protein delta homolog 2 (DLK-2) (Epidermal gro... | DLK2 EGFL9 UNQ2903/PRO28633 | Homo sapiens (Human) | 383 |
74027 | Q99504 | EYA3_HUMAN | reviewed | Eyes absent homolog 3 (EC 3.1.3.48) | EYA3 | Homo sapiens (Human) | 573 |
74028 | Q01459 | DIAC_HUMAN | reviewed | Di-N-acetylchitobiase (EC 3.2.1.-) | CTBS CTB | Homo sapiens (Human) | 385 |
74029 | O60610 | DIAP1_HUMAN | reviewed | Protein diaphanous homolog 1 (Diaphanous-relat... | DIAPH1 DIAP1 | Homo sapiens (Human) | 1272 |
74030 | O60269 | GRIN2_HUMAN | reviewed | G protein-regulated inducer of neurite outgrow... | GPRIN2 KIAA0514 | Homo sapiens (Human) | 458 |
74031 | Q6P3S1 | DEN1B_HUMAN | reviewed | DENN domain-containing protein 1B (Connecdenn ... | DENND1B C1orf218 FAM31B | Homo sapiens (Human) | 775 |
74032 | P09958 | FURIN_HUMAN | reviewed | Furin (EC 3.4.21.75) (Dibasic-processing enzym... | FURIN FUR PACE PCSK3 | Homo sapiens (Human) | 794 |
74033 | Q8IUX8 | EGFL6_HUMAN | reviewed | Epidermal growth factor-like protein 6 (EGF-li... | EGFL6 MAEG PP648 UNQ281/PRO320 | Homo sapiens (Human) | 553 |
74034 rows × 7 columns
# Build `prot_list`: every distinct token found in the space-separated
# 'Gene names' column of `bioplex_interactions`, kept in order of first
# appearance.
#
# Rows whose 'Gene names' value is missing are skipped, so the literal string
# 'nan' (what str() yields for a missing value) never enters the list.
#
# A dict is used as an insertion-ordered set: each membership check is O(1),
# instead of rescanning an ever-growing list for every token.
seen_gene_names = {}
for gene_field in bioplex_interactions['Gene names'].dropna():
    # split() with no argument also discards the empty tokens that
    # split(' ') would emit for repeated or leading/trailing whitespace.
    for gene_name in str(gene_field).split():
        seen_gene_names.setdefault(gene_name, None)
prot_list = list(seen_gene_names)
# Bare expression: lets an interactive session / notebook echo the list.
prot_list
['BTN3A2', 'BT3.2', 'BTF3', 'BTF4', 'CD300LF', 'CD300F', 'CLM1', 'IGSF13', 'IREM1', 'NKIR', 'UNQ3105/PRO10111', 'CAMKMT', 'C2orf34', 'CLNMT', 'COQ9', 'C16orf49', 'HSPC326', 'PSEC0129', 'CSNK2A3', 'CSNK2A1P', 'CD80', 'CD28LG', 'CD28LG1', 'LAB7', 'CRYAB', 'CRYA2', 'HSPB5', 'CPA6', 'CPAH', 'AGA', 'CD163', 'M130', 'COL4A4', 'CCDC78', 'C16orf25', 'JFP10', 'AKAP12', 'AKAP250', 'CTDSPL', 'C3orf8', 'NIF1', 'NIFL', 'SCP3', 'YA22', 'CDC42EP2', 'BORG1', 'CEP2', 'CDC27', 'ANAPC3', 'D0S1430E', 'D17S978E', 'CNOT3', 'KIAA0691', 'LENG2', 'NOT3', 'BAK1', 'BAK', 'BCL2L7', 'CDN1', 'CKAP4', 'ARRDC3', 'KIAA1376', 'ANKRD1', 'C193', 'CARP', 'HA1A2', 'CHP1', 'CHP', 'CFC1', 'ATF7', 'ATFA', 'CERS5', 'LASS5', 'CERS6', 'LASS6', 'nan', 'RGL3', 'ARMC6', 'STAG2', 'CACNA1D', 'GPRC5B', 'KCNMA1', 'MICALL1', 'KCNT1', 'ZNF433', 'MDN1', 'FANCA', 'ZNF236', 'MADCAM1', 'TJP3', 'DCC', 'SNX6', 'GPS2', 'SELENBP1', 'DPY19L2', 'EXOC3L2', 'LGALS1', 'FGF13', 'PSG5', 'BEST3', 'CSNK2A1', 'ATG16L2', 'GIT1', 'PARP8', 'HPSE2', 'GMPR2', 'NUP107', 'ZNF467', 'LRP2BP', 'GALK1', 'NT5C3A', 'LETM2', 'COBLL1', 'USP14', 'DEPDC4', 'PIGT', 'SMYD4', 'SLC37A3', 'MAPK10', 'ARPP21', 'STIM2', 'SLC25A29', 'SH2D4A', 'FBXL5', 'APOC1', 'C1orf167', 'ZNF10', 'LGR4', 'RCN2', 'DHX36', 'DIABLO', 'LRRK2', 'CS', 'ZNF816', 'ADGRG1', 'KCNN3', 'DDX3X', 'RHBDF2', 'NAA38', 'PSMC3', 'MCIDAS', 'PRAMEF9', 'EXT2', 'RPS6KA5', 'PIGQ', 'MBP', 'TXNDC9', 'SREBF2', 'YIF1B', 'TRAJ33', 'SLC46A2', 'TMEM248', 'ANKRD12', 'PEG3', 'HBP1', 'RNF123', 'PHACTR4', 'USP17L19', 'RAB5A', 'SHPRH', 'HLA-DMA', 'CAMK2D', 'USE1', 'RFX2', 'RFX4', 'ZNF683', 'MBD6', 'NDRG4', 'CNTRL', 'CASP7', 'KIF1B', 'DIRAS2', 'ADD1', 'C6orf52', 'MOK', 'MEIS2', 'DNMBP', 'LSM7', 'CEP126', 'FAM13A', 'TUBB3', 'SNX1', 'PRXL2B', 'ATXN2L', 'SEPTIN9', 'ARHGAP17', 'LMAN1L', 'SWI5', 'LILRB2', 'CTNND2', 'PIAS3', 'LPCAT4', 'EFEMP2', 'PRKCSH', 'BNIP3L', 'BAIAP3', 'SEPTIN8', 'MPHOSPH9', 'PDE4DIP', 'ACTN2', 'ATP6V1D', 'TRIM73', 'ELOB', 'SLC12A4', 'ST6GALNAC2', 'TNK1', 'RABEP2', 'CRYBG1', 'SCN2A', 'DCTN5', 
'TMC3', 'POLR2J2', 'ITPKC', 'RUFY1', 'INSIG2', 'IQGAP2', 'PYCR1', 'SLC12A5', 'TSPAN11', 'FBXL15', 'LIPC', 'MON2', 'RANBP3', 'HMCN1', 'DMRTC1B', 'ETS2', 'NCF2', 'TK1', 'SPINT2', 'NCBP3', 'TMCO6', 'NDUFV1', 'LSM14B', 'CIZ1', 'KDM8', 'NIFK', 'RMND5B', 'VEPH1', 'MRPL15', 'SALL3', 'ARHGAP21', 'ANTKMT', 'SLC8B1', 'DEPDC1B', 'PHF20', 'WAC', 'FAM118B', 'CYP26B1', 'NUSAP1', 'MANEAL', 'TFAP2A', 'RAB11A', 'GLT8D1', 'MIB2', 'PRPF39', 'RALB', 'CD74', 'RETREG3', 'LPIN1', 'KLHL22', 'HBS1L', 'SLC22A31', 'TATDN3', 'RPS27L', 'NFE2L1', 'PDE4C', 'SIAH1', 'APBB2', 'ELF2', 'BRWD1', 'SLC2A1', 'CCDC32', 'FCGRT', 'ANKRD44', 'MYRIP', 'C11orf88', 'MTHFD2L', 'NDEL1', 'RNF5', 'HNRNPM', 'REXO5', 'GCSH', 'TM7SF2', 'ARMC5', 'ESYT1', 'DEF8', 'TROAP', 'PAK1', 'G2E3', 'KIF25', 'SPAG5', 'GAS8', 'MAG', 'MTERF3', 'BTN2A2', 'ANKRD46', 'ADGRL3', 'TAOK3', 'PEX16', 'ICAM2', 'ABCE1', 'DDX56', 'NTHL1', 'SAMD11', 'ABI3BP', 'ZFR', 'RASSF8', 'ARHGEF28', 'MSL1', 'ACTN4', 'PCCB', 'EIF3L', 'CCDC181', 'TBCK', 'CNRIP1', 'KAT5', 'AGAP2', 'TADA2A', 'ECH1', 'GSPT1', 'PCNX2', 'TPST1', 'CECR2', 'POU2F2', 'DMTF1', 'LRRCC1', 'HPGD', 'USP40', 'PTDSS2', 'KLKB1', 'AGBL5', 'ZNF491', 'TMBIM4', 'MAP4K3', 'EMC9', 'NTM', 'TCF4', 'GCHFR', 'AP4M1', 'LMNTD2', 'PHF1', 'ELOC', 'FCHSD2', 'KRIT1', 'ARHGAP8', 'POTEE', 'ARHGEF2', 'TUBA1A', 'UQCC2', 'VGLL4', 'FMR1', 'MED24', 'FLNA', 'RPS6KC1', 'TMEM161B', 'ANXA11', 'RBPJ', 'TSTD2', 'CDK5RAP3', 'PHF19', 'LRRC8D', 'ATM', 'ADGRV1', 'U2SURP', 'PICK1', 'HEATR6', 'PLSCR1', 'RBBP8', 'ILVBL', 'CD22', 'CNDP2', 'JADE1', 'APLP1', 'CEP57L1', 'ANXA6', 'TTYH1', 'HNRNPH1', 'NME4', 'ZCRB1', 'BCAS3', 'MPND', 'CUL3', 'CTDNEP1', 'MYO18A', 'BTBD2', 'DXO', 'ZNF189', 'DNAH7', 'CHID1', 'NHP2', 'CARF', 'GPRC5A', 'LRIG3', 'ZDHHC23', 'NLRP2', 'VIM', 'OSBPL9', 'NSD3', 'PMS1', 'CAPN5', 'CXorf40A', 'TCAIM', 'ZSCAN32', 'C1QTNF7', 'ACSM2A', 'PRRG3', 'TFG', 'HELZ', 'TTLL3', 'CCDC88A', 'RPS3', 'LMBR1L', 'OCIAD1', 'PCYT1B', 'IPPK', 'ARPC1B', 'CD82', 'CFTR', 'C17orf50', 'PKLR', 'EVC', 'KIRREL2', 'PAH', 'MAGEA2B', 'BAZ2B', 
'ANPEP', 'SPATS2', 'MPV17', 'ZCCHC8', 'ZFYVE19', 'PDGFC', 'ACP5', 'COMMD3', 'CTC1', 'TRAIP', 'PDE4D', 'CES4A', 'C10orf90', 'CMIP', 'DDX42', 'CCHCR1', 'CLPP', 'DGLUCY', 'TBC1D25', 'PLCB1', 'FMO3', 'STARD10', 'TASOR2', 'MMAB', 'PSEN1', 'CENPX', 'RRAS2', 'IL17RC', 'L3HYPDH', 'NFIA', 'SPECC1L', 'TP53', 'DPP8', 'SULT1C2', 'KANSL2', 'NRXN1', 'DCTN4', 'SUN3', 'SPIRE1', 'SLC7A6OS', 'IL17RE', 'GID4', 'MAX', 'OCIAD2', 'ALMS1', 'CEP128', 'ERBB4', 'IQCJ-SCHIP1', 'XPO6', 'GATB', 'ZNF134', 'ST6GAL1', 'NFIB', 'SHF', 'ACKR2', 'BLVRB', 'FBXO15', 'RAB2A', 'CFAP99', 'MAP3K12', 'MCCC2', 'EIF4A2', 'DNAJC18', 'PTGER3', 'PLEC', 'IZUMO3', 'RGR', 'NME7', 'KDM4C', 'EYA1', 'ITGA3', 'ATP9B', 'MTMR14', 'CBX1', 'EIF2A', 'SNTG1', 'DDX60L', 'RABGGTA', 'PUS1', 'VPS35L', 'YTHDF1', 'KLK1', 'HERC3', 'GLYATL1', 'LAMTOR1', 'THAP9', 'IFIH1', 'AXDND1', 'KCTD17', 'CEP95', 'PIEZO2', 'CFB', 'METRN', 'ANTXR2', 'SKAP1', 'LPP', 'SLC38A5', 'PRKD1', 'CPE', 'RANBP6', 'GABRA2', 'MSRA', 'TYK2', 'EPHA10', 'PACS1', 'TTC12', 'EXOSC4', 'ZNF81', 'ZNF28', 'PSG6', 'BANP', 'COX5A', 'RCOR3', 'FAM49B', 'MKNK2', 'TAF1C', 'UBC', 'C11orf80', 'CTU2', 'NCS2', 'DIO2', 'CD6', 'PAMR1', 'TMEM130', 'FTO', 'HEATR9', 'ICE2', 'APEH', 'HLA-DQB1', 'CBWD6', 'IGLJ5', 'PHF12', 'ALDOC', 'ENO3', 'CRYZ', 'RELL2', 'ADAM22', 'ZNF737', 'CDH23', 'ZFR2', 'GRIP1', 'MED1', 'PLEKHB1', 'DDI2', 'MAP4K4', 'GAL3ST1', 'MCTP1', 'ZNF562', 'CLTC', 'TFEB', 'PRPSAP2', 'RALA', 'GABRB3', 'PSG7', 'NCOA7', 'VMP1', 'C19orf25', 'STMN4', 'ANKRD13D', 'PITX1', 'IGSF9B', 'ARHGAP1', 'BECN1', 'ZNF277', 'ECHDC1', 'SETD1A', 'PBK', 'KLRC2', 'AP2A1', 'EIF3M', 'PPP4R1', 'EEF1A1', 'C3orf49', 'ETNK2', 'EXOSC2', 'SMPD4', 'BAG1', 'GFAP', 'TRPC3', 'RRBP1', 'REELD1', 'NEDD4L', 'UBIAD1', 'NPEPPS', 'CA10', 'BIRC5', 'DBNL', 'NACA', 'EIF3H', 'ZNF43', 'THOC2', 'DUSP15', 'KIAA1614', 'EPN3', 'KIR3DL1', 'PIGG', 'TSKU', 'PCYOX1', 'PCSK5', 'ACSM2B', 'WFS1', 'UBA1', 'RNF167', 'RAD51AP1', 'ST6GALNAC4', 'AP1G1', 'C2CD3', 'DMKN', 'RNASE11', 'CCDC110', 'DOCK10', 'GNPTAB', 'MDH1', 'RAB35', 'WDR48', 
'TSC22D3', 'HP', 'TMC5', 'NSD2', 'LILRB5', 'PNPT1', 'PEX10', 'GAB4', 'NIPAL1', 'RAD54B', 'TM2D3', 'NFU1', 'PHGDH', 'NRG1', 'CHTOP', 'ZNF207', 'RNF166', 'MYBPC1', 'ZBTB38', 'TRAK1', 'GIGYF2', 'CACNB4', 'DECR1', 'ABCC9', 'ACSL6', 'FANCB', 'GTF2IRD2B', 'GTF2IRD2', 'CRYZL1', 'OR51C1P', 'hCG_1685829', 'SLC19A1', 'PDCD6', 'MED25', 'MKS1', 'TBC1D3F', 'C8B', 'TXNDC15', 'TMEM262', 'EEF1A2', 'LRR1', 'PPIL5', 'hCG_1640043', 'FAM92A', 'TMEM179', 'ECM2', 'TOGARAM1', 'KIAA0423', 'hCG_20876', 'MYT1L', 'HECW2', 'NR1I3', 'CD3G', 'PLAC8', 'hCG_1782057', 'CHD1L', 'RERE', 'hCG_2008872', 'DPF1', 'NME6', 'MLLT6', 'ACAA1', 'NIF3L1', 'MAN2C1', 'MYB', 'c-myb', 'hCG_32380', 'LPAR1', 'TCF3', 'AKAP9', 'hCG_1812018', 'MAJIN', 'GUSB', 'LMO3', 'C12orf57', 'VPS26C', 'CALB1', 'MTA3', 'hCG_1783907', 'NUP42', 'CDHR1', 'AUTS2', 'COPE', 'hCG_2001439', 'RIN3', 'hCG_2029104', 'TSC2', 'FCHSD1', 'MARS', 'TRIM59', 'FBXL12', 'KRT85', 'MARF1', 'TCF7L2', 'hCG_40998', 'ITSN1', 'KAT6B', 'GTF2H1', 'BTNL8', 'RNF32', 'ATP5F1B', 'KIR3DL2', 'ELAVL4', 'SERAC1', 'PPT2', 'EPB41', 'CD48', 'HIST2H3PS2', 'RP5-998N21.6-001', 'TRPM2', 'CPT1B', 'DEK', 'ETFBKMT', 'MGC50559', 'hCG_39178', 'MED22', 'RP11-244N20.9-005', 'FXYD6', 'PLXNC1', 'KRT23', 'DKFZp434G032', 'STRADB', 'CRISP3', 'SLC39A13', 'hCG_1730570', 'SLC39A11', 'OLFM1', 'GORASP1', 'GGNBP2', 'CCDC25', 'SPEG', 'APEG1', 'hCG_2012857', 'DAOA', 'EGLN2', 'ARHGAP33', 'FAM122C', 'MTHFR', 'MICAL2', 'DEDD', 'hCG_20845', 'ACD', 'NARF', 'SCNN1B', 'TMPRSS4', 'hCG_41152', 'MSR1', 'GPATCH4', 'SPATA24', 'SHKBP1', 'MRTFA', 'MKL1', 'hCG_41119', 'ZNF575', 'CCDC136', 'EPHA5', 'hCG_1810817', 'VPS35', 'ABHD11', 'PNLIPRP1', 'L3MBTL1', 'VARS2', 'ZKSCAN7', 'DUSP18', 'hCG_24790', 'TIMMDC1', 'C3orf1', 'hCG_1780137', 'VRK3', 'HDAC9', 'NTMT1', 'SLC38A7', 'ABCA2', 'MPP6', 'FBXL2', 'SF3A1', 'TMEM62', 'CDH16', 'HLA-DMB', 'IPO8', 'GABRD', 'PUS7L', 'NPIPB3', 'CERCAM', 'IL4I1', 'ARHGAP28', 'NRXN2', 'hCG_1810991', 'RANBP17', 'ARFGAP2', 'DNAAF3', 'TTC9C', 'PPP2R1A', 'WDR18', 'CYP19A1', 'MRC2', 'MAGI2', 
'PSMG2', 'ALDH3A1', 'ANXA2', 'SLC30A7', 'STAT4', 'CHGB', 'PPP5C', 'DNAJC7', 'HNRNPC', 'ZNF112', 'MYO6', 'DMRTC2', 'NNAT', 'IPCEF1', 'NID2', 'MSL2', 'RBSN', 'SIGIRR', 'OPALIN', 'CITED2', 'PAK6', 'ALG11', 'APOOL', 'SENP2', 'ZCWPW2', 'PALM2', 'NDRG2', 'TRMU', 'NAPG', 'SNX16', 'SERPINI1', 'EIF4G2', 'FADS1', 'WDR97', 'CSNK1G1', 'TMPRSS13', 'CHRNA5', 'CYP2J2', 'SYNE1', 'HYAL4', 'CCNG2', 'GLRA1', 'FAM72A', 'PITX2', 'GLI3', 'AMT', 'FRMPD2', 'C3orf67', 'CCAR1', 'SULF1', 'PLK1', 'FARSA', 'MED15', 'IGKV1OR2-108', 'TBCE', 'FAM107B', 'LARP1B', 'TENM3', 'DLG1', 'NUDCD2', 'MYO5A', 'ASF1B', 'CA11', 'CRYGN', 'WNK2', 'COPS6', 'PUM2', 'PDE6D', 'ARHGAP4', 'DAB2', 'FKBP7', 'CASC3', 'NCK1', 'MLXIP', 'ALDH1L1', 'GALE', 'GLB1', 'PYM1', 'RNF214', 'RBM47', 'PUF60', 'AKAP13', 'KPNB1', 'TRAJ46', 'CCDC178', 'HAUS4', 'NDC80', 'SLC35B1', 'TMPRSS5', 'SERPING1', 'SAP30BP', 'MPDU1', 'GM2A', 'SLC20A1', 'NUCB2', 'NVL', 'ARHGEF10L', 'GC', 'CEP192', 'RHOH', 'N4BP2L1', 'PALM3', 'SNRNP70', 'NMNAT3', 'AMDHD1', 'PCYT1A', 'ZNF793', 'C4orf19', 'TACC1', 'VWDE', 'HLA-DPB1', 'ARPC1A', 'GALNS', 'TXNDC12', 'GNLY', 'PRDM16', 'CFLAR', 'ACTR6', 'RAB30', 'CPNE3', 'MUC1', 'FBXO22', 'CP', 'BET1L', 'RSRC1', 'ZNF175', 'SPECC1', 'FARS2', 'TTC32', 'COX7A2', 'RNPEPL1', 'RABEPK', 'BCL7C', 'UMODL1', 'PTPA', 'CYFIP2', 'BBX', 'GNAS', 'USP10', 'DCN', 'HSPA9', 'ZFAND2B', 'POLR3E', 'CTDP1', 'AP1S3', 'HLA-C', 'FAP', 'CMSS1', 'CARM1', 'RINL', 'FXR2', 'ST7', 'JADE3', 'EXOC7', 'HMGXB4', 'VPS33B', 'CPNE1', 'RAP1B', 'MACF1', 'CNPY2', 'CCDC97', 'IL16', 'CCDC106', ...]
# Report how many entries prot_list holds.
print(len(prot_list))
45637