Tim O'Donnell update validation results analysis  almost 8 years ago

Commit id: 1900edc1960fcd69c3155d56189b98f80234b3b9

deletions | additions      

       

"cells": [  {  "cell_type": "code",  "execution_count": 2, 4,  "metadata": {  "collapsed": false  }, 

"import fancyimpute, locale\n",  "\n",  "import sklearn.metrics\n",  "import sklearn.cross_validation" sklearn.cross_validation\n",  "\n",  "def print_full(x):\n",  " pandas.set_option('display.max_rows', len(x))\n",  " print(x)\n",  " pandas.reset_option('display.max_rows')"  ]  },  {  "cell_type": "code",  "execution_count": 5,  "metadata": {  "collapsed": true  },  "outputs": [],  "source": [  "max_ic50 = 50000\n",  "data_dir = \"../data/\""  ]  },  {  "cell_type": "code",  "execution_count": 6,  "metadata": {  "collapsed": false  },  "outputs": [],  "source": [  "all_train_data = mhcflurry.data.load_allele_datasets(data_dir + \"bdata.2009.mhci.public.1.txt\")"  ]  },  {  "cell_type": "code",  "execution_count": 7,  "metadata": {  "collapsed": true  },  "outputs": [],  "source": [  "def make_scores(ic50_y, ic50_y_pred, sample_weight=None, threshold_nm=500): \n",  " y_pred = mhcflurry.common.ic50_to_regression_target(ic50_y_pred, max_ic50)\n",  " try:\n",  " auc = sklearn.metrics.roc_auc_score(ic50_y <= threshold_nm, y_pred, sample_weight=sample_weight)\n",  " except ValueError:\n",  " auc = numpy.nan\n",  " try:\n",  " f1 = sklearn.metrics.f1_score(ic50_y <= threshold_nm, ic50_y_pred <= threshold_nm, sample_weight=sample_weight)\n",  " except ValueError:\n",  " f1 = numpy.nan\n",  " try:\n",  " tau = scipy.stats.kendalltau(ic50_y_pred, ic50_y)[0]\n",  " except ValueError:\n",  " tau = numpy.nan\n",  " \n",  " return dict(\n",  " auc=auc,\n",  " f1=f1,\n",  " tau=tau,\n",  " ) "  ]  },  {  "cell_type": "code",  "execution_count": 13, 8,  "metadata": {  "collapsed": false  }, 

" \n",  " \n",  " \n",  " activation\n",  " dropout_probability\n",  " embedding_output_dim\n",  " impute\n", 

" \n",  " \n",  " 0\n",  " tanh\n",  " 0.0\n",  " 32\n",  " False\n", 

" \n",  " \n",  " 1\n",  " tanh\n",  " 0.0\n",  " 8\n",  " False\n", 

" \n",  " \n",  " 2\n",  " tanh\n",  " 0.5\n",  " 32\n",  " False\n", 

" \n",  " \n",  " 3\n",  " tanh\n",  " 0.5\n",  " 8\n",  " False\n", 

" \n",  " \n",  " 4\n",  " tanh\n",  " 0.0\n",  " 32\n",  " True\n", 

" \n",  " \n",  " 5\n",  " tanh\n",  " 0.0\n",  " 8\n",  " True\n", 

" \n",  " \n",  " 6\n",  " tanh\n",  " 0.5\n",  " 32\n",  " True\n", 

" \n",  " \n",  " 7\n",  " tanh\n",  " 0.5\n",  " 8\n",  " True\n",  " [4]\n",  " 4\n",  " \n",  " \n",  "\n",  ""  ],  "text/plain": [ \n",  " activation dropout_probability embedding_output_dim impute layer_sizes \\\n",  "0 tanh 0.0 32 False [64] \n",  "1 tanh 0.0 8 False [4] \n",  "2 tanh 0.5 32 False [64] \n",  "3 tanh 0.5 8 False [4] \n",  "4 tanh 0.0 32 True [64] \n",  "5 tanh 0.0 8 True [4] \n",  "6 tanh 0.5 32 True [64] \n",  "7 tanh 0.5 8 True [4] \n",  "\n", 8\n",  " layer_size \n",  "0 64 \n",  "1 4 \n",  "2 64 \n",  "3 4 \n",  "4 64 \n",  "5 4 \n",  "6 64 \n",  "7 4 0.0\n",  " ]  },  "execution_count": 13,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "models = pandas.read_csv(\"../data/validation_models.csv\", converters={'layer_sizes': eval})\n",  "models[\"layer_size\"] = [x[0] for x in models.layer_sizes]\n",  "models"  ]  },  {  "cell_type": "code",  "execution_count": 20,  "metadata": {  "collapsed": false  },  "outputs": [  {  "data": {  "text/html": [  "
\n",  "\n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  "
32
False
[64]mhcflurry 0_aucmhcflurry 0_f1mhcflurry 0_taumhcflurry 1_aucmhcflurry 1_f1mhcflurry 1_taumhcflurry 2_aucmhcflurry 2_f1mhcflurry 2_taumhcflurry 3_auc...netmhc_f1netmhc_taunetmhcpan_aucnetmhcpan_f1netmhcpan_tausmmpmbec_cpp_aucsmmpmbec_cpp_f1smmpmbec_cpp_tautest_sizetrain_size64
allele90.08False[4]4
HLA-A0201100.8991230.50.837826320.554988False0.926853[64]0.8706710.6233140.9257130.8811670.6225570.913962...0.8843360.6354980.9304790.8809630.6373380.9273580.8851210.6262242126956564
HLA-A0301110.8915610.50.83423680.540025False0.922007[4]0.8921470.5958900.9233430.8794020.6025230.916512...0.9006210.6292360.9272870.8851060.6112400.9339660.8972750.61089181161414
HLA-A0201120.8991230.00.837826320.554988True0.926853[64]0.8706710.6233140.9257130.8811670.6225570.913962...0.8843360.6354980.9304790.8809630.6373380.9273580.8851210.6262242126956564
HLA-A0301130.8915610.00.83423680.540025True0.922007[4]0.8921470.5958900.9233430.8794020.6025230.916512...0.9006210.6292360.9272870.8851060.6112400.9339660.8972750.61089181161414
HLA-A2601140.9280840.50.580000320.432299True0.929260[64]0.5931030.4407220.9317600.5748990.4334370.923544...0.5411760.4366460.9422790.6400000.4516660.9273390.6030530.4229001333289464
HLA-B0801150.9426940.50.76293180.600817True0.949517[4]0.7735040.6203420.9482740.7785230.6164910.940561...0.7760530.6295190.9428220.7016710.6067620.9405550.7600000.61895394022674
HLA-B5101160.9330500.00.489796320.369192False0.939082[64]0.3913040.3693590.9481410.4047620.3823980.945669...0.4285710.3653070.9486950.6101690.4069730.9276210.3956040.344534854173464
HLA-B5701170.9142400.00.75000080.524933False0.916777[4]0.7402990.5352270.9228180.6708860.5453770.914248...0.7418400.4849750.8830770.6426230.4601330.9299230.7090910.56961581518574
HLA-B0702180.9049850.50.792711320.564505False0.915801[64]0.866525640.594497
0.909308
0.835526190.5872470.50.8980448False[4]4
200.032True[64]64
210.08True[4]4
220.532True[64]64
230.58True[4]4
240.032False[64]64
250.08False[4]4
260.532False[64]64
270.58False[4]4
280.032True[64]64
290.08True[4]4
..................
500.532False[64]64
510.58False[4]4
520.032True[64]64
530.08True[4]4
540.532True[64]64
550.58True[4]4
560.032False[64]64
570.08False[4]4
580.532False[64]64
590.58False[4]4
600.032True[64]64
610.08True[4]4
620.532True[64]64
630.58True[4]4
640.032False[64]64
650.08False[4]4
660.532False[64]64
670.58False[4]4
680.032True[64]64
690.08True[4]4
700.532True[64]64
710.58True[4]4
720.032False[64]64
730.08False[4]4
740.532False[64]64
750.58False[4]4
760.032True[64]64
770.08True[4]4
780.532True[64]64
790.58True[4]4
\n",
  "

80 rows × 5 columns

\n",
  "
"
  ],  "text/plain": [  " dropout_probability embedding_output_dim impute layer_sizes layer_size\n",  "0 0.0 32 False [64] 64\n",  "1 0.0 8 False [4] 4\n",  "2 0.5 32 False [64] 64\n",  "3 0.5 8 False [4] 4\n",  "4 0.0 32 True [64] 64\n",  "5 0.0 8 True [4] 4\n",  "6 0.5 32 True [64] 64\n",  "7 0.5 8 True [4] 4\n",  "8 0.0 32 False [64] 64\n",  "9 0.0 8 False [4] 4\n",  "10 0.5 32 False [64] 64\n",  "11 0.5 8 False [4] 4\n",  "12 0.0 32 True [64] 64\n",  "13 0.0 8 True [4] 4\n",  "14 0.5 32 True [64] 64\n",  "15 0.5 8 True [4] 4\n",  "16 0.0 32 False [64] 64\n",  "17 0.0 8 False [4] 4\n",  "18 0.5 32 False [64] 64\n",  "19 0.5 8 False [4] 4\n",  "20 0.0 32 True [64] 64\n",  "21 0.0 8 True [4] 4\n",  "22 0.5 32 True [64] 64\n",  "23 0.5 8 True [4] 4\n",  "24 0.0 32 False [64] 64\n",  "25 0.0 8 False [4] 4\n",  "26 0.5 32 False [64] 64\n",  "27 0.5 8 False [4] 4\n",  "28 0.0 32 True [64] 64\n",  "29 0.0 8 True [4] 4\n",  ".. ... ... ... ... ...\n",  "50 0.5 32 False [64] 64\n",  "51 0.5 8 False [4] 4\n",  "52 0.0 32 True [64] 64\n",  "53 0.0 8 True [4] 4\n",  "54 0.5 32 True [64] 64\n",  "55 0.5 8 True [4] 4\n",  "56 0.0 32 False [64] 64\n",  "57 0.0 8 False [4] 4\n",  "58 0.5 32 False [64] 64\n",  "59 0.5 8 False [4] 4\n",  "60 0.0 32 True [64] 64\n",  "61 0.0 8 True [4] 4\n",  "62 0.5 32 True [64] 64\n",  "63 0.5 8 True [4] 4\n",  "64 0.0 32 False [64] 64\n",  "65 0.0 8 False [4] 4\n",  "66 0.5 32 False [64] 64\n",  "67 0.5 8 False [4] 4\n",  "68 0.0 32 True [64] 64\n",  "69 0.0 8 True [4] 4\n",  "70 0.5 32 True [64] 64\n",  "71 0.5 8 True [4] 4\n",  "72 0.0 32 False [64] 64\n",  "73 0.0 8 False [4] 4\n",  "74 0.5 32 False [64] 64\n",  "75 0.5 8 False [4] 4\n",  "76 0.0 32 True [64] 64\n",  "77 0.0 8 True [4] 4\n",  "78 0.5 32 True [64] 64\n",  "79 0.5 8 True [4] 4\n",  "\n",  "[80 rows x 5 columns]"  ]  },  "execution_count": 8,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "models = pandas.read_csv(\"../data/validation_models.csv\", converters={'layer_sizes': eval})\n",  "models[\"layer_size\"] = [x[0] for x in models.layer_sizes]\n",  "del models[\"activation\"]\n",  "models"  ]  },  {  "cell_type": "code",  "execution_count": 9,  "metadata": {  "collapsed": false,  "scrolled": true  },  "outputs": [  {  "data": {  "text/html": [  "
\n",  "\n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  "
dropout_probabilityembedding_output_dimimputelayer_sizeslayer_sizenumname
00.032False[64]640big
10.08False[4]41small
20.532False[64]642big dropout
30.58False[4]43small dropout
40.032True[64]644big impute
50.08True[4]45small impute
60.532True[64]646big dropout impute
70.58True[4]47small dropout impute
80.032False[64]648big
90.08False[4]49small
100.532False[64]6410big dropout
110.58False[4]411small dropout
120.032True[64]6412big impute
130.08True[4]413small impute
140.532True[64]6414big dropout impute
150.58True[4]415small dropout impute
160.032False[64]6416big
170.08False[4]417small
180.532False[64]6418big dropout
190.58False[4]419small dropout
200.032True[64]6420big impute
210.08True[4]421small impute
220.532True[64]6422big dropout impute
230.58True[4]423small dropout impute
240.032False[64]6424big
250.08False[4]425small
260.532False[64]6426big dropout
270.58False[4]427small dropout
280.032True[64]6428big impute
290.08True[4]429small impute
........................
500.532False[64]6450big dropout
510.58False[4]451small dropout
520.032True[64]6452big impute
530.08True[4]453small impute
540.532True[64]6454big dropout impute
550.58True[4]455small dropout impute
560.032False[64]6456big
570.08False[4]457small
580.532False[64]6458big dropout
590.58False[4]459small dropout
600.032True[64]6460big impute
610.08True[4]461small impute
620.532True[64]6462big dropout impute
630.58True[4]463small dropout impute
640.032False[64]6464big
650.08False[4]465small
660.532False[64]6466big dropout
670.58False[4]467small dropout
680.032True[64]6468big impute
690.08True[4]469small impute
700.532True[64]6470big dropout impute
710.58True[4]471small dropout impute
720.032False[64]6472big
730.08False[4]473small
740.532False[64]6474big dropout
750.58False[4]475small dropout
760.032True[64]6476big impute
770.08True[4]477small impute
780.532True[64]6478big dropout impute
790.58True[4]479small dropout impute
\n",
  "

80 rows × 7 columns

\n",
  "
"
  ],  "text/plain": [  " dropout_probability embedding_output_dim impute layer_sizes layer_size \\\n",  "0 0.0 32 False [64] 64 \n",  "1 0.0 8 False [4] 4 \n",  "2 0.5 32 False [64] 64 \n",  "3 0.5 8 False [4] 4 \n",  "4 0.0 32 True [64] 64 \n",  "5 0.0 8 True [4] 4 \n",  "6 0.5 32 True [64] 64 \n",  "7 0.5 8 True [4] 4 \n",  "8 0.0 32 False [64] 64 \n",  "9 0.0 8 False [4] 4 \n",  "10 0.5 32 False [64] 64 \n",  "11 0.5 8 False [4] 4 \n",  "12 0.0 32 True [64] 64 \n",  "13 0.0 8 True [4] 4 \n",  "14 0.5 32 True [64] 64 \n",  "15 0.5 8 True [4] 4 \n",  "16 0.0 32 False [64] 64 \n",  "17 0.0 8 False [4] 4 \n",  "18 0.5 32 False [64] 64 \n",  "19 0.5 8 False [4] 4 \n",  "20 0.0 32 True [64] 64 \n",  "21 0.0 8 True [4] 4 \n",  "22 0.5 32 True [64] 64 \n",  "23 0.5 8 True [4] 4 \n",  "24 0.0 32 False [64] 64 \n",  "25 0.0 8 False [4] 4 \n",  "26 0.5 32 False [64] 64 \n",  "27 0.5 8 False [4] 4 \n",  "28 0.0 32 True [64] 64 \n",  "29 0.0 8 True [4] 4 \n",  ".. ... ... ... ... ... \n",  "50 0.5 32 False [64] 64 \n",  "51 0.5 8 False [4] 4 \n",  "52 0.0 32 True [64] 64 \n",  "53 0.0 8 True [4] 4 \n",  "54 0.5 32 True [64] 64 \n",  "55 0.5 8 True [4] 4 \n",  "56 0.0 32 False [64] 64 \n",  "57 0.0 8 False [4] 4 \n",  "58 0.5 32 False [64] 64 \n",  "59 0.5 8 False [4] 4 \n",  "60 0.0 32 True [64] 64 \n",  "61 0.0 8 True [4] 4 \n",  "62 0.5 32 True [64] 64 \n",  "63 0.5 8 True [4] 4 \n",  "64 0.0 32 False [64] 64 \n",  "65 0.0 8 False [4] 4 \n",  "66 0.5 32 False [64] 64 \n",  "67 0.5 8 False [4] 4 \n",  "68 0.0 32 True [64] 64 \n",  "69 0.0 8 True [4] 4 \n",  "70 0.5 32 True [64] 64 \n",  "71 0.5 8 True [4] 4 \n",  "72 0.0 32 False [64] 64 \n",  "73 0.0 8 False [4] 4 \n",  "74 0.5 32 False [64] 64 \n",  "75 0.5 8 False [4] 4 \n",  "76 0.0 32 True [64] 64 \n",  "77 0.0 8 True [4] 4 \n",  "78 0.5 32 True [64] 64 \n",  "79 0.5 8 True [4] 4 \n",  "\n",  " num name \n",  "0 0 big \n",  "1 1 small \n",  "2 2 big dropout \n",  "3 3 small dropout \n",  "4 4 big impute \n",  "5 5 small impute \n",  "6 6 big dropout impute \n",  "7 7 small dropout impute \n",  "8 8 big \n",  "9 9 small \n",  "10 10 big dropout \n",  "11 11 small dropout \n",  "12 12 big impute \n",  "13 13 small impute \n",  "14 14 big dropout impute \n",  "15 15 small dropout impute \n",  "16 16 big \n",  "17 17 small \n",  "18 18 big dropout \n",  "19 19 small dropout \n",  "20 20 big impute \n",  "21 21 small impute \n",  "22 22 big dropout impute \n",  "23 23 small dropout impute \n",  "24 24 big \n",  "25 25 small \n",  "26 26 big dropout \n",  "27 27 small dropout \n",  "28 28 big impute \n",  "29 29 small impute \n",  ".. ... ... \n",  "50 50 big dropout \n",  "51 51 small dropout \n",  "52 52 big impute \n",  "53 53 small impute \n",  "54 54 big dropout impute \n",  "55 55 small dropout impute \n",  "56 56 big \n",  "57 57 small \n",  "58 58 big dropout \n",  "59 59 small dropout \n",  "60 60 big impute \n",  "61 61 small impute \n",  "62 62 big dropout impute \n",  "63 63 small dropout impute \n",  "64 64 big \n",  "65 65 small \n",  "66 66 big dropout \n",  "67 67 small dropout \n",  "68 68 big impute \n",  "69 69 small impute \n",  "70 70 big dropout impute \n",  "71 71 small dropout impute \n",  "72 72 big \n",  "73 73 small \n",  "74 74 big dropout \n",  "75 75 small dropout \n",  "76 76 big impute \n",  "77 77 small impute \n",  "78 78 big dropout impute \n",  "79 79 small dropout impute \n",  "\n",  "[80 rows x 7 columns]"  ]  },  "execution_count": 9,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "def name_model(row):\n",  " size = \"big\" if row.embedding_output_dim == 32 else \"small\"\n",  " pieces = [size]\n",  " if row.dropout_probability > 0:\n",  " pieces.append(\"dropout\")\n",  " if row.impute:\n",  " pieces.append(\"impute\")\n",  " return \" \".join(pieces)\n",  "\n",  "models[\"num\"] = models.index\n",  "models[\"name\"] = [name_model(row) for (_, row) in models.iterrows()]\n",  "models"  ]  },  {  "cell_type": "code",  "execution_count": 10,  "metadata": {  "collapsed": false  },  "outputs": [  {  "data": {  "text/plain": [  "name\n",  "big [0, 8, 16, 24, 32, 40, 48, 56, 64, 72]\n",  "big dropout [2, 10, 18, 26, 34, 42, 50, 58, 66, 74]\n",  "big dropout impute [6, 14, 22, 30, 38, 46, 54, 62, 70, 78]\n",  "big impute [4, 12, 20, 28, 36, 44, 52, 60, 68, 76]\n",  "small [1, 9, 17, 25, 33, 41, 49, 57, 65, 73]\n",  "small dropout [3, 11, 19, 27, 35, 43, 51, 59, 67, 75]\n",  "small dropout impute [7, 15, 23, 31, 39, 47, 55, 63, 71, 79]\n",  "small impute [5, 13, 21, 29, 37, 45, 53, 61, 69, 77]\n",  "Name: num, dtype: object"  ]  },  "execution_count": 10,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "model_groups = models.groupby(\"name\").num.unique()\n",  "model_groups"  ]  },  {  "cell_type": "code",  "execution_count": 11,  "metadata": {  "collapsed": false  },  "outputs": [  {  "data": {  "text/html": [  "
\n",  "\n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  "
allelepeptidelengthmeasnetmhcnetmhcpansmmpmbec_cppmhcflurry 0mhcflurry 1mhcflurry 2...mhcflurry 70mhcflurry 71mhcflurry 72mhcflurry 73mhcflurry 74mhcflurry 75mhcflurry 76mhcflurry 77mhcflurry 78mhcflurry 79
0H-2-DBAAACNVATA9657.657837154.881662711.213514438.530698466.814768172.641984343.793510...355.844970825.249008236.052464956.955845407.9201381335.32652412.870162146.240141387.0252931175.574895
1H-2-DBAAFEFVYV830831.8795026456.542290785.23563510351.42166715087.57442610433.57988110853.152403...11752.22789115845.44483920566.6211499283.35974511241.79719514002.3826969334.1978637675.90635612913.68859915777.427472
2H-2-DBAAFVNDYSL977.44618017.4582227.51622928.05433647.82080716.30379429.588240...39.930163217.65052340.09533846.91429932.406285179.56423626.90908116.45783934.553959218.821497
3H-2-DBAAIANQAAV91.9998629.6382909.74989625.7039582.8878697.43067623.204965...23.68500490.3136195.01709811.15676019.40768370.8182184.1193977.33727119.713879103.209533
4H-2-DBAAIANQAVV91.5170508.5506678.33681228.7739842.5797535.21599317.054924...19.16559174.7654374.3786195.17013416.11163869.8247313.5073056.21059115.77275986.157611
5H-2-DBAAIENYVRF937.844258252.348077114.815362187.06821491.63201077.986067288.144351...302.361030493.962110374.752767217.663016301.008748415.441450402.005916195.863576368.765718533.387993
6H-2-DBAAINFITTM93.155005199.986187389.045145200.909281474.790652183.21505343.296033...43.854696288.18737316.12218728.38289941.544168186.44272976.292963156.35298544.815033282.989902
7H-2-DBAAIPAPPPI93243.3961731059.253725493.173804295.120923623.8788477834.652456178.830163...229.813055285.925339352.893901246.850697184.103734213.9476962278.596615207.562759219.872392329.439928
8H-2-DBAAKLNRPPL9654.63617466.37430777.26805938.45917888.91700463.99615560.123046...88.217258337.759556199.810086177.46849267.696375149.00965830.53699387.14571472.876322240.820089
9H-2-DBAALDMVDAL9229.614865547.015963597.035287225.4239215459.146719678.959069605.313435...454.257039627.4924743152.1814311722.232625438.567638535.0665322163.586824617.108573843.582091868.502679
10H-2-DBAALQHLRSI9905.7326011686.5530252032.357011698.2324043669.0748003156.4635291692.175239...1810.2148632732.7937705234.3499141440.8532231497.6493571515.463774401.7384523099.4016522217.8817092120.478424
11H-2-DBAALVRLTAL91106.623784435.511874214.783047378.4425852137.0101573406.4246851367.951646...1326.0214934875.5535961154.8525161467.3593911007.4465473071.2864501194.5425371536.7402921412.4659933537.201741
12H-2-DBAAMVPTGSL91836.5383434055.0853545176.0683201545.25444015245.04609721471.1309395051.710355...4747.80204511006.36124811072.1560083931.7099234959.5213564315.00657010710.08874710668.5202165155.9229518201.539185
13H-2-DBAANSPWAPV94325.138310903.6494741023.292992557.1857491446.5783364093.6316561124.045813...1094.6110366360.457511307.171802812.754323910.3836652690.5267533445.8675259463.9670911005.0973355503.108263
14H-2-DBAAPSGAAPL92.84446197.948999501.187234822.24265077.761677116.251052658.194668...800.8921081401.23696353.680604108.438079773.3840211367.342619121.451184437.461308887.5622251781.904400
15H-2-DBAAPVSEPTV9106.9054882654.6055621918.6687411870.6821401627.4372432005.2047562467.857734...2127.7242503295.5852881445.3068712024.7663611920.3286072410.318075693.1112483189.7195702294.9205683389.988758
16H-2-DBAAVANGFAA983.368118205.116218228.559880200.44720340.538621116.659086382.503402...362.540055487.307534372.898117390.071684337.855848579.19010167.290789346.727393424.915484728.546885
17H-2-DBAAVLLGAPV9373.250158320.626932623.734835286.41779739.330610408.638824605.753153...725.1966191212.226998129.636031384.397149534.5276331108.41201691.799755414.029628768.9024591445.428048
18H-2-DBAAVQLLFPA9347.5361612494.5947275152.286446679.203633250.552588681.4964201427.626931...1702.5491502396.604364696.9512413932.3565531503.6874193000.7387411538.6031222704.1917702316.0407743015.279174
19H-2-DBAAVTAGVAL9229.6148651552.3870102172.7011791927.5249132506.291305780.9196382868.849059...2517.9283362170.3829001055.1593802794.1402922302.9963862518.167863820.4965332671.2234382850.4953613962.499784
20H-2-DBAAVVNRSLV98.60993826.30268029.58012563.82634910.61283219.74872059.138583...75.529552318.6376257.21389029.84785470.128943272.39087610.7718219.90435777.326501338.353540
21H-2-DBAAYVPADAV9331.8944581757.9236143206.269325595.6621449645.65853211279.3049471835.991854...1730.2520459663.8615293394.274298343.3056391448.3556914378.6164733786.8843971788.6708651658.6937318368.901644
22H-2-DBACMVNLERL9737.904230239.331576679.203633444.6312671891.427069521.101746520.331052...668.3130511022.9646333781.894617607.244752646.255327740.2042011458.515409845.697222677.363608750.479001
23H-2-DBADLVNHPPV9558.4701951694.3378001857.804455325.0872974042.236381954.0534821131.217632...0.8693831449.5143850.6060144738.3799870.9135272530.1651520.855011551.1297010.6047201385.3079250.8979283537.2256940.8577193961.0249240.563960505.0637398131741.03958934122946.101555
HLA-A3101240.828510H-2-DB0.782609AEMEEALKG0.46055490.85483878523.5634610.82250041304.7501990.51028746989.4108610.847235440554.8635070.81761048819.1822110.50399043577.0473330.84062841487.708042...0.83395841399.9883790.52502635250.5231530.85926148362.4470850.82233545097.1793720.52894141718.2512790.85127035448.0264540.83703749293.2072170.50258641773.22472972442962.716446479637455.936779
HLA-A1101250.920368H-2-DB0.872077AFFAFRYV0.57990680.93652087902.2516830.88315218967.0592120.61535112882.4955170.9369277816.2780460.88429817412.9618930.6120138603.3894750.92545022533.909280...0.88340224016.0905010.63219921994.3181610.94506524405.2692460.88767113666.2184510.62579423156.1402140.94420520193.6342540.88251417554.1344380.6183888162.34739272324923.308535539922296.724479
HLA-A0101260.912746H-2-DB0.621762AGLDNKFYL0.52172090.924911659.1738950.659794357.2728380.531596202.7682720.909260260.0159560.58620732.4668860.521745374.1950200.887468216.595300...0.619565237.5803960.524866648.8775690.89489596.9913990.594286445.8548310.498767221.8157600.832665385.4157590.437811858.8010790.42806467.825594696248.4441983725382.737079
HLA-A0206270.876067H-2-DB0.849449AGLLFVLL0.46571380.90908187902.2516830.87223614996.8483550.5288769885.5309470.90002526242.1854340.86871217654.3207700.51742117139.8225790.88350016697.495982...0.87290216757.7573790.54318418717.1644440.91079634186.3977780.86625815473.3013460.53506716370.4335640.90431718373.2923240.87828226600.5495390.52757121086.74605168217927.260869482717732.815373
28H-2-DBAGLQVINL859429.21586225061.09253012560.29963735399.73410831484.00322933545.66261526437.149676...27944.89731124644.50480736414.27390630879.96342827227.38098923507.40866432060.81921529365.71754329602.72829924198.313575
29H-2-DBAGLVSFNFL9210.862815620.8690342285.5988031811.3400931972.836236630.4586531812.154993...1769.0977935681.9652871380.825869678.4443331656.2646033436.201451849.735139689.3506482083.6977143479.754922
..................................................................
27650Mamu-A02YNTVCVIW8909.913273734.51386810023.05238148.86523611822.9079608396.8663777112.873873...6103.7622795706.8483388802.55201312567.1964328011.7647314650.3997747086.5015627825.5129377096.7757795180.448858
27651Mamu-A02YRHDGGNVL978342.9642771355.18941222233.0989061409.2887982553.2938841061.0216241050.845801...894.909129994.1365791214.3748752514.1833131272.9045661422.421658907.4838371900.1908251335.629257718.434273
27652Mamu-A02YSEGQYMNTP107362.0709752958.0124678709.6359004477.1330423862.2897482829.0805013857.430334...3143.9628386180.7610255845.0212386467.2659123548.7837444006.5185285664.05863813693.5574883536.5668337235.413991
27653Mamu-A02YSEVALNVTES117709.0346911682.6740615105.05000051.522864602.395338540.214499382.353838...250.582548280.629057526.2291531021.750902369.581319234.690151486.5368351060.598522342.638429236.626449
27654Mamu-A02YSLVFVILM91256.02996417.49846749.4310696.3241196.53408512.24552814.057669...10.50999128.0405115.5470387.03378312.46672126.2734857.15133910.76786912.48550128.785291
27655Mamu-A02YSQIGAGVY91.99986217.86487615.34617016.29296015.84980610.15948143.079177...30.75925382.32924647.95054231.01821740.31417463.92397011.68109210.37140937.62517362.095899
27656Mamu-A02YSRDLICEQS101059.2537251297.1792713863.669771220.292646941.907232388.803523516.415889...387.881448742.517045414.874833758.740294632.258766830.589892793.228083572.923767613.892864570.111053
27657Mamu-A02YSYKAFIKY92.3173954.2854853.0902951.7782795.47645230.28788713.697417...8.62823243.8687826.0312053.82279013.21751925.3149413.3908806.53617112.34284327.965131
27658Mamu-A02YSYKAFIKYP104830.5880201199.4993031753.8805023111.7163371948.3113901887.0882371719.075267...1423.3161553947.2241281921.0795022578.6577811938.8193432072.8271141712.4028825059.6732051661.7620774067.969954
27659Mamu-A02YSYKAFIKYPE114897.788194671.4288532666.85866542.5598412940.1083931753.5134951992.582402...1562.0232242457.5260712553.7109711028.3742262201.9986631914.1267661971.3690732999.8966712162.5413391245.603882
27660Mamu-A02YTAFTLPSV9101.62486932.21068852.84452591.8332604.5728524.46082014.724639...13.08001353.8011796.6642675.26533714.22363265.4067487.5732505.39913414.20073653.042656
27661Mamu-A02YTAFTLPSVN102529.297996236.5919701406.04752414.48771965.07737757.65963693.229936...83.773598384.640057125.84079752.47150074.862144573.88701681.70202266.78078371.886595240.199173
27662Mamu-A02YTDGSCNKQS1011091.7481534345.10224211246.049740588.8436551636.0849772050.4302311818.078082...1256.8405231306.9328371469.7971302058.2531851969.5040371605.8522351416.5171181745.7906851682.5159281105.013233
27663Mamu-A02YTGDFDSVI9215.278173354.81338942.46195640.550854282.77362761.811464203.244505...181.966273462.890272412.331323365.904127245.184308313.036807174.941719208.131635220.111451297.084820
27664Mamu-A02YTPKVVGG870145.52984217947.33626813995.8732263140.50869428699.44701918917.41696511333.871219...11601.7148765263.19665221605.96339417250.63167611143.0313194582.26495023462.45713815842.33491811077.1644394122.825718
27665Mamu-A02YTPKVVGGIGG1170145.5298429418.89596510046.157903387.25764510653.38791010389.2900525383.389946...5521.1861653344.3899008731.6492929635.4927125680.2576583185.4178819543.8307238040.9478345350.0615592927.695538
27666Mamu-A02YTSGPGIR816865.530254619.4410752349.63282180.7235034905.8694433486.588065482.922794...429.718520396.3941356877.4076122684.074701455.836990447.3021475757.8622931477.957443528.183888309.217351
27667Mamu-A02YTSGPGIRYP107128.530301783.4296435176.0683201270.5741052079.2837781463.620665894.140283...904.9982762423.6145362275.4952341794.6944601019.8932391169.6105031831.9638933725.336355883.3808012596.187281
27668Mamu-A02YTSGPGTRYP103097.419299483.0588025420.008904797.9946871746.138067995.837100561.597714...620.1894611681.4896702001.0066621304.941441674.835464733.2938131398.3646232374.786783567.5074711807.753477
27669Mamu-A02YTSGPGTRYPM1125.94179439.1741887.74461876.38357865.78295332.05805974.582612...71.948261142.673945166.81788042.92082271.100380130.10020948.41317039.95182279.366150128.174314
27670Mamu-A02YTTGGTSR870145.529842357.2728385701.642723100.2305244867.9553662688.430936159.755152...133.03959085.0320238453.858885895.542406172.39701977.6526715343.670130635.441307165.76029762.800866
27671Mamu-A02YTTGGTSRN936897.759857186.6379696025.595861119.674053268.02515984.16890136.777590...33.175027131.7904752470.57041855.16248132.079349110.133710198.86033854.43038026.40056670.350814
27672Mamu-A02YTTTGASRN9587.489353135.5189412844.46110787.09635991.768323120.19931137.542691...32.846542132.5930311835.56564684.40383234.172877119.12033294.967471111.75109031.44383366.154394
27673Mamu-A02YTYEAYVRYP102624.2185431552.3870103872.5764491954.3394565516.6012123207.8349542203.500262...2028.0315733638.2181306000.2777815129.0638652585.0645761481.9064266325.2704647169.5085072214.4379123499.440631
27674Mamu-A02YTYEAYVRYPE111905.460718864.9679196998.41996032.7340694316.8894841492.3388822768.632417...2421.7738522883.3621196011.6648102811.9386742831.3417091761.6816263551.1830952386.1232563076.6052441348.655309
27675Mamu-A02YVADALAAF915.381546453.94161771.285303108.14339573.800771431.698036320.442212...314.117009658.882253362.514922172.978331387.093189564.26619868.064668638.661214398.453547343.711818
27676Mamu-A02YVFPVIFSK939264.4935402098.9398845610.479760901.57113816244.4615988409.0867213114.359914...3489.3499813101.65615515626.7855282524.4605512279.5799141928.30518315427.30246110459.9597183026.0567832103.577319
27677Mamu-A02YVFPVIFSR936728.2300502333.45806210046.1579032600.15956322634.88795010567.0444062196.918342...1905.6844791027.06208717261.4945715843.7740892181.852143899.85813319668.76899510561.9362582396.738834831.409071
27678Mamu-A02YVPCHIRQI910764.65213621134.8903986039.48629410568.17509220710.55999912170.67723520094.652790...17995.61200114552.86703115421.88855517895.82966219588.30774213696.52602519211.52192830602.39577620054.26551413187.834441
27679Mamu-A02YVVQMLARL9152.405275232.273680739.605275105.681751528.261756625.062058724.556640...508.227064771.475124459.471596982.564782772.242698591.3298161189.8076141523.473123695.975900709.660102
\n",
  "

27680 rows × 87 columns

\n",
  "
"
  ],  "text/plain": [  " allele peptide length meas netmhc \\\n",  "0 H-2-DB AAACNVATA 9 657.657837 154.881662 \n",  "1 H-2-DB AAFEFVYV 8 30831.879502 6456.542290 \n",  "2 H-2-DB AAFVNDYSL 9 77.446180 17.458222 \n",  "3 H-2-DB AAIANQAAV 9 1.999862 9.638290 \n",  "4 H-2-DB AAIANQAVV 9 1.517050 8.550667 \n",  "5 H-2-DB AAIENYVRF 9 37.844258 252.348077 \n",  "6 H-2-DB AAINFITTM 9 3.155005 199.986187 \n",  "7 H-2-DB AAIPAPPPI 9 3243.396173 1059.253725 \n",  "8 H-2-DB AAKLNRPPL 9 654.636174 66.374307 \n",  "9 H-2-DB AALDMVDAL 9 229.614865 547.015963 \n",  "10 H-2-DB AALQHLRSI 9 905.732601 1686.553025 \n",  "11 H-2-DB AALVRLTAL 9 1106.623784 435.511874 \n",  "12 H-2-DB AAMVPTGSL 9 1836.538343 4055.085354 \n",  "13 H-2-DB AANSPWAPV 9 4325.138310 903.649474 \n",  "14 H-2-DB AAPSGAAPL 9 2.844461 97.948999 \n",  "15 H-2-DB AAPVSEPTV 9 106.905488 2654.605562 \n",  "16 H-2-DB AAVANGFAA 9 83.368118 205.116218 \n",  "17 H-2-DB AAVLLGAPV 9 373.250158 320.626932 \n",  "18 H-2-DB AAVQLLFPA 9 347.536161 2494.594727 \n",  "19 H-2-DB AAVTAGVAL 9 229.614865 1552.387010 \n",  "20 H-2-DB AAVVNRSLV 9 8.609938 26.302680 \n",  "21 H-2-DB AAYVPADAV 9 331.894458 1757.923614 \n",  "22 H-2-DB ACMVNLERL 9 737.904230 239.331576 \n",  "23 H-2-DB ADLVNHPPV 9 558.470195 1694.337800 \n",  "24 H-2-DB AEMEEALKG 9 78523.563461 41304.750199 \n",  "25 H-2-DB AFFAFRYV 8 87902.251683 18967.059212 \n",  "26 H-2-DB AGLDNKFYL 9 659.173895 357.272838 \n",  "27 H-2-DB AGLLFVLL 8 87902.251683 14996.848355 \n",  "28 H-2-DB AGLQVINL 8 59429.215862 25061.092530 \n",  "29 H-2-DB AGLVSFNFL 9 210.862815 620.869034 \n",  "... ... ... ... ... ... \n",  "27650 Mamu-A02 YNTVCVIW 8 909.913273 734.513868 \n",  "27651 Mamu-A02 YRHDGGNVL 9 78342.964277 1355.189412 \n",  "27652 Mamu-A02 YSEGQYMNTP 10 7362.070975 2958.012467 \n",  "27653 Mamu-A02 YSEVALNVTES 11 7709.034691 1682.674061 \n",  "27654 Mamu-A02 YSLVFVILM 9 1256.029964 17.498467 \n",  "27655 Mamu-A02 YSQIGAGVY 9 1.999862 17.864876 \n",  "27656 Mamu-A02 YSRDLICEQS 10 1059.253725 1297.179271 \n",  "27657 Mamu-A02 YSYKAFIKY 9 2.317395 4.285485 \n",  "27658 Mamu-A02 YSYKAFIKYP 10 4830.588020 1199.499303 \n",  "27659 Mamu-A02 YSYKAFIKYPE 11 4897.788194 671.428853 \n",  "27660 Mamu-A02 YTAFTLPSV 9 101.624869 32.210688 \n",  "27661 Mamu-A02 YTAFTLPSVN 10 2529.297996 236.591970 \n",  "27662 Mamu-A02 YTDGSCNKQS 10 11091.748153 4345.102242 \n",  "27663 Mamu-A02 YTGDFDSVI 9 215.278173 354.813389 \n",  "27664 Mamu-A02 YTPKVVGG 8 70145.529842 17947.336268 \n",  "27665 Mamu-A02 YTPKVVGGIGG 11 70145.529842 9418.895965 \n",  "27666 Mamu-A02 YTSGPGIR 8 16865.530254 619.441075 \n",  "27667 Mamu-A02 YTSGPGIRYP 10 7128.530301 783.429643 \n",  "27668 Mamu-A02 YTSGPGTRYP 10 3097.419299 483.058802 \n",  "27669 Mamu-A02 YTSGPGTRYPM 11 25.941794 39.174188 \n",  "27670 Mamu-A02 YTTGGTSR 8 70145.529842 357.272838 \n",  "27671 Mamu-A02 YTTGGTSRN 9 36897.759857 186.637969 \n",  "27672 Mamu-A02 YTTTGASRN 9 587.489353 135.518941 \n",  "27673 Mamu-A02 YTYEAYVRYP 10 2624.218543 1552.387010 \n",  "27674 Mamu-A02 YTYEAYVRYPE 11 1905.460718 864.967919 \n",  "27675 Mamu-A02 YVADALAAF 9 15.381546 453.941617 \n",  "27676 Mamu-A02 YVFPVIFSK 9 39264.493540 2098.939884 \n",  "27677 Mamu-A02 YVFPVIFSR 9 36728.230050 2333.458062 \n",  "27678 Mamu-A02 YVPCHIRQI 9 10764.652136 21134.890398 \n",  "27679 Mamu-A02 YVVQMLARL 9 152.405275 232.273680 \n",  "\n",  " netmhcpan smmpmbec_cpp mhcflurry 0 mhcflurry 1 mhcflurry 2 \\\n",  "0 711.213514 438.530698 466.814768 172.641984 343.793510 \n",  "1 785.235635 10351.421667 15087.574426 10433.579881 10853.152403 \n",  "2 7.516229 28.054336 47.820807 16.303794 29.588240 \n",  "3 9.749896 25.703958 2.887869 7.430676 23.204965 \n",  "4 8.336812 28.773984 2.579753 5.215993 17.054924 \n",  "5 114.815362 187.068214 91.632010 77.986067 288.144351 \n",  "6 389.045145 200.909281 474.790652 183.215053 43.296033 \n",  "7 493.173804 295.120923 623.878847 7834.652456 178.830163 \n",  "8 77.268059 38.459178 88.917004 63.996155 60.123046 \n",  "9 597.035287 225.423921 5459.146719 678.959069 605.313435 \n",  "10 2032.357011 698.232404 3669.074800 3156.463529 1692.175239 \n",  "11 214.783047 378.442585 2137.010157 3406.424685 1367.951646 \n",  "12 5176.068320 1545.254440 15245.046097 21471.130939 5051.710355 \n",  "13 1023.292992 557.185749 1446.578336 4093.631656 1124.045813 \n",  "14 501.187234 822.242650 77.761677 116.251052 658.194668 \n",  "15 1918.668741 1870.682140 1627.437243 2005.204756 2467.857734 \n",  "16 228.559880 200.447203 40.538621 116.659086 382.503402 \n",  "17 623.734835 286.417797 39.330610 408.638824 605.753153 \n",  "18 5152.286446 679.203633 250.552588 681.496420 1427.626931 \n",  "19 2172.701179 1927.524913 2506.291305 780.919638 2868.849059 \n",  "20 29.580125 63.826349 10.612832 19.748720 59.138583 \n",  "21 3206.269325 595.662144 9645.658532 11279.304947 1835.991854 \n",  "22 679.203633 444.631267 1891.427069 521.101746 520.331052 \n",  "23 1857.804455 325.087297 4042.236381 954.053482 1131.217632 \n",  "24 46989.410861 440554.863507 48819.182211 43577.047333 41487.708042 \n",  "25 12882.495517 7816.278046 17412.961893 8603.389475 22533.909280 \n",  "26 202.768272 260.015956 32.466886 374.195020 216.595300 \n",  "27 9885.530947 26242.185434 17654.320770 17139.822579 16697.495982 \n",  "28 12560.299637 35399.734108 31484.003229 33545.662615 26437.149676 \n",  "29 2285.598803 1811.340093 1972.836236 630.458653 1812.154993 \n",  "... ... ... ... ... ... \n",  "27650 10023.052381 48.865236 11822.907960 8396.866377 7112.873873 \n",  "27651 22233.098906 1409.288798 2553.293884 1061.021624 1050.845801 \n",  "27652 8709.635900 4477.133042 3862.289748 2829.080501 3857.430334 \n",  "27653 5105.050000 51.522864 602.395338 540.214499 382.353838 \n",  "27654 49.431069 6.324119 6.534085 12.245528 14.057669 \n",  "27655 15.346170 16.292960 15.849806 10.159481 43.079177 \n",  "27656 3863.669771 220.292646 941.907232 388.803523 516.415889 \n",  "27657 3.090295 1.778279 5.476452 30.287887 13.697417 \n",  "27658 1753.880502 3111.716337 1948.311390 1887.088237 1719.075267 \n",  "27659 2666.858665 42.559841 2940.108393 1753.513495 1992.582402 \n",  "27660 52.844525 91.833260 4.572852 4.460820 14.724639 \n",  "27661 1406.047524 14.487719 65.077377 57.659636 93.229936 \n",  "27662 11246.049740 588.843655 1636.084977 2050.430231 1818.078082 \n",  "27663 42.461956 40.550854 282.773627 61.811464 203.244505 \n",  "27664 13995.873226 3140.508694 28699.447019 18917.416965 11333.871219 \n",  "27665 10046.157903 387.257645 10653.387910 10389.290052 5383.389946 \n",  "27666 2349.632821 80.723503 4905.869443 3486.588065 482.922794 \n",  "27667 5176.068320 1270.574105 2079.283778 1463.620665 894.140283 \n",  "27668 5420.008904 797.994687 1746.138067 995.837100 561.597714 \n",  "27669 7.744618 76.383578 65.782953 32.058059 74.582612 \n",  "27670 5701.642723 100.230524 4867.955366 2688.430936 159.755152 \n",  "27671 6025.595861 119.674053 268.025159 84.168901 36.777590 \n",  "27672 2844.461107 87.096359 91.768323 120.199311 37.542691 \n",  "27673 3872.576449 1954.339456 5516.601212 3207.834954 2203.500262 \n",  "27674 6998.419960 32.734069 4316.889484 1492.338882 2768.632417 \n",  "27675 71.285303 108.143395 73.800771 431.698036 320.442212 \n",  "27676 5610.479760 901.571138 16244.461598 8409.086721 3114.359914 \n",  "27677 10046.157903 2600.159563 22634.887950 10567.044406 2196.918342 \n",  "27678 6039.486294 10568.175092 20710.559999 12170.677235 20094.652790 \n",  "27679 739.605275 105.681751 528.261756 625.062058 724.556640 \n",  "\n",  " ... mhcflurry 70 mhcflurry 71 mhcflurry 72 mhcflurry 73 \\\n",  "0 ... 355.844970 825.249008 236.052464 956.955845 \n",  "1 ... 11752.227891 15845.444839 20566.621149 9283.359745 \n",  "2 ... 39.930163 217.650523 40.095338 46.914299 \n",  "3 ... 23.685004 90.313619 5.017098 11.156760 \n",  "4 ... 19.165591 74.765437 4.378619 5.170134 \n",  "5 ... 302.361030 493.962110 374.752767 217.663016 \n",  "6 ... 43.854696 288.187373 16.122187 28.382899 \n",  "7 ... 229.813055 285.925339 352.893901 246.850697 \n",  "8 ... 88.217258 337.759556 199.810086 177.468492 \n",  "9 ... 454.257039 627.492474 3152.181431 1722.232625 \n",  "10 ... 1810.214863 2732.793770 5234.349914 1440.853223 \n",  "11 ... 1326.021493 4875.553596 1154.852516 1467.359391 \n",  "12 ... 4747.802045 11006.361248 11072.156008 3931.709923 \n",  "13 ... 1094.611036 6360.457511 307.171802 812.754323 \n",  "14 ... 800.892108 1401.236963 53.680604 108.438079 \n",  "15 ... 2127.724250 3295.585288 1445.306871 2024.766361 \n",  "16 ... 362.540055 487.307534 372.898117 390.071684 \n",  "17 ... 725.196619 1212.226998 129.636031 384.397149 \n",  "18 ... 1702.549150 2396.604364 696.951241 3932.356553 \n",  "19 ... 2517.928336 2170.382900 1055.159380 2794.140292 \n",  "20 ... 75.529552 318.637625 7.213890 29.847854 \n",  "21 ... 1730.252045 9663.861529 3394.274298 343.305639 \n",  "22 ... 668.313051 1022.964633 3781.894617 607.244752 \n",  "23 ... 1449.514385 4738.379987 2530.165152 551.129701 \n",  "24 ... 41399.988379 35250.523153 48362.447085 45097.179372 \n",  "25 ... 24016.090501 21994.318161 24405.269246 13666.218451 \n",  "26 ... 237.580396 648.877569 96.991399 445.854831 \n",  "27 ... 16757.757379 18717.164444 34186.397778 15473.301346 \n",  "28 ... 27944.897311 24644.504807 36414.273906 30879.963428 \n",  "29 ... 1769.097793 5681.965287 1380.825869 678.444333 \n",  "... ... ... ... ... ... \n",  "27650 ... 6103.762279 5706.848338 8802.552013 12567.196432 \n",  "27651 ... 894.909129 994.136579 1214.374875 2514.183313 \n",  "27652 ... 3143.962838 6180.761025 5845.021238 6467.265912 \n",  "27653 ... 250.582548 280.629057 526.229153 1021.750902 \n",  "27654 ... 10.509991 28.040511 5.547038 7.033783 \n",  "27655 ... 30.759253 82.329246 47.950542 31.018217 \n",  "27656 ... 387.881448 742.517045 414.874833 758.740294 \n",  "27657 ... 8.628232 43.868782 6.031205 3.822790 \n",  "27658 ... 1423.316155 3947.224128 1921.079502 2578.657781 \n",  "27659 ... 1562.023224 2457.526071 2553.710971 1028.374226 \n",  "27660 ... 13.080013 53.801179 6.664267 5.265337 \n",  "27661 ... 83.773598 384.640057 125.840797 52.471500 \n",  "27662 ... 1256.840523 1306.932837 1469.797130 2058.253185 \n",  "27663 ... 181.966273 462.890272 412.331323 365.904127 \n",  "27664 ... 11601.714876 5263.196652 21605.963394 17250.631676 \n",  "27665 ... 5521.186165 3344.389900 8731.649292 9635.492712 \n",  "27666 ... 429.718520 396.394135 6877.407612 2684.074701 \n",  "27667 ... 904.998276 2423.614536 2275.495234 1794.694460 \n",  "27668 ... 620.189461 1681.489670 2001.006662 1304.941441 \n",  "27669 ... 71.948261 142.673945 166.817880 42.920822 \n",  "27670 ... 133.039590 85.032023 8453.858885 895.542406 \n",  "27671 ... 33.175027 131.790475 2470.570418 55.162481 \n",  "27672 ... 32.846542 132.593031 1835.565646 84.403832 \n",  "27673 ... 2028.031573 3638.218130 6000.277781 5129.063865 \n",  "27674 ... 2421.773852 2883.362119 6011.664810 2811.938674 \n",  "27675 ... 314.117009 658.882253 362.514922 172.978331 \n",  "27676 ... 3489.349981 3101.656155 15626.785528 2524.460551 \n",  "27677 ... 1905.684479 1027.062087 17261.494571 5843.774089 \n",  "27678 ... 17995.612001 14552.867031 15421.888555 17895.829662 \n",  "27679 ... 508.227064 771.475124 459.471596 982.564782 \n",  "\n",  " mhcflurry 74 mhcflurry 75 mhcflurry 76 mhcflurry 77 mhcflurry 78 \\\n",  "0 407.920138 1335.326524 12.870162 146.240141 387.025293 \n",  "1 11241.797195 14002.382696 9334.197863 7675.906356 12913.688599 \n",  "2 32.406285 179.564236 26.909081 16.457839 34.553959 \n",  "3 19.407683 70.818218 4.119397 7.337271 19.713879 \n",  "4 16.111638 69.824731 3.507305 6.210591 15.772759 \n",  "5 301.008748 415.441450 402.005916 195.863576 368.765718 \n",  "6 41.544168 186.442729 76.292963 156.352985 44.815033 \n",  "7 184.103734 213.947696 2278.596615 207.562759 219.872392 \n",  "8 67.696375 149.009658 30.536993 87.145714 72.876322 \n",  "9 438.567638 535.066532 2163.586824 617.108573 843.582091 \n",  "10 1497.649357 1515.463774 401.738452 3099.401652 2217.881709 \n",  "11 1007.446547 3071.286450 1194.542537 1536.740292 1412.465993 \n",  "12 4959.521356 4315.006570 10710.088747 10668.520216 5155.922951 \n",  "13 910.383665 2690.526753 3445.867525 9463.967091 1005.097335 \n",  "14 773.384021 1367.342619 121.451184 437.461308 887.562225 \n",  "15 1920.328607 2410.318075 693.111248 3189.719570 2294.920568 \n",  "16 337.855848 579.190101 67.290789 346.727393 424.915484 \n",  "17 534.527633 1108.412016 91.799755 414.029628 768.902459 \n",  "18 1503.687419 3000.738741 1538.603122 2704.191770 2316.040774 \n",  "19 2302.996386 2518.167863 820.496533 2671.223438 2850.495361 \n",  "20 70.128943 272.390876 10.771821 9.904357 77.326501 \n",  "21 1448.355691 4378.616473 3786.884397 1788.670865 1658.693731 \n",  "22 646.255327 740.204201 1458.515409 845.697222 677.363608 \n",  "23 1385.307925 3537.225694 3961.024924 505.063739 1741.039589 \n",  "24 41718.251279 35448.026454 49293.207217 41773.224729 42962.716446 \n",  "25 23156.140214 20193.634254 17554.134438 8162.347392 24923.308535 \n",  "26 221.815760 385.415759 858.801079 67.825594 248.444198 \n",  "27 16370.433564 18373.292324 26600.549539 21086.746051 17927.260869 \n",  "28 27227.380989 23507.408664 32060.819215 29365.717543 29602.728299 \n",  "29 1656.264603 3436.201451 849.735139 689.350648 2083.697714 \n",  "... ... ... ... ... ... \n",  "27650 8011.764731 4650.399774 7086.501562 7825.512937 7096.775779 \n",  "27651 1272.904566 1422.421658 907.483837 1900.190825 1335.629257 \n",  "27652 3548.783744 4006.518528 5664.058638 13693.557488 3536.566833 \n",  "27653 369.581319 234.690151 486.536835 1060.598522 342.638429 \n",  "27654 12.466721 26.273485 7.151339 10.767869 12.485501 \n",  "27655 40.314174 63.923970 11.681092 10.371409 37.625173 \n",  "27656 632.258766 830.589892 793.228083 572.923767 613.892864 \n",  "27657 13.217519 25.314941 3.390880 6.536171 12.342843 \n",  "27658 1938.819343 2072.827114 1712.402882 5059.673205 1661.762077 \n",  "27659 2201.998663 1914.126766 1971.369073 2999.896671 2162.541339 \n",  "27660 14.223632 65.406748 7.573250 5.399134 14.200736 \n",  "27661 74.862144 573.887016 81.702022 66.780783 71.886595 \n",  "27662 1969.504037 1605.852235 1416.517118 1745.790685 1682.515928 \n",  "27663 245.184308 313.036807 174.941719 208.131635 220.111451 \n",  "27664 11143.031319 4582.264950 23462.457138 15842.334918 11077.164439 \n",  "27665 5680.257658 3185.417881 9543.830723 8040.947834 5350.061559 \n",  "27666 455.836990 447.302147 5757.862293 1477.957443 528.183888 \n",  "27667 1019.893239 1169.610503 1831.963893 3725.336355 883.380801 \n",  "27668 674.835464 733.293813 1398.364623 2374.786783 567.507471 \n",  "27669 71.100380 130.100209 48.413170 39.951822 79.366150 \n",  "27670 172.397019 77.652671 5343.670130 635.441307 165.760297 \n",  "27671 32.079349 110.133710 198.860338 54.430380 26.400566 \n",  "27672 34.172877 119.120332 94.967471 111.751090 31.443833 \n",  "27673 2585.064576 1481.906426 6325.270464 7169.508507 2214.437912 \n",  "27674 2831.341709 1761.681626 3551.183095 2386.123256 3076.605244 \n",  "27675 387.093189 564.266198 68.064668 638.661214 398.453547 \n",  "27676 2279.579914 1928.305183 15427.302461 10459.959718 3026.056783 \n",  "27677 2181.852143 899.858133 19668.768995 10561.936258 2396.738834 \n",  "27678 19588.307742 13696.526025 19211.521928 30602.395776 20054.265514 \n",  "27679 772.242698 591.329816 1189.807614 1523.473123 695.975900 \n",  "\n",  " mhcflurry 79 \n",  "0 1175.574895 \n",  "1 15777.427472 \n",  "2 218.821497 \n",  "3 103.209533 \n",  "4 86.157611 \n",  "5 533.387993 \n",  "6 282.989902 \n",  "7 329.439928 \n",  "8 240.820089 \n",  "9 868.502679 \n",  "10 2120.478424 \n",  "11 3537.201741 \n",  "12 8201.539185 \n",  "13 5503.108263 \n",  "14 1781.904400 \n",  "15 3389.988758 \n",  "16 728.546885 \n",  "17 1445.428048 \n",  "18 3015.279174 \n",  "19 3962.499784 \n",  "20 338.353540 \n",  "21 8368.901644 \n",  "22 750.479001 \n",  "23 2946.101555 \n",  "24 37455.936779 \n",  "25 22296.724479 \n",  "26 382.737079 \n",  "27 17732.815373 \n",  "28 24198.313575 \n",  "29 3479.754922 \n",  "... ... \n",  "27650 5180.448858 \n",  "27651 718.434273 \n",  "27652 7235.413991 \n",  "27653 236.626449 \n",  "27654 28.785291 \n",  "27655 62.095899 \n",  "27656 570.111053 \n",  "27657 27.965131 \n",  "27658 4067.969954 \n",  "27659 1245.603882 \n",  "27660 53.042656 \n",  "27661 240.199173 \n",  "27662 1105.013233 \n",  "27663 297.084820 \n",  "27664 4122.825718 \n",  "27665 2927.695538 \n",  "27666 309.217351 \n",  "27667 2596.187281 \n",  "27668 1807.753477 \n",  "27669 128.174314 \n",  "27670 62.800866 \n",  "27671 70.350814 \n",  "27672 66.154394 \n",  "27673 3499.440631 \n",  "27674 1348.655309 \n",  "27675 343.711818 \n",  "27676 2103.577319 \n",  "27677 831.409071 \n",  "27678 13187.834441 \n",  "27679 709.660102 \n",  "\n",  "[27680 rows x 87 columns]"  ]  },  "execution_count": 11,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "validation_df_with_mhcflurry_results = pandas.read_csv(\"../data/validation_predictions_full2.csv\")\n",  "validation_df_with_mhcflurry_results"  ]  },  {  "cell_type": "code",  "execution_count": 12,  "metadata": {  "collapsed": false  },  "outputs": [  {  "data": {  "text/html": [  "
\n",  "\n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n", \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  "
allelepeptidelengthmeasnetmhcnetmhcpansmmpmbec_cppmhcflurry 0mhcflurry 1mhcflurry 2...mhcflurry ensemble big dropoutmhcflurry ensemble big dropout imputemhcflurry ensemble big imputemhcflurry ensemble smallmhcflurry ensemble small dropoutmhcflurry ensemble small dropout imputemhcflurry ensemble small imputemhcflurry ensemble allmhcflurry ensemble all imputemhcflurry ensemble all not impute
0H-2-DBAAACNVATA9657.657837154.881662711.213514438.530698466.814768172.641984343.793510...412.970922412.076508127.076246354.9178791032.431732979.070265316.292139382.541823356.850347410.082958
1H-2-DBAAFEFVYV830831.8795026456.542290785.23563510351.42166715087.57442610433.57988110853.152403...11546.34964511523.36547612119.33225710582.77926515236.59411115530.31689410563.99014912481.24016312303.15749012661.900504
2H-2-DBAAFVNDYSL977.44618017.4582227.51622928.05433647.82080716.30379429.588240...35.80039736.33271426.66101214.234040198.349515191.31159336.19037545.44994350.88938640.591910
3H-2-DBAAIANQAAV91.9998629.6382909.74989625.7039582.8878697.43067623.204965...21.97944722.1498545.5141309.57118875.47667273.39704810.31114917.93511617.43646318.448030
4H-2-DBAAIANQAVV91.5170508.5506678.33681228.7739842.5797535.21599317.054924...17.00996617.2105444.0877315.40407566.89828566.2777736.16871213.11781913.02296413.213366
5H-2-DBAAIENYVRF937.844258252.348077114.815362187.06821491.63201077.986067288.144351...308.430443313.295340283.004210138.379134453.930512463.507669126.418515252.636475268.474851237.732466
6H-2-DBAAINFITTM93.155005199.986187389.045145200.909281474.790652183.21505343.296033...47.64485946.92474129.16261875.234690201.404054208.73630869.72888271.02435666.80512475.510064
7H-2-DBAAIPAPPPI93243.3961731059.253725493.173804295.120923623.8788477834.652456178.830163...224.408829201.811546474.297442661.731263203.524213224.200582295.562535298.738170282.208914316.235562
8H-2-DBAAKLNRPPL9654.63617466.37430777.26805938.45917888.91700463.99615560.123046...78.32862576.676509193.105629150.854140187.610007214.239343191.850182152.833062157.065094148.715061
9H-2-DBAALDMVDAL9229.614865547.015963597.035287225.4239215459.146719678.959069605.313435...571.537601693.9720881713.7861381086.358455752.720509709.9416921346.7787601012.5098511032.652955992.759662
10H-2-DBAALQHLRSI9905.7326011686.5530252032.357011698.2324043669.0748003156.4635291692.175239...1775.1789881884.1716931789.6121621947.5196322076.6225092226.7926521964.2658952041.3283481959.7012212126.355477
11H-2-DBAALVRLTAL91106.623784435.511874214.783047378.4425852137.0101573406.4246851367.951646...1244.6853451351.9318851067.4594411329.4814363414.4028643545.2556821204.0863411590.9904491575.4435491606.690770
12H-2-DBAAMVPTGSL91836.5383434055.0853545176.0683201545.25444015245.04609721471.1309395051.710355...5127.1219465209.6255188636.3367727069.6235365894.3434847160.3808335956.9857436491.3269746618.7303696366.375957
HLA-A6802130.954562H-2-DB0.870482AANSPWAPV0.60285690.9683594325.1383100.900000903.6494740.6402011023.2929920.968413557.1857490.8898941446.5783360.6326604093.6316560.9591731124.045813...0.9226361076.4006470.6523321156.2493280.9641971603.5944060.9002931313.0228760.6532163179.3420160.9657934114.0098360.9287751362.9645050.6295301746.6195666691795.65944647681698.918976
HLA-A3001140.888740H-2-DB0.730864AAPSGAAPL0.50209090.8814432.8444610.73791397.9489990.499390501.1872340.889599822.2426500.74559277.7616770.521544116.2510520.893689658.194668...0.731959816.3801400.456482805.2796340.871974141.5068790.746114150.4170600.4598571461.8722110.8699351395.2384430.692875137.2382510.505244374.282265660384.3367992040364.490764
HLA-A0203150.950892H-2-DB0.916566AAPVSEPTV0.53431590.976453106.9054880.9513642654.6055620.5734781918.6687410.9743241870.6821400.9537371627.4372430.5928122005.2047560.9703912467.857734...0.9486262343.5023050.5869112144.1532400.9741582390.5956160.9445782085.1009070.5914632197.4789760.9728852406.3066190.9467461636.7374260.5839082047.7886046512119.69306855421978.323290
HLA-B3901160.953506H-2-DB0.705882AAVANGFAA0.29743590.95136483.3681180.734694205.1162180.295161228.5598800.960260200.4472030.72340440.5386210.303500116.6590860.951948382.503402...0.750000361.3946440.305138373.2430720.98006583.8241000.744186338.9448630.316739520.3835200.949708465.3477890.708333339.7796960.296639257.850466641265.206359886250.698599
HLA-B1501170.914988H-2-DB0.793503AAVLLGAPV0.56938490.933960373.2501580.831050320.6269320.585046623.7348350.937243286.4177970.82973639.3306100.590098408.6388240.929187605.753153...0.846512643.2306540.591735660.1335090.935596130.7125520.823245409.3863380.5890971192.9285060.9360631265.1909370.819048451.5961650.590100489.354829633471.2092943213508.199121
HLA-B1517180.910482H-2-DB0.661088AAVQLLFPA0.40731190.921477347.5361610.6611572494.5947270.4171645152.2864460.911692679.2036330.669604250.5525880.402892681.4964200.9018191427.626931...0.6379311610.6228240.4224971769.5224890.934516873.3944170.7102801388.4162770.4485752652.8859920.8996202526.0150000.6525422755.8761040.4065821614.6568915821811.0920668461439.527524
HLA-A2402190.851004H-2-DB0.653659AAVTAGVAL0.53571490.853637229.6148650.6491651552.3870100.5515222172.7011790.8707121927.5249130.5853662506.2913050.585672780.9196380.8685982868.849059...0.6329112660.5999930.5757102573.8520380.892876767.5269520.6930692439.7483340.6006862815.8232600.8489152720.4106700.6334163073.3470690.5375891929.9761305732015.95494725331847.664238
H-2-DB200.887624H-2-DB0.611321AAVVNRSLV0.59837090.9072998.6099380.66666726.3026800.63111029.5801250.89443363.8263490.56410310.6128320.62178819.7487200.88939359.138583...0.62121272.2714510.60033770.0764910.87457411.8643780.57723626.4145140.574262268.0409840.884187283.3893990.62857121.2613970.57125250.36947756447.309480321653.627395
H-2-KB210.866649H-2-DB0.794613AAYVPADAV0.52709690.900377331.8944580.7978531757.9236140.5703173206.2693250.910039595.6621440.8121659645.6585320.56523011279.3049470.9081041835.991854...0.8136751722.6978420.5731991747.8051240.8255652083.2611610.6653542101.5853940.4868364997.2699500.9159946096.2201970.8599671804.1174260.5892182692.2074245582515.59395934072881.220473
HLA-B3501220.828050H-2-DB0.737903ACMVNLERL0.50089690.831002737.9042300.722656239.3315760.524182679.2036330.829343444.6312670.7221101891.4270690.519938521.1017460.822469520.331052...0.712000654.1401780.515205664.4748230.8362811412.6056200.711027564.2549170.514413819.0752110.823734894.7039520.705411714.3775010.501630866.913344542880.0891072397853.934834
HLA-A6801230.926693H-2-DB0.904494ADLVNHPPV0.51960890.945221558.4701950.9196051694.3378000.5717601857.8044550.941744325.0872970.9050284042.2363810.556709954.0534820.9303631131.217632...0.9247911304.5582990.5714031229.5930690.9489075570.9140590.923944929.7562000.5995623301.9704990.9445533481.2331050.924347610.7729020.5564181963.4258585271953.55293131841973.348682
HLA-B0802240.978728H-2-DB0.285714AEMEEALKG0.36189490.96492478523.5634610.16000041304.7501990.34163346989.4108610.980878440554.8635070.00000048819.1822110.35848843577.0473330.96605641487.708042...0.19047641659.0018940.39383341837.7854290.98959048392.8073670.57142943698.4732300.41057935656.6577870.98721435933.9243620.10526343211.0204280.38583842130.17961950942107.76293948742152.608233
HLA-B1801250.775263H-2-DB0.324324AFFAFRYV0.20132580.81150487902.2516830.35897418967.0592120.24180312882.4955170.7744367816.2780460.33333317412.9618930.2311778603.3894750.76864722533.909280...0.35897423595.5572880.23711823748.4518230.78954913479.4314100.38095214242.7831050.23420121776.6718410.78778222004.8047300.31578913645.1610280.21553418168.14916950317607.624386205218746.517815
HLA-B5301260.836274H-2-DB0.716279AGLDNKFYL0.51127590.849549659.1738950.740566357.2728380.528186202.7682720.834934260.0159560.71226432.4668860.518640374.1950200.851550216.595300...0.733813226.1803010.515585242.1275290.885722127.8042110.753623301.8521900.559543477.3132880.821328502.5913570.734177303.1725470.495308258.410869485262.0435991018254.828500
HLA-A3301270.912425H-2-DB0.822857AGLLFVLL0.57939480.92404387902.2516830.86330914996.8483550.6005999885.5309470.92263526242.1854340.85027717654.3207700.59327917139.8225790.91769916697.495982...0.86832716861.7000020.58711217069.5975840.93115622898.5295570.82917517056.3113360.61214718450.4826380.90741418900.1819190.85509818420.4706920.57215819167.88427547319206.551553304019129.294844
HLA-A6901280.958853H-2-DB0.638889AGLQVINL0.33818980.96483059429.2158620.66666725061.0925300.34278912560.2996370.95694735399.7341080.70000031484.0032290.32578533545.6626150.94248126437.149676...0.69841327514.0211100.33533927636.5321470.94425731236.5589020.68085130641.4667150.32743224382.9791250.95486824418.5811540.68965532544.8711750.32249828800.71419447028779.777262207928821.666357
HLA-B1509290.852442H-2-DB0.487805AGLVSFNFL0.29886990.871854210.8628150.315789620.8690340.3311612285.5988030.8806911811.3400930.1290321972.8362360.330301630.4586530.8178021812.154993...0.1875002064.4222550.3543111886.5170560.9229072135.5683810.176471939.6737140.4480994363.9852610.8946184371.8703000.187500972.2968820.3646732049.1400614662034.2770293462064.111687
HLA-A3201...0.884704...0.699690...0.512869...0.893682...0.708861...0.514653...0.900643...0.777778...0.484062...0.900451....................................0.7728810.4482840.9071610.7664230.4806690.8320130.5807960.493693449640
HLA-B5801276500.894775Mamu-A020.832512YNTVCVIW0.55939280.904312909.9132730.835821734.5138680.57168810023.0523810.90726148.8652360.82564111822.9079600.5879198396.8663770.9034637112.873873...0.8274117604.8428340.5451327479.2822820.8820166258.2963790.8051959231.0217680.5315085156.2320100.9056455035.6234140.8177578607.0960360.5820266928.8658144456711.29742725647153.487383
HLA-B270327651NaNMamu-A020.000000YRHDGGNVL0.0189799NaN78342.9642770.0000001355.1894120.06060922233.098906NaN1409.2887980.0000002553.293884-0.0278561061.021624NaN1050.845801...1237.8162841182.4981701172.8734191764.4367781111.6722931060.2937501876.5310941329.0760331288.8678691370.538551
27652Mamu-A02YSEGQYMNTP107362.0709752958.0124678709.6359004477.1330423862.2897482829.0805013857.430334...3603.8805093030.6598335563.5136546258.7380644524.9414604375.4534546060.1780414805.9788104598.3148115023.021101
27653Mamu-A02YSEVALNVTES117709.0346911682.6740615105.05000051.522864602.395338540.214499382.353838...0.000000339.5723290.053658301.199532NaN601.5293410.000000643.6895470.067451251.163750NaN275.2787580.000000575.304332NaN411.355669441411.571566433411.139885
HLA-A3002276540.711574Mamu-A020.619512YSLVFVILM0.31522790.7289811256.0299640.62278517.4984670.33400049.4310690.7420426.3241190.6451616.5340850.34358312.2455280.73841314.057669...0.66343812.6767720.34216112.3342420.7327497.5123220.6112608.4058530.32057727.7097160.75427127.2219910.7041047.8206120.35495611.86497542011.851187143011.878780
HLA-A2501276550.975669Mamu-A020.363636YSQIGAGVY0.14643090.9727491.9998620.38095217.8648760.14568115.3461700.97712916.2929600.60000015.8498060.14703010.1594810.97177643.079177...0.66666739.6672290.15183638.2879520.99854024.3377110.88888916.8237080.15396858.1387360.99270164.1075200.72727318.6761030.15199731.69657241632.50006851930.912940
HLA-A2602276560.902721Mamu-A020.713615YSRDLICEQS0.469627100.9262691059.2537250.7464111297.1792710.4933763863.6697710.930901220.2926460.786070941.9072320.518496388.8035230.920672516.415889...0.766839504.1332000.525365457.4066480.957811487.2068500.839378444.4161360.561093735.2950450.942981794.5981330.790244541.0394090.531805562.468684413556.349977202568.654684
HLA-B4402276570.869757Mamu-A020.682292YSYKAFIKY0.50640590.8681962.3173950.6011564.2854850.5130613.0902950.8871971.7782790.5175725.4764520.54420930.2878870.88950313.697417...0.56880711.4455500.57491611.4950520.9345544.7758200.6071436.5683780.59896032.9649320.80201838.1035140.5706526.1104090.37790010.63757941110.632822170510.642338
HLA-B4001276580.895389Mamu-A020.735043YSYKAFIKYP0.580586100.9066504830.5880200.7230321199.4993030.6024341753.8805020.9127643111.7163370.6809821948.3113900.6122481887.0882370.9225031719.075267...0.8297871791.1575100.6353081546.2919040.9206782058.0953900.8455702512.5672400.6194183027.3413680.8623313013.7921800.6744872392.6213100.5207252254.0384324072188.69911627182321.328325
HLA-A2301276590.840581Mamu-A020.710602YSYKAFIKYPE0.556410110.8738454897.7881940.773481671.4288530.5962262666.8586650.87058042.5598410.7433632940.1083930.5829371753.5134950.8714031992.582402...0.7738422027.9172740.6055981893.3705900.8952292396.0769010.7884061967.1376490.6369442491.6960680.8493812395.8032090.7450002137.1043990.5612592248.1625293912195.34770620212302.247951
Mamu-A02276600.876989Mamu-A020.682216YTAFTLPSV0.50432990.870053101.6248690.66855532.2106880.50761452.8445250.85399291.8332600.6666674.5728520.4853964.4608200.82606814.724639...0.76712314.1619280.59896414.6290420.8830876.4394830.7480926.1988000.52462250.4486560.81069248.0797630.6400007.3806680.47858913.22682138813.52169793812.938375
HLA-A8001276610.966590Mamu-A020.344828YTAFTLPSVN0.175280100.9884792529.2979960.560000236.5919700.1942321406.0475240.98540714.4877190.46153865.0773770.18029357.6596360.97119893.229936...0.43478390.5142130.18237482.4538380.98079982.9879970.43478358.4324470.186524276.7680610.990015231.6524120.51851960.8333030.183987101.77870837999.094853782104.535252
HLA-B4403276620.785885Mamu-A020.677333YTDGSCNKQS0.419995100.81193711091.7481530.7328244345.1022420.45056011246.0497400.813593588.8436550.6139821636.0849770.4623642050.4302310.8056481818.078082...0.7663041579.4904360.5410661417.0898150.8910471162.9034850.7759561666.6942110.5878241347.5402850.7964541407.6303270.7549021675.0271270.4320211430.4746513781403.9863239131457.462722
HLA-B460127663NaNMamu-A020.000000YTGDFDSVINaN9NaN215.2781730.000000354.813389NaN42.461956NaN40.5508540.000000282.773627NaN61.811464NaN203.244505...0.000000211.238553NaN201.105289NaN108.5366310.000000258.973559NaN260.492701NaN312.6128320.000000349.272026NaN217.862273378220.9492891424214.818388
HLA-B3801276640.901216Mamu-A020.000000YTPKVVGG0.50035980.90911970145.5298420.00000017947.3362680.51573213995.8732260.9219523140.5086940.00000028699.4470190.52452718917.4169650.72576811333.871219...0.00000011428.8550780.51326911689.6615320.98007423630.0267910.00000018143.4055620.6521734168.0827920.9492064559.1643860.00000019072.1902820.54743812198.05287735112449.10108313611952.067302
HLA-B2705276650.945675Mamu-A020.571429YTPKVVGGIGG0.416364110.94458670145.5298420.5098049418.8959650.42400510046.1579030.948578387.2576450.48979610653.3879100.43821910389.2900520.9374475383.389946...0.2857145476.1809340.4305615615.0006430.9438608909.9384640.4000009591.8435020.3772082761.8639040.9416822998.1845000.3043489070.4241850.4168846112.3591743146073.34031030286151.628720
HLA-A2603276660.860835Mamu-A020.529412YTSGPGIR0.32088580.86358716865.5302540.537313619.4410750.3156342349.6328210.86260480.7235030.5185194905.8694430.3048493486.5880650.834005482.922794...0.542373444.3615520.366317481.5667530.9343004389.7509240.5818182042.3116570.426438367.2353450.843194414.5812050.5090911608.6655970.3067411099.9571543121089.6648442051110.346678
Mamu-A01276670.847141Mamu-A020.583333YTSGPGIRYP0.455049100.8891777128.5303010.643836783.4296430.5060965176.0683200.9227771270.5741050.7164182079.2837780.5275951463.6206650.917658894.140283...0.6949151021.4989610.569423879.8638490.9127552018.1897640.7068972021.3450290.5390131563.0550450.8393901463.1560160.6092721681.7152550.4699751534.0729622741445.78975722641627.746940
HLA-B0803276680.952593Mamu-A020.000000YTSGPGTRYP0.302768100.8869143097.4192990.000000483.0588020.2739435420.0089040.957037797.9946870.0000001746.1380670.309651995.8371000.407901561.597714...0.000000668.2941980.318249576.0002620.9523461797.4521660.0000001566.8225640.3159781028.1268900.9733331020.4372930.0000001285.7977450.3142661118.5609752341079.5922322171158.936326
H-2-KD276690.765223Mamu-A020.613333YTSGPGTRYPM0.336723110.76480825.9417940.56944439.1741880.3237007.7446180.76688276.3835780.54545565.7829530.34812932.0580590.75410774.582612...0.65771873.9965780.40327573.6439510.81918970.6800620.64557057.0143430.390333137.0171240.753692132.4396400.53846263.4857290.36524779.38053922981.33585345277.472231
HLA-B1503276700.788338Mamu-A020.477064YTTGGTSR0.36137180.82047870145.5298420.476190357.2728380.3777225701.6427230.839991100.2305240.5370374867.9553660.4131242688.4309360.802112159.755152...0.592593149.3140110.468922162.0794320.8700642732.7035560.5882351276.7108040.52257774.7096330.83941791.0083650.5233641025.8215270.444917453.623055165450.939613429456.322467
HLA-A0202276710.833980Mamu-A020.720000YTTGGTSRN0.56148490.89329336897.7598570.764045186.6379690.6147036025.5958610.903271119.6740530.791209268.0251590.64131284.1689010.91324836.777590...0.75555634.8105390.62714332.0822600.898697151.0353190.76923171.0084080.62428066.4047340.88220665.4307840.72727355.3090690.60693871.61146812664.711354391979.247336
HLA-A2902276720.890924Mamu-A020.700000YTTTGASRN0.62045590.884819587.4893530.666667135.5189410.6493142844.4611070.87301687.0963590.64406891.7683230.621376120.1993110.86202737.542691...0.64406838.7700580.61983034.9455540.882377113.3389510.63333381.1538660.64125768.8896170.87179564.4270060.65517262.1643240.61236472.54419311863.109548239783.389283
27673Mamu-A02YTYEAYVRYP102624.2185431552.3870103872.5764491954.3394565516.6012123207.8349542203.500262...2470.0888902189.1487765592.8378384632.3472432486.0834012571.4500514915.0724953555.4223103526.9871823584.086686
27674Mamu-A02YTYEAYVRYPE111905.460718864.9679196998.41996032.7340694316.8894841492.3388822768.632417...2925.8058472672.5939213516.5711512870.2794242542.8215362543.5068443133.5543582976.0606072941.9184653010.598981
27675Mamu-A02YVADALAAF915.381546453.94161771.285303108.14339573.800771431.698036320.442212...330.599717325.72813981.573509296.494841424.188197409.284111378.668749261.260451253.321583269.448116
HLA-B5401276760.800000Mamu-A020.727273YVFPVIFSK0.29578790.81621639264.4935400.6666672098.9398840.3148225610.4797600.800000901.5711380.72727316244.4615980.3118948409.0867210.7972973114.359914...0.8000002980.5580010.3002523312.0654290.84594617560.6182510.7272736405.5559070.3498262085.8386730.8391892419.3708910.7272739950.7419100.3336005485.878564796117.15036110194919.752146
HLA-B4002276770.916667Mamu-A020.764706YVFPVIFSR0.49430090.90873036728.2300500.6896552333.4580620.48184510046.1579030.9345242600.1595630.75862122634.8879500.49352210567.0444060.9246032196.918342...0.7586211925.4070820.4562422131.5987170.91865121847.7726910.9090917014.5225770.518720979.3577260.9345241149.7715140.75862111502.1985770.4555484447.784250744981.6849228663971.103159
HLA-B4501276780.996667Mamu-A020.750000YVPCHIRQI0.23004591.00000010764.6521360.75000021134.8903980.2476216039.4862940.99666710568.1750920.57142920710.5599990.23831612170.6772350.99333320094.652790...1.00000018715.8886970.26357418569.8714730.99333316359.2538060.80000017813.6034180.24642613002.0105001.00000013171.9007950.88888921474.8203370.25130116829.1029016517121.33380888916541.859860
27679Mamu-A02YVVQMLARL9152.405275232.273680739.605275105.681751528.261756625.062058724.556640...618.533368634.952392609.348300868.508729633.270834563.941437887.179059678.365819663.304608693.769015
\n",
  "

55 "

27680  rows × 35 98  columns

\n", "
"
  ],  "text/plain": [  " mhcflurry 0_auc mhcflurry 0_f1 mhcflurry 0_tau mhcflurry 1_auc allele peptide length meas netmhc  \\\n", "allele \n",  "HLA-A0201 0.899123 0.837826 0.554988 0.926853 \n",  "HLA-A0301 0.891561 0.834236 0.540025 0.922007 \n",  "HLA-A0201 0.899123 0.837826 0.554988 0.926853 \n",  "HLA-A0301 0.891561 0.834236 0.540025 0.922007 \n",  "HLA-A2601 0.928084 0.580000 0.432299 0.929260 \n",  "HLA-B0801 0.942694 0.762931 0.600817 0.949517 \n",  "HLA-B5101 0.933050 0.489796 0.369192 0.939082 \n",  "HLA-B5701 0.914240 0.750000 0.524933 0.916777 \n",  "HLA-B0702 0.904985 0.792711 0.564505 0.915801 \n",  "HLA-A3101 0.828510 0.782609 0.460554 0.854838 \n",  "HLA-A1101 0.920368 0.872077 0.579906 0.936520 \n",  "HLA-A0101 0.912746 0.621762 0.521720 0.924911 \n",  "HLA-A0206 0.876067 0.849449 0.465713 0.909081 \n",  "HLA-A6802 0.954562 0.870482 0.602856 0.968359 \n",  "HLA-A3001 0.888740 0.730864 0.502090 0.881443 \n",  "HLA-A0203 0.950892 0.916566 0.534315 0.976453 \n",  "HLA-B3901 0.953506 0.705882 0.297435 0.951364 \n",  "HLA-B1501 0.914988 0.793503 0.569384 0.933960 \n",  "HLA-B1517 0.910482 0.661088 0.407311 0.921477 \n",  "HLA-A2402 0.851004 0.653659 0.535714 0.853637 \n",  "H-2-DB 0.887624 0.611321 0.598370 0.907299 \n",  "H-2-KB 0.866649 0.794613 0.527096 0.900377 \n",  "HLA-B3501 0.828050 0.737903 0.500896 0.831002 \n",  "HLA-A6801 0.926693 0.904494 0.519608 0.945221 \n",  "HLA-B0802 0.978728 0.285714 0.361894 0.964924 \n",  "HLA-B1801 0.775263 0.324324 0.201325 0.811504 \n",  "HLA-B5301 0.836274 0.716279 0.511275 0.849549 \n",  "HLA-A3301 0.912425 0.822857 0.579394 0.924043 \n",  "HLA-A6901 0.958853 0.638889 0.338189 0.964830 \n",  "HLA-B1509 0.852442 0.487805 0.298869 0.871854 \n",  "HLA-A3201 0.884704 0.699690 0.512869 0.893682 \n",  "HLA-B5801 0.894775 0.832512 0.559392 0.904312 \n",  "HLA-B2703 NaN 0.000000 0.018979 NaN \n",  "HLA-A3002 0.711574 0.619512 0.315227 0.728981 \n",  "HLA-A2501 0.975669 0.363636 0.146430 0.972749 \n",  "HLA-A2602 0.902721 0.713615 0.469627 0.926269 \n",  "HLA-B4402 0.869757 0.682292 0.506405 0.868196 \n",  "HLA-B4001 0.895389 0.735043 0.580586 0.906650 \n",  "HLA-A2301 0.840581 0.710602 0.556410 0.873845 \n",  "Mamu-A02 0.876989 0.682216 0.504329 0.870053 \n",  "HLA-A8001 0.966590 0.344828 0.175280 0.988479 \n",  "HLA-B4403 0.785885 0.677333 0.419995 0.811937 \n",  "HLA-B4601 NaN 0.000000 NaN NaN \n",  "HLA-B3801 0.901216 0.000000 0.500359 0.909119 \n",  "HLA-B2705 0.945675 0.571429 0.416364 0.944586 \n",  "HLA-A2603 0.860835 0.529412 0.320885 0.863587 \n",  "Mamu-A01 0.847141 0.583333 0.455049 0.889177 \n",  "HLA-B0803 0.952593 0.000000 0.302768 0.886914 \n",  "H-2-KD 0.765223 0.613333 0.336723 0.764808 \n",  "HLA-B1503 0.788338 0.477064 0.361371 0.820478 \n",  "HLA-A0202 0.833980 0.720000 0.561484 0.893293 \n",  "HLA-A2902 0.890924 0.700000 0.620455 0.884819 \n",  "HLA-B5401 0.800000 0.727273 0.295787 0.816216 \n",  "HLA-B4002 0.916667 0.764706 0.494300 0.908730 \n",  "HLA-B4501 0.996667 0.750000 0.230045 1.000000 "0 H-2-DB AAACNVATA 9 657.657837 154.881662 \n",  "1 H-2-DB AAFEFVYV 8 30831.879502 6456.542290 \n",  "2 H-2-DB AAFVNDYSL 9 77.446180 17.458222 \n",  "3 H-2-DB AAIANQAAV 9 1.999862 9.638290 \n",  "4 H-2-DB AAIANQAVV 9 1.517050 8.550667 \n",  "5 H-2-DB AAIENYVRF 9 37.844258 252.348077 \n",  "6 H-2-DB AAINFITTM 9 3.155005 199.986187 \n",  "7 H-2-DB AAIPAPPPI 9 3243.396173 1059.253725 \n",  "8 H-2-DB AAKLNRPPL 9 654.636174 66.374307 \n",  "9 H-2-DB AALDMVDAL 9 229.614865 547.015963 \n",  "10 H-2-DB AALQHLRSI 9 905.732601 1686.553025 \n",  "11 H-2-DB AALVRLTAL 9 1106.623784 435.511874 \n",  "12 H-2-DB AAMVPTGSL 9 1836.538343 4055.085354 \n",  "13 H-2-DB AANSPWAPV 9 4325.138310 903.649474 \n",  "14 H-2-DB AAPSGAAPL 9 2.844461 97.948999 \n",  "15 H-2-DB AAPVSEPTV 9 106.905488 2654.605562 \n",  "16 H-2-DB AAVANGFAA 9 83.368118 205.116218 \n",  "17 H-2-DB AAVLLGAPV 9 373.250158 320.626932 \n",  "18 H-2-DB AAVQLLFPA 9 347.536161 2494.594727 \n",  "19 H-2-DB AAVTAGVAL 9 229.614865 1552.387010 \n",  "20 H-2-DB AAVVNRSLV 9 8.609938 26.302680 \n",  "21 H-2-DB AAYVPADAV 9 331.894458 1757.923614 \n",  "22 H-2-DB ACMVNLERL 9 737.904230 239.331576 \n",  "23 H-2-DB ADLVNHPPV 9 558.470195 1694.337800 \n",  "24 H-2-DB AEMEEALKG 9 78523.563461 41304.750199 \n",  "25 H-2-DB AFFAFRYV 8 87902.251683 18967.059212 \n",  "26 H-2-DB AGLDNKFYL 9 659.173895 357.272838 \n",  "27 H-2-DB AGLLFVLL 8 87902.251683 14996.848355 \n",  "28 H-2-DB AGLQVINL 8 59429.215862 25061.092530 \n",  "29 H-2-DB AGLVSFNFL 9 210.862815 620.869034 \n",  "... ... ... ... ... ... \n",  "27650 Mamu-A02 YNTVCVIW 8 909.913273 734.513868 \n",  "27651 Mamu-A02 YRHDGGNVL 9 78342.964277 1355.189412 \n",  "27652 Mamu-A02 YSEGQYMNTP 10 7362.070975 2958.012467 \n",  "27653 Mamu-A02 YSEVALNVTES 11 7709.034691 1682.674061 \n",  "27654 Mamu-A02 YSLVFVILM 9 1256.029964 17.498467 \n",  "27655 Mamu-A02 YSQIGAGVY 9 1.999862 17.864876 \n",  "27656 Mamu-A02 YSRDLICEQS 10 1059.253725 1297.179271 \n",  "27657 Mamu-A02 YSYKAFIKY 9 2.317395 4.285485 \n",  "27658 Mamu-A02 YSYKAFIKYP 10 4830.588020 1199.499303 \n",  "27659 Mamu-A02 YSYKAFIKYPE 11 4897.788194 671.428853 \n",  "27660 Mamu-A02 YTAFTLPSV 9 101.624869 32.210688 \n",  "27661 Mamu-A02 YTAFTLPSVN 10 2529.297996 236.591970 \n",  "27662 Mamu-A02 YTDGSCNKQS 10 11091.748153 4345.102242 \n",  "27663 Mamu-A02 YTGDFDSVI 9 215.278173 354.813389 \n",  "27664 Mamu-A02 YTPKVVGG 8 70145.529842 17947.336268 \n",  "27665 Mamu-A02 YTPKVVGGIGG 11 70145.529842 9418.895965 \n",  "27666 Mamu-A02 YTSGPGIR 8 16865.530254 619.441075 \n",  "27667 Mamu-A02 YTSGPGIRYP 10 7128.530301 783.429643 \n",  "27668 Mamu-A02 YTSGPGTRYP 10 3097.419299 483.058802 \n",  "27669 Mamu-A02 YTSGPGTRYPM 11 25.941794 39.174188 \n",  "27670 Mamu-A02 YTTGGTSR 8 70145.529842 357.272838 \n",  "27671 Mamu-A02 YTTGGTSRN 9 36897.759857 186.637969 \n",  "27672 Mamu-A02 YTTTGASRN 9 587.489353 135.518941 \n",  "27673 Mamu-A02 YTYEAYVRYP 10 2624.218543 1552.387010 \n",  "27674 Mamu-A02 YTYEAYVRYPE 11 1905.460718 864.967919 \n",  "27675 Mamu-A02 YVADALAAF 9 15.381546 453.941617 \n",  "27676 Mamu-A02 YVFPVIFSK 9 39264.493540 2098.939884 \n",  "27677 Mamu-A02 YVFPVIFSR 9 36728.230050 2333.458062 \n",  "27678 Mamu-A02 YVPCHIRQI 9 10764.652136 21134.890398 \n",  "27679 Mamu-A02 YVVQMLARL 9 152.405275 232.273680  \n", "\n",  " netmhcpan smmpmbec_cpp  mhcflurry 1_f1 0  mhcflurry 1_tau 1  mhcflurry 2_auc mhcflurry 2_f1 2  \\\n", "allele \n",  "HLA-A0201 0.870671 0.623314 0.925713 0.881167 \n",  "HLA-A0301 0.892147 0.595890 0.923343 0.879402 \n",  "HLA-A0201 0.870671 0.623314 0.925713 0.881167 \n",  "HLA-A0301 0.892147 0.595890 0.923343 0.879402 \n",  "HLA-A2601 0.593103 0.440722 0.931760 0.574899 \n",  "HLA-B0801 0.773504 0.620342 0.948274 0.778523 \n",  "HLA-B5101 0.391304 0.369359 0.948141 0.404762 \n",  "HLA-B5701 0.740299 0.535227 0.922818 0.670886 \n",  "HLA-B0702 0.866525 0.594497 0.909308 0.835526 \n",  "HLA-A3101 0.822500 0.510287 0.847235 0.817610 \n",  "HLA-A1101 0.883152 0.615351 0.936927 0.884298 \n",  "HLA-A0101 0.659794 0.531596 0.909260 0.586207 \n",  "HLA-A0206 0.872236 0.528876 0.900025 0.868712 \n",  "HLA-A6802 0.900000 0.640201 0.968413 0.889894 \n",  "HLA-A3001 0.737913 0.499390 0.889599 0.745592 \n",  "HLA-A0203 0.951364 0.573478 0.974324 0.953737 \n",  "HLA-B3901 0.734694 0.295161 0.960260 0.723404 \n",  "HLA-B1501 0.831050 0.585046 0.937243 0.829736 \n",  "HLA-B1517 0.661157 0.417164 0.911692 0.669604 \n",  "HLA-A2402 0.649165 0.551522 0.870712 0.585366 \n",  "H-2-DB 0.666667 0.631110 0.894433 0.564103 \n",  "H-2-KB 0.797853 0.570317 0.910039 0.812165 \n",  "HLA-B3501 0.722656 0.524182 0.829343 0.722110 \n",  "HLA-A6801 0.919605 0.571760 0.941744 0.905028 \n",  "HLA-B0802 0.160000 0.341633 0.980878 0.000000 \n",  "HLA-B1801 0.358974 0.241803 0.774436 0.333333 \n",  "HLA-B5301 0.740566 0.528186 0.834934 0.712264 \n",  "HLA-A3301 0.863309 0.600599 0.922635 0.850277 \n",  "HLA-A6901 0.666667 0.342789 0.956947 0.700000 \n",  "HLA-B1509 0.315789 0.331161 0.880691 0.129032 \n",  "HLA-A3201 0.708861 0.514653 0.900643 0.777778 \n",  "HLA-B5801 0.835821 0.571688 0.907261 0.825641 \n",  "HLA-B2703 0.000000 0.060609 NaN 0.000000 \n",  "HLA-A3002 0.622785 0.334000 0.742042 0.645161 \n",  "HLA-A2501 0.380952 0.145681 0.977129 0.600000 \n",  "HLA-A2602 0.746411 0.493376 0.930901 0.786070 \n",  "HLA-B4402 0.601156 0.513061 0.887197 0.517572 \n",  "HLA-B4001 0.723032 0.602434 0.912764 0.680982 \n",  "HLA-A2301 0.773481 0.596226 0.870580 0.743363 \n",  "Mamu-A02 0.668555 0.507614 0.853992 0.666667 \n",  "HLA-A8001 0.560000 0.194232 0.985407 0.461538 \n",  "HLA-B4403 0.732824 0.450560 0.813593 0.613982 \n",  "HLA-B4601 0.000000 NaN NaN 0.000000 \n",  "HLA-B3801 0.000000 0.515732 0.921952 0.000000 \n",  "HLA-B2705 0.509804 0.424005 0.948578 0.489796 \n",  "HLA-A2603 0.537313 0.315634 0.862604 0.518519 \n",  "Mamu-A01 0.643836 0.506096 0.922777 0.716418 \n",  "HLA-B0803 0.000000 0.273943 0.957037 0.000000 \n",  "H-2-KD 0.569444 0.323700 0.766882 0.545455 \n",  "HLA-B1503 0.476190 0.377722 0.839991 0.537037 \n",  "HLA-A0202 0.764045 0.614703 0.903271 0.791209 \n",  "HLA-A2902 0.666667 0.649314 0.873016 0.644068 \n",  "HLA-B5401 0.666667 0.314822 0.800000 0.727273 \n",  "HLA-B4002 0.689655 0.481845 0.934524 0.758621 \n",  "HLA-B4501 0.750000 0.247621 0.996667 0.571429 "0 711.213514 438.530698 466.814768 172.641984 343.793510 \n",  "1 785.235635 10351.421667 15087.574426 10433.579881 10853.152403 \n",  "2 7.516229 28.054336 47.820807 16.303794 29.588240 \n",  "3 9.749896 25.703958 2.887869 7.430676 23.204965 \n",  "4 8.336812 28.773984 2.579753 5.215993 17.054924 \n",  "5 114.815362 187.068214 91.632010 77.986067 288.144351 \n",  "6 389.045145 200.909281 474.790652 183.215053 43.296033 \n",  "7 493.173804 295.120923 623.878847 7834.652456 178.830163 \n",  "8 77.268059 38.459178 88.917004 63.996155 60.123046 \n",  "9 597.035287 225.423921 5459.146719 678.959069 605.313435 \n",  "10 2032.357011 698.232404 3669.074800 3156.463529 1692.175239 \n",  "11 214.783047 378.442585 2137.010157 3406.424685 1367.951646 \n",  "12 5176.068320 1545.254440 15245.046097 21471.130939 5051.710355 \n",  "13 1023.292992 557.185749 1446.578336 4093.631656 1124.045813 \n",  "14 501.187234 822.242650 77.761677 116.251052 658.194668 \n",  "15 1918.668741 1870.682140 1627.437243 2005.204756 2467.857734 \n",  "16 228.559880 200.447203 40.538621 116.659086 382.503402 \n",  "17 623.734835 286.417797 39.330610 408.638824 605.753153 \n",  "18 5152.286446 679.203633 250.552588 681.496420 1427.626931 \n",  "19 2172.701179 1927.524913 2506.291305 780.919638 2868.849059 \n",  "20 29.580125 63.826349 10.612832 19.748720 59.138583 \n",  "21 3206.269325 595.662144 9645.658532 11279.304947 1835.991854 \n",  "22 679.203633 444.631267 1891.427069 521.101746 520.331052 \n",  "23 1857.804455 325.087297 4042.236381 954.053482 1131.217632 \n",  "24 46989.410861 440554.863507 48819.182211 43577.047333 41487.708042 \n",  "25 12882.495517 7816.278046 17412.961893 8603.389475 22533.909280 \n",  "26 202.768272 260.015956 32.466886 374.195020 216.595300 \n",  "27 9885.530947 26242.185434 17654.320770 17139.822579 16697.495982 \n",  "28 12560.299637 35399.734108 31484.003229 33545.662615 26437.149676 \n",  "29 2285.598803 1811.340093 1972.836236 630.458653 1812.154993 \n",  "... ... ... ... ... ... \n",  "27650 10023.052381 48.865236 11822.907960 8396.866377 7112.873873 \n",  "27651 22233.098906 1409.288798 2553.293884 1061.021624 1050.845801 \n",  "27652 8709.635900 4477.133042 3862.289748 2829.080501 3857.430334 \n",  "27653 5105.050000 51.522864 602.395338 540.214499 382.353838 \n",  "27654 49.431069 6.324119 6.534085 12.245528 14.057669 \n",  "27655 15.346170 16.292960 15.849806 10.159481 43.079177 \n",  "27656 3863.669771 220.292646 941.907232 388.803523 516.415889 \n",  "27657 3.090295 1.778279 5.476452 30.287887 13.697417 \n",  "27658 1753.880502 3111.716337 1948.311390 1887.088237 1719.075267 \n",  "27659 2666.858665 42.559841 2940.108393 1753.513495 1992.582402 \n",  "27660 52.844525 91.833260 4.572852 4.460820 14.724639 \n",  "27661 1406.047524 14.487719 65.077377 57.659636 93.229936 \n",  "27662 11246.049740 588.843655 1636.084977 2050.430231 1818.078082 \n",  "27663 42.461956 40.550854 282.773627 61.811464 203.244505 \n",  "27664 13995.873226 3140.508694 28699.447019 18917.416965 11333.871219 \n",  "27665 10046.157903 387.257645 10653.387910 10389.290052 5383.389946 \n",  "27666 2349.632821 80.723503 4905.869443 3486.588065 482.922794 \n",  "27667 5176.068320 1270.574105 2079.283778 1463.620665 894.140283 \n",  "27668 5420.008904 797.994687 1746.138067 995.837100 561.597714 \n",  "27669 7.744618 76.383578 65.782953 32.058059 74.582612 \n",  "27670 5701.642723 100.230524 4867.955366 2688.430936 159.755152 \n",  "27671 6025.595861 119.674053 268.025159 84.168901 36.777590 \n",  "27672 2844.461107 87.096359 91.768323 120.199311 37.542691 \n",  "27673 3872.576449 1954.339456 5516.601212 3207.834954 2203.500262 \n",  "27674 6998.419960 32.734069 4316.889484 1492.338882 2768.632417 \n",  "27675 71.285303 108.143395 73.800771 431.698036 320.442212 \n",  "27676 5610.479760 901.571138 16244.461598 8409.086721 3114.359914 \n",  "27677 10046.157903 2600.159563 22634.887950 10567.044406 2196.918342 \n",  "27678 6039.486294 10568.175092 20710.559999 12170.677235 20094.652790 \n",  "27679 739.605275 105.681751 528.261756 625.062058 724.556640  \n", "\n",  "mhcflurry 2_tau mhcflurry 3_auc  ... netmhc_f1 mhcflurry ensemble big dropout  \\\n", "allele "0 ... 412.970922 \n",  "1 ... 11546.349645 \n",  "2  ... 35.800397  \n", "HLA-A0201 0.622557 0.913962 "3  ... 0.884336 21.979447  \n", "HLA-A0301 0.602523 0.916512 "4  ... 0.900621 17.009966  \n", "HLA-A0201 0.622557 0.913962 "5  ... 0.884336 308.430443  \n", "HLA-A0301 0.602523 0.916512 "6  ... 0.900621 47.644859  \n", "HLA-A2601 0.433437 0.923544 "7  ... 0.541176 224.408829  \n", "HLA-B0801 0.616491 0.940561 "8  ... 0.776053 78.328625  \n", "HLA-B5101 0.382398 0.945669 "9  ... 0.428571 571.537601  \n", "HLA-B5701 0.545377 0.914248 "10  ... 0.741840 1775.178988  \n", "HLA-B0702 0.587247 0.898044 "11  ... 0.869383 1244.685345  \n", "HLA-A3101 0.503990 0.840628 "12  ... 0.833958 5127.121946  \n", "HLA-A1101 0.612013 0.925450 "13  ... 0.883402 1076.400647  \n", "HLA-A0101 0.521745 0.887468 "14  ... 0.619565 816.380140  \n", "HLA-A0206 0.517421 0.883500 "15  ... 0.872902 2343.502305  \n", "HLA-A6802 0.632660 0.959173 "16  ... 0.922636 361.394644  \n", "HLA-A3001 0.521544 0.893689 "17  ... 0.731959 643.230654  \n", "HLA-A0203 0.592812 0.970391 "18  ... 0.948626 1610.622824  \n", "HLA-B3901 0.303500 0.951948 "19  ... 0.750000 2660.599993  \n", "HLA-B1501 0.590098 0.929187 "20  ... 0.846512 72.271451  \n", "HLA-B1517 0.402892 0.901819 "21  ... 0.637931 1722.697842  \n", "HLA-A2402 0.585672 0.868598 "22  ... 0.632911 654.140178  \n", "H-2-DB 0.621788 0.889393 "23  ... 0.621212 1304.558299  \n", "H-2-KB 0.565230 0.908104 "24  ... 0.813675 41659.001894  \n", "HLA-B3501 0.519938 0.822469 "25  ... 0.712000 23595.557288  \n", "HLA-A6801 0.556709 0.930363 "26  ... 0.924791 226.180301  \n", "HLA-B0802 0.358488 0.966056 "27 ... 16861.700002 \n",  "28 ... 27514.021110 \n",  "29 ... 2064.422255 \n",  "... ...  ...0.190476  \n", "HLA-B1801 0.231177 0.768647 "27650  ... 0.358974 7604.842834  \n", "HLA-B5301 0.518640 0.851550 "27651  ... 0.733813 1237.816284  \n", "HLA-A3301 0.593279 0.917699 "27652  ... 0.868327 3603.880509  \n", "HLA-A6901 0.325785 0.942481 "27653  ... 0.698413 339.572329  \n", "HLA-B1509 0.330301 0.817802 "27654  ... 0.187500 12.676772  \n", "HLA-A3201 0.484062 0.900451 "27655  ... 0.772881 39.667229  \n", "HLA-B5801 0.587919 0.903463 "27656  ... 0.827411 504.133200  \n", "HLA-B2703 -0.027856 NaN "27657  ... 0.000000 11.445550  \n", "HLA-A3002 0.343583 0.738413 "27658  ... 0.663438 1791.157510  \n", "HLA-A2501 0.147030 0.971776 "27659  ... 0.666667 2027.917274  \n", "HLA-A2602 0.518496 0.920672 "27660  ... 0.766839 14.161928  \n", "HLA-B4402 0.544209 0.889503 "27661  ... 0.568807 90.514213  \n", "HLA-B4001 0.612248 0.922503 "27662  ... 0.829787 1579.490436  \n", "HLA-A2301 0.582937 0.871403 "27663  ... 0.773842 211.238553  \n", "Mamu-A02 0.485396 0.826068 "27664  ... 0.767123 11428.855078  \n", "HLA-A8001 0.180293 0.971198 "27665  ... 0.434783 5476.180934  \n", "HLA-B4403 0.462364 0.805648 "27666  ... 0.766304 444.361552  \n", "HLA-B4601 NaN NaN "27667  ... 0.000000 1021.498961  \n", "HLA-B3801 0.524527 0.725768 "27668  ... 0.000000 668.294198  \n", "HLA-B2705 0.438219 0.937447 "27669  ... 0.285714 73.996578  \n", "HLA-A2603 0.304849 0.834005 "27670  ... 0.542373 149.314011  \n", "Mamu-A01 0.527595 0.917658 "27671  ... 0.694915 34.810539  \n", "HLA-B0803 0.309651 0.407901 "27672  ... 0.000000 38.770058  \n", "H-2-KD 0.348129 0.754107 "27673  ... 0.657718 2470.088890  \n", "HLA-B1503 0.413124 0.802112 "27674  ... 0.592593 2925.805847  \n", "HLA-A0202 0.641312 0.913248 "27675  ... 0.755556 330.599717  \n", "HLA-A2902 0.621376 0.862027 "27676  ... 0.644068 2980.558001  \n", "HLA-B5401 0.311894 0.797297 "27677  ... 0.800000 1925.407082  \n", "HLA-B4002 0.493522 0.924603 "27678  ... 0.758621 18715.888697  \n", "HLA-B4501 0.238316 0.993333 "27679  ... 1.000000 618.533368  \n", "\n",  " netmhc_tau netmhcpan_auc netmhcpan_f1 netmhcpan_tau mhcflurry ensemble big dropout impute mhcflurry ensemble big impute  \\\n", "allele \n",  "HLA-A0201 0.635498 0.930479 0.880963 0.637338 \n",  "HLA-A0301 0.629236 0.927287 0.885106 0.611240 \n",  "HLA-A0201 0.635498 0.930479 0.880963 0.637338 \n",  "HLA-A0301 0.629236 0.927287 0.885106 0.611240 \n",  "HLA-A2601 0.436646 0.942279 0.640000 0.451666 \n",  "HLA-B0801 0.629519 0.942822 0.701671 0.606762 \n",  "HLA-B5101 0.365307 0.948695 0.610169 0.406973 \n",  "HLA-B5701 0.484975 0.883077 0.642623 0.460133 \n",  "HLA-B0702 0.606014 0.913527 0.855011 0.604720 \n",  "HLA-A3101 0.525026 0.859261 0.822335 0.528941 \n",  "HLA-A1101 0.632199 0.945065 0.887671 0.625794 \n",  "HLA-A0101 0.524866 0.894895 0.594286 0.498767 \n",  "HLA-A0206 0.543184 0.910796 0.866258 0.535067 \n",  "HLA-A6802 0.652332 0.964197 0.900293 0.653216 \n",  "HLA-A3001 0.456482 0.871974 0.746114 0.459857 \n",  "HLA-A0203 0.586911 0.974158 0.944578 0.591463 \n",  "HLA-B3901 0.305138 0.980065 0.744186 0.316739 \n",  "HLA-B1501 0.591735 0.935596 0.823245 0.589097 \n",  "HLA-B1517 0.422497 0.934516 0.710280 0.448575 \n",  "HLA-A2402 0.575710 0.892876 0.693069 0.600686 \n",  "H-2-DB 0.600337 0.874574 0.577236 0.574262 \n",  "H-2-KB 0.573199 0.825565 0.665354 0.486836 \n",  "HLA-B3501 0.515205 0.836281 0.711027 0.514413 \n",  "HLA-A6801 0.571403 0.948907 0.923944 0.599562 \n",  "HLA-B0802 0.393833 0.989590 0.571429 0.410579 \n",  "HLA-B1801 0.237118 0.789549 0.380952 0.234201 \n",  "HLA-B5301 0.515585 0.885722 0.753623 0.559543 \n",  "HLA-A3301 0.587112 0.931156 0.829175 0.612147 \n",  "HLA-A6901 0.335339 0.944257 0.680851 0.327432 \n",  "HLA-B1509 0.354311 0.922907 0.176471 0.448099 \n",  "HLA-A3201 0.448284 0.907161 0.766423 0.480669 \n",  "HLA-B5801 0.545132 0.882016 0.805195 0.531508 \n",  "HLA-B2703 0.053658 NaN 0.000000 0.067451 \n",  "HLA-A3002 0.342161 0.732749 0.611260 0.320577 \n",  "HLA-A2501 0.151836 0.998540 0.888889 0.153968 \n",  "HLA-A2602 0.525365 0.957811 0.839378 0.561093 \n",  "HLA-B4402 0.574916 0.934554 0.607143 0.598960 \n",  "HLA-B4001 0.635308 0.920678 0.845570 0.619418 \n",  "HLA-A2301 0.605598 0.895229 0.788406 0.636944 \n",  "Mamu-A02 0.598964 0.883087 0.748092 0.524622 \n",  "HLA-A8001 0.182374 0.980799 0.434783 0.186524 \n",  "HLA-B4403 0.541066 0.891047 0.775956 0.587824 \n",  "HLA-B4601 NaN NaN 0.000000 NaN \n",  "HLA-B3801 0.513269 0.980074 0.000000 0.652173 \n",  "HLA-B2705 0.430561 0.943860 0.400000 0.377208 \n",  "HLA-A2603 0.366317 0.934300 0.581818 0.426438 \n",  "Mamu-A01 0.569423 0.912755 0.706897 0.539013 \n",  "HLA-B0803 0.318249 0.952346 0.000000 0.315978 \n",  "H-2-KD 0.403275 0.819189 0.645570 0.390333 \n",  "HLA-B1503 0.468922 0.870064 0.588235 0.522577 \n",  "HLA-A0202 0.627143 0.898697 0.769231 0.624280 \n",  "HLA-A2902 0.619830 0.882377 0.633333 0.641257 \n",  "HLA-B5401 0.300252 0.845946 0.727273 0.349826 \n",  "HLA-B4002 0.456242 0.918651 0.909091 0.518720 \n",  "HLA-B4501 0.263574 0.993333 0.800000 0.246426 "0 412.076508 127.076246 \n",  "1 11523.365476 12119.332257 \n",  "2 36.332714 26.661012 \n",  "3 22.149854 5.514130 \n",  "4 17.210544 4.087731 \n",  "5 313.295340 283.004210 \n",  "6 46.924741 29.162618 \n",  "7 201.811546 474.297442 \n",  "8 76.676509 193.105629 \n",  "9 693.972088 1713.786138 \n",  "10 1884.171693 1789.612162 \n",  "11 1351.931885 1067.459441 \n",  "12 5209.625518 8636.336772 \n",  "13 1156.249328 1603.594406 \n",  "14 805.279634 141.506879 \n",  "15 2144.153240 2390.595616 \n",  "16 373.243072 83.824100 \n",  "17 660.133509 130.712552 \n",  "18 1769.522489 873.394417 \n",  "19 2573.852038 767.526952 \n",  "20 70.076491 11.864378 \n",  "21 1747.805124 2083.261161 \n",  "22 664.474823 1412.605620 \n",  "23 1229.593069 5570.914059 \n",  "24 41837.785429 48392.807367 \n",  "25 23748.451823 13479.431410 \n",  "26 242.127529 127.804211 \n",  "27 17069.597584 22898.529557 \n",  "28 27636.532147 31236.558902 \n",  "29 1886.517056 2135.568381 \n",  "... ... ... \n",  "27650 7479.282282 6258.296379 \n",  "27651 1182.498170 1172.873419 \n",  "27652 3030.659833 5563.513654 \n",  "27653 301.199532 601.529341 \n",  "27654 12.334242 7.512322 \n",  "27655 38.287952 24.337711 \n",  "27656 457.406648 487.206850 \n",  "27657 11.495052 4.775820 \n",  "27658 1546.291904 2058.095390 \n",  "27659 1893.370590 2396.076901 \n",  "27660 14.629042 6.439483 \n",  "27661 82.453838 82.987997 \n",  "27662 1417.089815 1162.903485 \n",  "27663 201.105289 108.536631 \n",  "27664 11689.661532 23630.026791 \n",  "27665 5615.000643 8909.938464 \n",  "27666 481.566753 4389.750924 \n",  "27667 879.863849 2018.189764 \n",  "27668 576.000262 1797.452166 \n",  "27669 73.643951 70.680062 \n",  "27670 162.079432 2732.703556 \n",  "27671 32.082260 151.035319 \n",  "27672 34.945554 113.338951 \n",  "27673 2189.148776 5592.837838 \n",  "27674 2672.593921 3516.571151 \n",  "27675 325.728139 81.573509 \n",  "27676 3312.065429 17560.618251 \n",  "27677 2131.598717 21847.772691 \n",  "27678 18569.871473 16359.253806 \n",  "27679 634.952392 609.348300  \n", "\n",  " smmpmbec_cpp_auc smmpmbec_cpp_f1 smmpmbec_cpp_tau test_size mhcflurry ensemble small mhcflurry ensemble small dropout  \\\n", "allele \n",  "HLA-A0201 0.927358 0.885121 0.626224 2126 \n",  "HLA-A0301 0.933966 0.897275 0.610891 811 \n",  "HLA-A0201 0.927358 0.885121 0.626224 2126 \n",  "HLA-A0301 0.933966 0.897275 0.610891 811 \n",  "HLA-A2601 0.927339 0.603053 0.422900 1333 \n",  "HLA-B0801 0.940555 0.760000 0.618953 940 \n",  "HLA-B5101 0.927621 0.395604 0.344534 854 \n",  "HLA-B5701 0.929923 0.709091 0.569615 815 \n",  "HLA-B0702 0.897928 0.857719 0.563960 813 \n",  "HLA-A3101 0.851270 0.837037 0.502586 724 \n",  "HLA-A1101 0.944205 0.882514 0.618388 723 \n",  "HLA-A0101 0.832665 0.437811 0.428064 696 \n",  "HLA-A0206 0.904317 0.878282 0.527571 682 \n",  "HLA-A6802 0.965793 0.928775 0.629530 669 \n",  "HLA-A3001 0.869935 0.692875 0.505244 660 \n",  "HLA-A0203 0.972885 0.946746 0.583908 651 \n",  "HLA-B3901 0.949708 0.708333 0.296639 641 \n",  "HLA-B1501 0.936063 0.819048 0.590100 633 \n",  "HLA-B1517 0.899620 0.652542 0.406582 582 \n",  "HLA-A2402 0.848915 0.633416 0.537589 573 \n",  "H-2-DB 0.884187 0.628571 0.571252 564 \n",  "H-2-KB 0.915994 0.859967 0.589218 558 \n",  "HLA-B3501 0.823734 0.705411 0.501630 542 \n",  "HLA-A6801 0.944553 0.924347 0.556418 527 \n",  "HLA-B0802 0.987214 0.105263 0.385838 509 \n",  "HLA-B1801 0.787782 0.315789 0.215534 503 \n",  "HLA-B5301 0.821328 0.734177 0.495308 485 \n",  "HLA-A3301 0.907414 0.855098 0.572158 473 \n",  "HLA-A6901 0.954868 0.689655 0.322498 470 \n",  "HLA-B1509 0.894618 0.187500 0.364673 466 \n",  "HLA-A3201 0.832013 0.580796 0.493693 449 \n",  "HLA-B5801 0.905645 0.817757 0.582026 445 \n",  "HLA-B2703 NaN 0.000000 NaN 441 \n",  "HLA-A3002 0.754271 0.704104 0.354956 420 \n",  "HLA-A2501 0.992701 0.727273 0.151997 416 \n",  "HLA-A2602 0.942981 0.790244 0.531805 413 \n",  "HLA-B4402 0.802018 0.570652 0.377900 411 \n",  "HLA-B4001 0.862331 0.674487 0.520725 407 \n",  "HLA-A2301 0.849381 0.745000 0.561259 391 \n",  "Mamu-A02 0.810692 0.640000 0.478589 388 \n",  "HLA-A8001 0.990015 0.518519 0.183987 379 \n",  "HLA-B4403 0.796454 0.754902 0.432021 378 \n",  "HLA-B4601 NaN 0.000000 NaN 378 \n",  "HLA-B3801 0.949206 0.000000 0.547438 351 \n",  "HLA-B2705 0.941682 0.304348 0.416884 314 \n",  "HLA-A2603 0.843194 0.509091 0.306741 312 \n",  "Mamu-A01 0.839390 0.609272 0.469975 274 \n",  "HLA-B0803 0.973333 0.000000 0.314266 234 \n",  "H-2-KD 0.753692 0.538462 0.365247 229 \n",  "HLA-B1503 0.839417 0.523364 0.444917 165 \n",  "HLA-A0202 0.882206 0.727273 0.606938 126 \n",  "HLA-A2902 0.871795 0.655172 0.612364 118 \n",  "HLA-B5401 0.839189 0.727273 0.333600 79 \n",  "HLA-B4002 0.934524 0.758621 0.455548 74 \n",  "HLA-B4501 1.000000 0.888889 0.251301 65 "0 354.917879 1032.431732 \n",  "1 10582.779265 15236.594111 \n",  "2 14.234040 198.349515 \n",  "3 9.571188 75.476672 \n",  "4 5.404075 66.898285 \n",  "5 138.379134 453.930512 \n",  "6 75.234690 201.404054 \n",  "7 661.731263 203.524213 \n",  "8 150.854140 187.610007 \n",  "9 1086.358455 752.720509 \n",  "10 1947.519632 2076.622509 \n",  "11 1329.481436 3414.402864 \n",  "12 7069.623536 5894.343484 \n",  "13 1313.022876 3179.342016 \n",  "14 150.417060 1461.872211 \n",  "15 2085.100907 2197.478976 \n",  "16 338.944863 520.383520 \n",  "17 409.386338 1192.928506 \n",  "18 1388.416277 2652.885992 \n",  "19 2439.748334 2815.823260 \n",  "20 26.414514 268.040984 \n",  "21 2101.585394 4997.269950 \n",  "22 564.254917 819.075211 \n",  "23 929.756200 3301.970499 \n",  "24 43698.473230 35656.657787 \n",  "25 14242.783105 21776.671841 \n",  "26 301.852190 477.313288 \n",  "27 17056.311336 18450.482638 \n",  "28 30641.466715 24382.979125 \n",  "29 939.673714 4363.985261 \n",  "... ... ... \n",  "27650 9231.021768 5156.232010 \n",  "27651 1764.436778 1111.672293 \n",  "27652 6258.738064 4524.941460 \n",  "27653 643.689547 251.163750 \n",  "27654 8.405853 27.709716 \n",  "27655 16.823708 58.138736 \n",  "27656 444.416136 735.295045 \n",  "27657 6.568378 32.964932 \n",  "27658 2512.567240 3027.341368 \n",  "27659 1967.137649 2491.696068 \n",  "27660 6.198800 50.448656 \n",  "27661 58.432447 276.768061 \n",  "27662 1666.694211 1347.540285 \n",  "27663 258.973559 260.492701 \n",  "27664 18143.405562 4168.082792 \n",  "27665 9591.843502 2761.863904 \n",  "27666 2042.311657 367.235345 \n",  "27667 2021.345029 1563.055045 \n",  "27668 1566.822564 1028.126890 \n",  "27669 57.014343 137.017124 \n",  "27670 1276.710804 74.709633 \n",  "27671 71.008408 66.404734 \n",  "27672 81.153866 68.889617 \n",  "27673 4632.347243 2486.083401 \n",  "27674 2870.279424 2542.821536 \n",  "27675 296.494841 424.188197 \n",  "27676 6405.555907 2085.838673 \n",  "27677 7014.522577 979.357726 \n",  "27678 17813.603418 13002.010500 \n",  "27679 868.508729 633.270834  \n", "\n",  " train_size mhcflurry ensemble small dropout impute \\\n",  "0 979.070265  \n", "allele "1 15530.316894  \n", "HLA-A0201 9565 "2 191.311593  \n", "HLA-A0301 6141 "3 73.397048  \n", "HLA-A0201 9565 "4 66.277773  \n", "HLA-A0301 6141 "5 463.507669  \n", "HLA-A2601 2894 "6 208.736308  \n", "HLA-B0801 2267 "7 224.200582  \n", "HLA-B5101 1734 "8 214.239343  \n", "HLA-B5701 1857 "9 709.941692  \n", "HLA-B0702 3412 "10 2226.792652  \n", "HLA-A3101 4796 "11 3545.255682  \n", "HLA-A1101 5399 "12 7160.380833  \n", "HLA-A0101 3725 "13 4114.009836  \n", "HLA-A0206 4827 "14 1395.238443  \n", "HLA-A6802 4768 "15 2406.306619  \n", "HLA-A3001 2040 "16 465.347789  \n", "HLA-A0203 5542 "17 1265.190937  \n", "HLA-B3901 886 "18 2526.015000  \n", "HLA-B1501 3213 "19 2720.410670  \n", "HLA-B1517 846 "20 283.389399  \n", "HLA-A2402 2533 "21 6096.220197  \n", "H-2-DB 3216 "22 894.703952  \n", "H-2-KB 3407 "23 3481.233105  \n", "HLA-B3501 2397 "24 35933.924362  \n", "HLA-A6801 3184 "25 22004.804730  \n", "HLA-B0802 487 "26 502.591357  \n", "HLA-B1801 2052 "27 18900.181919  \n", "HLA-B5301 1018 "28 24418.581154  \n", "HLA-A3301 3040 "29 4371.870300  \n", "HLA-A6901 2079 "... ...  \n", "HLA-B1509 346 "27650 5035.623414  \n", "HLA-A3201 640 "27651 1060.293750  \n", "HLA-B5801 2564 "27652 4375.453454  \n", "HLA-B2703 433 "27653 275.278758  \n", "HLA-A3002 1430 "27654 27.221991  \n", "HLA-A2501 519 "27655 64.107520  \n", "HLA-A2602 202 "27656 794.598133  \n", "HLA-B4402 1705 "27657 38.103514  \n", "HLA-B4001 2718 "27658 3013.792180  \n", "HLA-A2301 2021 "27659 2395.803209  \n", "Mamu-A02 938 "27660 48.079763  \n", "HLA-A8001 782 "27661 231.652412  \n", "HLA-B4403 913 "27662 1407.630327  \n", "HLA-B4601 1424 "27663 312.612832  \n", "HLA-B3801 136 "27664 4559.164386  \n", "HLA-B2705 3028 "27665 2998.184500  \n", "HLA-A2603 205 "27666 414.581205  \n", "Mamu-A01 2264 "27667 1463.156016  \n", "HLA-B0803 217 "27668 1020.437293  \n", "H-2-KD 452 "27669 132.439640  \n", "HLA-B1503 429 "27670 91.008365  \n", "HLA-A0202 3919 "27671 65.430784  \n", "HLA-A2902 2397 "27672 64.427006  \n", "HLA-B5401 1019 "27673 2571.450051  \n", "HLA-B4002 866 "27674 2543.506844  \n", "HLA-B4501 889 "27675 409.284111 \n",  "27676 2419.370891 \n",  "27677 1149.771514 \n",  "27678 13171.900795 \n",  "27679 563.941437 \n",  "\n",  " mhcflurry ensemble small impute mhcflurry ensemble all \\\n",  "0 316.292139 382.541823 \n",  "1 10563.990149 12481.240163 \n",  "2 36.190375 45.449943 \n",  "3 10.311149 17.935116 \n",  "4 6.168712 13.117819 \n",  "5 126.418515 252.636475 \n",  "6 69.728882 71.024356 \n",  "7 295.562535 298.738170 \n",  "8 191.850182 152.833062 \n",  "9 1346.778760 1012.509851 \n",  "10 1964.265895 2041.328348 \n",  "11 1204.086341 1590.990449 \n",  "12 5956.985743 6491.326974 \n",  "13 1362.964505 1746.619566 \n",  "14 137.238251 374.282265 \n",  "15 1636.737426 2047.788604 \n",  "16 339.779696 257.850466 \n",  "17 451.596165 489.354829 \n",  "18 2755.876104 1614.656891 \n",  "19 3073.347069 1929.976130 \n",  "20 21.261397 50.369477 \n",  "21 1804.117426 2692.207424 \n",  "22 714.377501 866.913344 \n",  "23 610.772902 1963.425858 \n",  "24 43211.020428 42130.179619 \n",  "25 13645.161028 18168.149169 \n",  "26 303.172547 258.410869 \n",  "27 18420.470692 19167.884275 \n",  "28 32544.871175 28800.714194 \n",  "29 972.296882 2049.140061 \n",  "... ... ... \n",  "27650 8607.096036 6928.865814 \n",  "27651 1876.531094 1329.076033 \n",  "27652 6060.178041 4805.978810 \n",  "27653 575.304332 411.355669 \n",  "27654 7.820612 11.864975 \n",  "27655 18.676103 31.696572 \n",  "27656 541.039409 562.468684 \n",  "27657 6.110409 10.637579 \n",  "27658 2392.621310 2254.038432 \n",  "27659 2137.104399 2248.162529 \n",  "27660 7.380668 13.226821 \n",  "27661 60.833303 101.778708 \n",  "27662 1675.027127 1430.474651 \n",  "27663 349.272026 217.862273 \n",  "27664 19072.190282 12198.052877 \n",  "27665 9070.424185 6112.359174 \n",  "27666 1608.665597 1099.957154 \n",  "27667 1681.715255 1534.072962 \n",  "27668 1285.797745 1118.560975 \n",  "27669 63.485729 79.380539 \n",  "27670 1025.821527 453.623055 \n",  "27671 55.309069 71.611468 \n",  "27672 62.164324 72.544193 \n",  "27673 4915.072495 3555.422310 \n",  "27674 3133.554358 2976.060607 \n",  "27675 378.668749 261.260451 \n",  "27676 9950.741910 5485.878564 \n",  "27677 11502.198577 4447.784250 \n",  "27678 21474.820337 16829.102901 \n",  "27679 887.179059 678.365819  \n", "\n",  "[55 " mhcflurry ensemble all impute mhcflurry ensemble all not impute \n",  "0 356.850347 410.082958 \n",  "1 12303.157490 12661.900504 \n",  "2 50.889386 40.591910 \n",  "3 17.436463 18.448030 \n",  "4 13.022964 13.213366 \n",  "5 268.474851 237.732466 \n",  "6 66.805124 75.510064 \n",  "7 282.208914 316.235562 \n",  "8 157.065094 148.715061 \n",  "9 1032.652955 992.759662 \n",  "10 1959.701221 2126.355477 \n",  "11 1575.443549 1606.690770 \n",  "12 6618.730369 6366.375957 \n",  "13 1795.659446 1698.918976 \n",  "14 384.336799 364.490764 \n",  "15 2119.693068 1978.323290 \n",  "16 265.206359 250.698599 \n",  "17 471.209294 508.199121 \n",  "18 1811.092066 1439.527524 \n",  "19 2015.954947 1847.664238 \n",  "20 47.309480 53.627395 \n",  "21 2515.593959 2881.220473 \n",  "22 880.089107 853.934834 \n",  "23 1953.552931 1973.348682 \n",  "24 42107.762939 42152.608233 \n",  "25 17607.624386 18746.517815 \n",  "26 262.043599 254.828500 \n",  "27 19206.551553 19129.294844 \n",  "28 28779.777262 28821.666357 \n",  "29 2034.277029 2064.111687 \n",  "... ... ... \n",  "27650 6711.297427 7153.487383 \n",  "27651 1288.867869 1370.538551 \n",  "27652 4598.314811 5023.021101 \n",  "27653 411.571566 411.139885 \n",  "27654 11.851187 11.878780 \n",  "27655 32.500068 30.912940 \n",  "27656 556.349977 568.654684 \n",  "27657 10.632822 10.642338 \n",  "27658 2188.699116 2321.328325 \n",  "27659 2195.347706 2302.247951 \n",  "27660 13.521697 12.938375 \n",  "27661 99.094853 104.535252 \n",  "27662 1403.986323 1457.462722 \n",  "27663 220.949289 214.818388 \n",  "27664 12449.101083 11952.067302 \n",  "27665 6073.340310 6151.628720 \n",  "27666 1089.664844 1110.346678 \n",  "27667 1445.789757 1627.746940 \n",  "27668 1079.592232 1158.936326 \n",  "27669 81.335853 77.472231 \n",  "27670 450.939613 456.322467 \n",  "27671 64.711354 79.247336 \n",  "27672 63.109548 83.389283 \n",  "27673 3526.987182 3584.086686 \n",  "27674 2941.918465 3010.598981 \n",  "27675 253.321583 269.448116 \n",  "27676 6117.150361 4919.752146 \n",  "27677 4981.684922 3971.103159 \n",  "27678 17121.333808 16541.859860 \n",  "27679 663.304608 693.769015 \n",  "\n",  "[27680  rows x 35 98  columns]" ]  },  "execution_count": 20, 12,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "df "# Extend with ensemble predictions\n",  "all_indices  = pandas.read_csv(\"../data/validation_scores.csv\", index_col=\"allele\")\n",  "df" sorted(set.union(*[set(indices) for (name, indices) in model_groups.iteritems()]))\n",  "all_indices_impute = sorted(\n",  " set.union(*[set(indices) for (name, indices) in model_groups.iteritems() if 'impute' in name]))\n",  "all_indices_not_impute = sorted(\n",  " set.union(*[set(indices) for (name, indices) in model_groups.iteritems() if 'impute' not in name]))\n",  "\n",  "for (name, indices) in list(model_groups.iteritems()) + [(\"all\", all_indices), (\"all impute\", all_indices_impute), (\"all not impute\", all_indices_not_impute)]:\n",  " validation_df_with_mhcflurry_results[\"mhcflurry ensemble %s\" % name] = \\\n",  " scipy.stats.mstats.gmean(\n",  " validation_df_with_mhcflurry_results[[\"mhcflurry %d\" % i for i in indices]],\n",  " axis=1)\n",  "\n",  "validation_df_with_mhcflurry_results"  ]  },  {  "cell_type": "code",  "execution_count": 29, 20,  "metadata": {  "collapsed": false  }, 

" \n",  " \n",  " \n",  " allele\n",  " mhcflurry 0_auc\n",  " mhcflurry 0_f1\n",  " mhcflurry 0_tau\n",  " mhcflurry 1_auc\n", 10_auc\n",  " mhcflurry 1_f1\n", 10_f1\n",  " mhcflurry 1_tau\n", 10_tau\n",  " mhcflurry 2_auc\n", 11_auc\n",  " mhcflurry 2_f1\n", 11_f1\n",  " mhcflurry 2_tau\n",  " mhcflurry 3_auc\n", 11_tau\n",  " ...\n",  " netmhc_f1\n",  " netmhc_tau\n",  " netmhcpan_auc\n",  " netmhcpan_f1\n",  " netmhcpan_tau\n",  " smmpmbec_cpp_auc\n", 

" smmpmbec_cpp_tau\n",  " test_size\n",  " train_size\n",  " mhcflurry standard_tau\n",  " mhcflurry standard_f1\n",  " mhcflurry standard_auc\n",  " \n",  " \n",  " allele\n", 

" \n",  " \n",  " \n",  " \n"," \n",  " HLA-A0201\n",  " 0.899123\n",  " 0.837826\n",  " 0.554988\n",  " 0.926853\n",  " 0.870671\n",  " 0.623314\n",  " 0.925713\n",  " 0.881167\n",  " 0.622557\n",  " 0.913962\n",  " ...\n",  " 0.880963\n",  " 0.637338\n",  " 0.927358\n",  " 0.885121\n",  " 0.626224\n",  " 2126\n",  " 9565\n",  " 0.622718\n",  " 0.874891\n",  " 0.925388\n",  " \n",  " \n",  " HLA-A0301\n",  " 0.891561\n",  " 0.834236\n",  " 0.540025\n",  " 0.922007\n",  " 0.892147\n",  " 0.595890\n",  " 0.923343\n",  " 0.879402\n",  " 0.602523\n",  " 0.916512\n",  " ...\n",  " 0.885106\n",  " 0.611240\n",  " 0.933966\n",  " 0.897275\n",  " 0.610891\n",  " 811\n",  " 6141\n",  " 0.601211\n",  " 0.879144\n",  " 0.922855\n",  " \n",  " \n",  " HLA-A0201\n",  " 0.899123\n",  " 0.837826\n",  " 0.554988\n",  " 0.926853\n",  " 0.870671\n",  " 0.623314\n",  " 0.925713\n",  " 0.881167\n",  " 0.622557\n",  " 0.913962\n",  " ...\n",  " 0.880963\n",  " 0.637338\n",  " 0.927358\n",  " 0.885121\n",  " 0.626224\n",  " 2126\n",  " 9565\n",  " 0.622718\n",  " 0.874891\n",  " 0.925388\n",  " \n",  " \n",  " HLA-A0301\n",  " 0.891561\n",  " 0.834236\n",  " 0.540025\n",  " 0.922007\n",  " 0.892147\n",  " 0.595890\n",  " 0.923343\n",  " 0.879402\n",  " 0.602523\n",  " 0.916512\n",  " ...\n",  " 0.885106\n",  " 0.611240\n",  " 0.933966\n",  " 0.897275\n",  " 0.610891\n",  " 811\n",  " 6141\n",  " 0.601211\n",  " 0.879144\n",  " 0.922855\n",  " \n",  " \n",  " HLA-A2601\n",  " 0.928084\n",  " 0.580000\n",  " 0.432299\n",  " 0.929260\n",  " 0.593103\n",  " 0.440722\n",  " 0.931760\n",  " 0.574899\n",  " 0.433437\n",  " 0.923544\n",  " ...\n",  " 0.640000\n",  " 0.451666\n",  " 0.927339\n",  " 0.603053\n",  " 0.422900\n",  " 1333\n",  " 2894\n",  " 0.432822\n",  " 0.553719\n",  " 0.931268\n",  " \n",  " \n",  " HLA-B0801\n",  " 0.942694\n",  " 0.762931\n",  " 0.600817\n",  " 0.949517\n",  " 0.773504\n",  " 0.620342\n",  " 0.948274\n",  " 0.778523\n",  " 0.616491\n",  " 0.940561\n",  " ...\n",  " 0.701671\n",  " 0.606762\n",  " 0.940555\n",  " 0.760000\n",  " 0.618953\n",  " 940\n",  " 2267\n",  " 0.616177\n",  " 0.779736\n",  " 0.949331\n",  " \n",  " \n",  " HLA-B5101\n",  " 0.933050\n",  " 0.489796\n",  " 0.369192\n",  " 0.939082\n",  " 0.391304\n",  " 0.369359\n",  " 0.948141\n",  " 0.404762\n",  " 0.382398\n",  " 0.945669\n",  " ...\n",  " 0.610169\n",  " 0.406973\n",  " 0.927621\n",  " 0.395604\n",  " 0.344534\n",  " 854\n",  " 1734\n",  " 0.379767\n",  " 0.418605\n",  " 0.946123\n",  " \n",  " \n",  " HLA-B5701\n", overall\n",  " 0.914240\n", overall\n",  " 0.750000\n", 0.916791\n",  " 0.524933\n", 0.770198\n",  " 0.916777\n", 0.551841\n",  " 0.740299\n", 0.924137\n",  " 0.535227\n", 0.779420\n",  " 0.922818\n", 0.564822\n",  " 0.670886\n", 0.907951\n",  " 0.545377\n", 0.700910\n",  " 0.914248\n", 0.538382\n",  " ...\n",  " 0.642623\n", 0.800909\n",  " 0.460133\n", 0.582258\n",  " 0.929923\n", 0.932924\n",  " 0.709091\n", 0.793170\n",  " 0.569615\n", 0.579586\n",  " 815\n", 0.919208\n",  " 1857\n", 0.784295\n",  " 0.548574\n", 0.561996\n",  " 0.701863\n", 27680\n",  " 0.923588\n", NaN\n",  " \n",  " \n",  " HLA-B0702\n", H-2-DB\n",  " 0.904985\n", H-2-DB\n",  " 0.792711\n", 0.891129\n",  " 0.564505\n", 0.636704\n",  " 0.915801\n", 0.607055\n",  " 0.866525\n", 0.894199\n",  " 0.594497\n", 0.544643\n",  " 0.909308\n", 0.620387\n",  " 0.835526\n", 0.889827\n",  " 0.587247\n", 0.349727\n",  " 0.898044\n", 0.615268\n",  " ...\n",  " 0.855011\n", 0.621212\n",  " 0.604720\n", 0.600337\n",  " 0.897928\n", 0.874574\n",  " 0.857719\n", 0.577236\n",  " 0.563960\n", 0.574262\n",  " 813\n", 0.884187\n",  " 3412\n", 0.628571\n",  " 0.587399\n", 0.571252\n",  " 0.835165\n", 564\n",  " 0.909692\n", 3216\n",  " \n",  " \n",  " HLA-A3101\n", H-2-KB\n",  " 0.828510\n", H-2-KB\n",  " 0.782609\n", 0.887740\n",  " 0.460554\n", 0.795053\n",  " 0.854838\n", 0.551784\n",  " 0.822500\n", 0.910714\n",  " 0.510287\n", 0.821239\n",  " 0.847235\n", 0.569634\n",  " 0.817610\n", 0.903935\n",  " 0.503990\n", 0.760456\n",  " 0.840628\n", 0.561134\n",  " ...\n",  " 0.822335\n", 0.813675\n",  " 0.528941\n", 0.573199\n",  " 0.851270\n", 0.825565\n",  " 0.837037\n", 0.665354\n",  " 0.502586\n", 0.486836\n",  " 724\n", 0.915994\n",  " 4796\n", 0.859967\n",  " 0.505116\n", 0.589218\n",  " 0.816583\n", 558\n",  " 0.847396\n", 3407\n",  " \n",  " \n",  " HLA-A1101\n", H-2-KD\n",  " 0.920368\n", H-2-KD\n",  " 0.872077\n", 0.775344\n",  " 0.579906\n", 0.613139\n",  " 0.936520\n", 0.359457\n",  " 0.883152\n", 0.787208\n",  " 0.615351\n", 0.575758\n",  " 0.936927\n", 0.378337\n",  " 0.884298\n", 0.785797\n",  " 0.612013\n", 0.555556\n",  " 0.925450\n", 0.365622\n",  " ...\n",  " 0.887671\n", 0.657718\n",  " 0.625794\n", 0.403275\n",  " 0.944205\n", 0.819189\n",  " 0.882514\n", 0.645570\n",  " 0.618388\n", 0.390333\n",  " 723\n", 0.753692\n",  " 5399\n", 0.538462\n",  " 0.611919\n", 0.365247\n",  " 0.884298\n", 229\n",  " 0.937280\n", 452\n",  " \n",  " \n",  " HLA-A0101\n",  " 0.912746\n", HLA-A0101\n",  " 0.621762\n", 0.901156\n",  " 0.521720\n", 0.605405\n",  " 0.924911\n", 0.501124\n",  " 0.659794\n", 0.911578\n",  " 0.531596\n", 0.587571\n",  " 0.909260\n", 0.521736\n",  " 0.586207\n", 0.889515\n",  " 0.521745\n", 0.299213\n",  " 0.887468\n", 0.498039\n",  " ...\n",  " 0.619565\n",  " 0.524866\n",  " 0.894895\n",  " 0.594286\n",  " 0.498767\n",  " 0.832665\n", 

" 0.428064\n",  " 696\n",  " 3725\n",  " 0.519116\n",  " 0.560000\n",  " 0.908668\n",  " \n",  " \n",  " HLA-A0206\n",  " 0.876067\n",  " 0.849449\n",  " 0.465713\n",  " 0.909081\n",  " 0.872236\n",  " 0.528876\n",  " 0.900025\n",  " 0.868712\n",  " 0.517421\n",  " 0.883500\n",  " ...\n",  " 0.866258\n",  " 0.535067\n",  " 0.904317\n",  " 0.878282\n",  " 0.527571\n",  " 682\n",  " 4827\n",  " 0.519496\n",  " 0.880779\n",  " 0.898990\n",  " \n",  " \n",  " HLA-A6802\n", HLA-A0201\n",  " 0.954562\n", HLA-A0201\n",  " 0.870482\n", 0.901909\n",  " 0.602856\n", 0.845684\n",  " 0.968359\n", 0.573243\n",  " 0.900000\n", 0.925812\n",  " 0.640201\n", 0.871728\n",  " 0.968413\n", 0.623190\n",  " 0.889894\n", 0.913368\n",  " 0.632660\n", 0.861688\n",  " 0.959173\n", 0.599266\n",  " ...\n",  " 0.900293\n", 0.884336\n",  " 0.653216\n", 0.635498\n",  " 0.965793\n", 0.930479\n",  " 0.928775\n", 0.880963\n",  " 0.629530\n", 0.637338\n",  " 669\n", 0.927358\n",  " 4768\n", 0.885121\n",  " 0.634703\n", 0.626224\n",  " 0.885845\n", 2126\n",  " 0.968637\n", 9565\n",  " \n",  " \n",  " HLA-A3001\n", HLA-A0202\n",  " 0.888740\n", HLA-A0202\n",  " 0.730864\n", 0.832040\n",  " 0.502090\n", 0.717391\n",  " 0.881443\n", 0.498543\n",  " 0.737913\n", 0.905765\n",  " 0.499390\n", 0.791209\n",  " 0.889599\n", 0.646429\n",  " 0.745592\n", 0.912694\n",  " 0.521544\n", 0.787234\n",  " 0.893689\n", 0.656408\n",  " ...\n",  " 0.746114\n", 0.755556\n",  " 0.459857\n", 0.627143\n",  " 0.869935\n", 0.898697\n",  " 0.692875\n", 0.769231\n",  " 0.505244\n", 0.624280\n",  " 660\n", 0.882206\n",  " 2040\n", 0.727273\n",  " 0.520738\n", 0.606938\n",  " 0.749367\n", 126\n",  " 0.888110\n", 3919\n",  " \n",  " \n",  " HLA-A0203\n",  " 0.950892\n", HLA-A0203\n",  " 0.916566\n", 0.951758\n",  " 0.534315\n", 0.924731\n",  " 0.976453\n", 0.550961\n",  " 0.951364\n", 0.974648\n",  " 0.573478\n", 0.954869\n",  " 0.974324\n", 0.594523\n",  " 0.953737\n", 0.970475\n",  " 0.592812\n", 0.948503\n",  " 0.970391\n", 0.577628\n",  " ...\n",  " 0.948626\n",  " 0.586911\n",  " 0.974158\n",  " 0.944578\n",  " 0.591463\n",  " 0.972885\n", 

" 0.583908\n",  " 651\n",  " 5542\n",  " 0.595852\n",  " 0.957041\n",  " 0.974815\n",  " \n",  " \n",  " HLA-B3901\n", HLA-A0206\n",  " 0.953506\n", HLA-A0206\n",  " 0.705882\n", 0.862964\n",  " 0.297435\n", 0.831633\n",  " 0.951364\n", 0.443633\n",  " 0.734694\n", 0.899344\n",  " 0.295161\n", 0.875306\n",  " 0.960260\n", 0.518406\n",  " 0.723404\n", 0.883182\n",  " 0.303500\n", 0.868159\n",  " 0.951948\n", 0.496525\n",  " ...\n",  " 0.744186\n", 0.872902\n",  " 0.316739\n", 0.543184\n",  " 0.949708\n", 0.910796\n",  " 0.708333\n", 0.866258\n",  " 0.296639\n", 0.535067\n",  " 641\n", 0.904317\n",  " 886\n", 0.878282\n",  " 0.288446\n", 0.527571\n",  " 0.666667\n", 682\n",  " 0.943377\n", 4827\n",  " \n",  " \n",  " HLA-B1501\n", HLA-A0301\n",  " 0.914988\n", HLA-A0301\n",  " 0.793503\n", 0.891751\n",  " 0.569384\n", 0.841542\n",  " 0.933960\n", 0.530830\n",  " 0.831050\n", 0.922273\n",  " 0.585046\n", 0.865510\n",  " 0.937243\n", 0.601402\n",  " 0.829736\n", 0.918873\n",  " 0.590098\n", 0.728411\n",  " 0.929187\n", 0.582643\n",  " ...\n",  " 0.823245\n", 0.900621\n",  " 0.589097\n", 0.629236\n",  " 0.936063\n", 0.927287\n",  " 0.819048\n", 0.885106\n",  " 0.590100\n", 0.611240\n",  " 633\n", 0.933966\n",  " 3213\n", 0.897275\n",  " 0.590860\n", 0.610891\n",  " 0.830918\n", 811\n",  " 0.938188\n", 6141\n",  " \n",  " \n",  " HLA-B1517\n", HLA-A1101\n",  " 0.910482\n", HLA-A1101\n",  " 0.661088\n", 0.927653\n",  " 0.407311\n", 0.874471\n",  " 0.921477\n", 0.588756\n",  " 0.661157\n", 0.937180\n",  " 0.417164\n", 0.885517\n",  " 0.911692\n", 0.612339\n",  " 0.669604\n", 0.927661\n",  " 0.402892\n", 0.873950\n",  " 0.901819\n", 0.586194\n",  " ...\n",  " 0.710280\n", 0.883402\n",  " 0.448575\n", 0.632199\n",  " 0.899620\n", 0.945065\n",  " 0.652542\n", 0.887671\n",  " 0.406582\n", 0.625794\n",  " 582\n", 0.944205\n",  " 846\n", 0.882514\n",  " 0.410409\n", 0.618388\n",  " 0.639004\n", 723\n",  " 0.909998\n", 5399\n",  " \n",  " \n",  " HLA-A2301\n",  " HLA-A2301\n",  " 0.834979\n",  " 0.729345\n",  " 0.529725\n",  " 0.872916\n",  " 0.731118\n",  " 0.593738\n",  " 0.861315\n",  " 0.634483\n",  " 0.570282\n",  " ...\n",  " 0.773842\n",  " 0.605598\n",  " 0.895229\n",  " 0.788406\n",  " 0.636944\n",  " 0.849381\n",  " 0.745000\n",  " 0.561259\n",  " 391\n",  " 2021\n",  " \n",  " \n",  " HLA-A2402\n",  " 0.851004\n", HLA-A2402\n",  " 0.653659\n", 0.856434\n",  " 0.535714\n", 0.669834\n",  " 0.853637\n", 0.555656\n",  " 0.649165\n", 0.867408\n",  " 0.551522\n", 0.579946\n",  " 0.870712\n", 0.578389\n",  " 0.585366\n", 0.876370\n",  " 0.585672\n", 0.356164\n",  " 0.868598\n", 0.586201\n",  " ...\n",  " 0.632911\n",  " 0.575710\n",  " 0.892876\n",  " 0.693069\n",  " 0.600686\n",  " 0.848915\n", 

" 0.537589\n",  " 573\n",  " 2533\n",  " 0.578611\n",  " 0.583784\n",  " 0.865991\n",  " \n",  " \n",  " H-2-DB\n", HLA-A2501\n",  " 0.887624\n", HLA-A2501\n",  " 0.611321\n", 0.992701\n",  " 0.598370\n", 0.571429\n",  " 0.907299\n", 0.151524\n",  " 0.995134\n",  " 0.727273\n",  " 0.152722\n",  " 0.998054\n",  " 0.750000\n",  " 0.153471\n",  " ...\n",  " 0.666667\n",  " 0.631110\n", 0.151836\n",  " 0.894433\n", 0.998540\n",  " 0.564103\n", 0.888889\n",  " 0.621788\n", 0.153968\n",  " 0.889393\n", 0.992701\n",  " 0.727273\n",  " 0.151997\n",  " 416\n",  " 519\n",  " \n",  " \n",  " HLA-A2601\n",  " HLA-A2601\n",  " 0.931620\n",  " 0.614334\n",  " 0.431520\n",  " 0.933148\n",  " 0.566667\n",  " 0.435573\n",  " 0.927566\n",  " 0.317073\n",  " 0.428294\n",  " ...\n",  " 0.577236\n", 0.541176\n",  " 0.574262\n", 0.436646\n",  " 0.884187\n", 0.942279\n",  " 0.628571\n", 0.640000\n",  " 0.571252\n", 0.451666\n",  " 564\n", 0.927339\n",  " 3216\n", 0.603053\n",  " 0.618274\n", 0.422900\n",  " 0.563877\n", 1333\n",  " 0.892264\n", 2894\n",  " \n",  " \n",  " H-2-KB\n", HLA-A2602\n",  " 0.866649\n", HLA-A2602\n",  " 0.794613\n", 0.895741\n",  " 0.527096\n", 0.674286\n",  " 0.900377\n", 0.463429\n",  " 0.797853\n", 0.929743\n",  " 0.570317\n", 0.765714\n",  " 0.910039\n", 0.509348\n",  " 0.812165\n", 0.885672\n",  " 0.565230\n", 0.710059\n",  " 0.908104\n", 0.443344\n",  " ...\n",  " 0.665354\n", 0.766839\n",  " 0.486836\n", 0.525365\n",  " 0.915994\n", 0.957811\n",  " 0.859967\n", 0.839378\n",  " 0.589218\n", 0.561093\n",  " 558\n", 0.942981\n",  " 3407\n", 0.790244\n",  " 0.570651\n", 0.531805\n",  " 0.812165\n", 413\n",  " 0.911974\n", 202\n",  " \n",  " \n",  " HLA-B3501\n", HLA-A2603\n",  " 0.828050\n", HLA-A2603\n",  " 0.737903\n", 0.869189\n",  " 0.500896\n", 0.557377\n",  " 0.831002\n", 0.326277\n",  " 0.722656\n", 0.914398\n",  " 0.524182\n", 0.408163\n",  " 0.829343\n", 0.377292\n",  " 0.722110\n", 0.852580\n",  " 0.519938\n", 0.272727\n",  " 0.822469\n", 0.306978\n",  " ...\n",  " 0.711027\n", 0.542373\n",  " 0.514413\n", 0.366317\n",  " 0.823734\n", 0.934300\n",  " 0.705411\n", 0.581818\n",  " 0.501630\n", 0.426438\n",  " 542\n", 0.843194\n",  " 0.509091\n",  " 0.306741\n",  " 312\n",  " 205\n",  " \n",  " \n",  " HLA-A2902\n",  " HLA-A2902\n",  " 0.895401\n",  " 0.622951\n",  " 0.648086\n",  " 0.877493\n",  " 0.644068\n",  " 0.630893\n",  " 0.857957\n",  " 0.629630\n",  " 0.594667\n",  " ...\n",  " 0.644068\n",  " 0.619830\n",  " 0.882377\n",  " 0.633333\n",  " 0.641257\n",  " 0.871795\n",  " 0.655172\n",  " 0.612364\n",  " 118\n",  " 2397\n",  " 0.517529\n",  " 0.714286\n",  " 0.828331\n",  " \n",  " \n",  " HLA-A6801\n", HLA-A3001\n",  " 0.926693\n", HLA-A3001\n",  " 0.904494\n", 0.881763\n",  " 0.519608\n", 0.734491\n",  " 0.945221\n", 0.483303\n",  " 0.919605\n", 0.887159\n",  " 0.571760\n", 0.748052\n",  " 0.941744\n", 0.512159\n",  " 0.905028\n", 0.891398\n",  " 0.556709\n", 0.747368\n",  " 0.930363\n", 0.514166\n",  " ...\n",  " 0.923944\n", 0.731959\n",  " 0.599562\n", 0.456482\n",  " 0.944553\n", 0.871974\n",  " 0.924347\n", 0.746114\n",  " 0.556418\n", 0.459857\n",  " 527\n", 0.869935\n",  " 3184\n", 0.692875\n",  " 0.553065\n", 0.505244\n",  " 0.905292\n", 660\n",  " 0.941373\n", 2040\n",  " \n",  " \n",  " HLA-B0802\n", HLA-A3002\n",  " 0.978728\n", HLA-A3002\n",  " 0.285714\n", 0.740724\n",  " 0.361894\n", 0.587537\n",  " 0.964924\n", 0.335931\n",  " 0.160000\n", 0.754918\n",  " 0.341633\n", 0.637076\n",  " 0.980878\n", 0.355555\n",  " 0.000000\n", 0.754802\n",  " 0.358488\n", 0.582133\n",  " 0.966056\n", 0.353739\n",  " ...\n",  " 0.571429\n", 0.663438\n",  " 0.410579\n", 0.342161\n",  " 0.987214\n", 0.732749\n",  " 0.105263\n", 0.611260\n",  " 0.385838\n", 0.320577\n",  " 509\n", 0.754271\n",  " 487\n", 0.704104\n",  " 0.364774\n", 0.354956\n",  " 0.000000\n", 420\n",  " 0.974089\n", 1430\n",  " \n",  " \n",  " HLA-B1801\n", HLA-A3101\n",  " 0.775263\n", HLA-A3101\n",  " 0.324324\n", 0.847970\n",  " 0.201325\n", 0.790637\n",  " 0.811504\n", 0.489596\n",  " 0.358974\n", 0.847081\n",  " 0.241803\n", 0.816583\n",  " 0.774436\n", 0.505649\n",  " 0.333333\n", 0.839532\n",  " 0.231177\n", 0.784876\n",  " 0.768647\n", 0.486671\n",  " ...\n",  " 0.380952\n", 0.833958\n",  " 0.234201\n", 0.525026\n",  " 0.787782\n", 0.859261\n",  " 0.315789\n", 0.822335\n",  " 0.215534\n", 0.528941\n",  " 503\n", 0.851270\n",  " 2052\n", 0.837037\n",  " 0.230967\n", 0.502586\n",  " 0.333333\n", 724\n",  " 0.775038\n", 4796\n",  " \n",  " \n",  " HLA-B5301\n", HLA-A3201\n",  " 0.836274\n", HLA-A3201\n",  " 0.716279\n", 0.903308\n",  " 0.511275\n", 0.747331\n",  " 0.849549\n", 0.504529\n",  " 0.740566\n", 0.898435\n",  " 0.528186\n", 0.772881\n",  " 0.834934\n", 0.466982\n",  " 0.712264\n", 0.894282\n",  " 0.518640\n", 0.749117\n",  " 0.851550\n", 0.438716\n",  " ...\n",  " 0.753623\n", 0.772881\n",  " 0.559543\n", 0.448284\n",  " 0.821328\n", 0.907161\n",  " 0.734177\n", 0.766423\n",  " 0.495308\n", 0.480669\n",  " 485\n", 0.832013\n",  " 1018\n", 0.580796\n",  " 0.529645\n", 0.493693\n",  " 0.713253\n", 449\n",  " 0.845182\n", 640\n",  " \n",  " \n",  " HLA-A3301\n",  " 0.912425\n", HLA-A3301\n",  " 0.822857\n", 0.915822\n",  " 0.579394\n", 0.812144\n",  " 0.924043\n", 0.585833\n",  " 0.863309\n", 0.926914\n",  " 0.600599\n", 0.803922\n",  " 0.922635\n", 0.593872\n",  " 0.850277\n", 0.919876\n",  " 0.593279\n", 0.388889\n",  " 0.917699\n", 0.573477\n",  " ...\n",  " 0.868327\n",  " 0.587112\n",  " 0.931156\n",  " 0.829175\n",  " 0.612147\n",  " 0.907414\n", 

" 0.572158\n",  " 473\n",  " 3040\n",  " 0.593153\n", \n",  " 0.837989\n", \n",  " 0.923011\n", HLA-A6801\n",  " HLA-A6801\n",  " 0.933051\n",  " 0.918688\n",  " 0.518524\n",  " 0.944722\n",  " 0.910364\n",  " 0.562203\n",  " 0.935997\n",  " 0.893431\n",  " 0.539995\n",  " ...\n",  " 0.924791\n",  " 0.571403\n",  " 0.948907\n",  " 0.923944\n",  " 0.599562\n",  " 0.944553\n",  " 0.924347\n",  " 0.556418\n",  " 527\n",  " 3184\n",  " \n",  " \n",  " HLA-A6802\n",  " HLA-A6802\n",  " 0.955764\n",  " 0.857143\n",  " 0.590486\n",  " 0.968081\n",  " 0.886191\n",  " 0.635309\n",  " 0.959900\n",  " 0.708408\n",  " 0.603869\n",  " ...\n",  " 0.922636\n",  " 0.652332\n",  " 0.964197\n",  " 0.900293\n",  " 0.653216\n",  " 0.965793\n",  " 0.928775\n",  " 0.629530\n",  " 669\n",  " 4768\n",  " \n",  " \n",  " HLA-A6901\n",  " 0.958853\n", HLA-A6901\n",  " 0.638889\n", 0.959546\n",  " 0.338189\n", 0.630137\n",  " 0.964830\n", 0.334796\n",  " 0.666667\n", 0.958593\n",  " 0.342789\n", 0.736842\n",  " 0.956947\n", 0.331893\n",  " 0.700000\n", 0.941355\n",  " 0.325785\n", 0.487805\n",  " 0.942481\n", 0.312966\n",  " ...\n",  " 0.698413\n",  " 0.335339\n",  " 0.944257\n",  " 0.680851\n",  " 0.327432\n",  " 0.954868\n", 

" 0.322498\n",  " 470\n",  " 2079\n",  " 0.322656\n",  " 0.721311\n",  " 0.953569\n",  " \n",  " \n",  " HLA-B1509\n", HLA-A8001\n",  " 0.852442\n", HLA-A8001\n",  " 0.487805\n", 0.950077\n",  " 0.298869\n", 0.307692\n",  " 0.871854\n", 0.171367\n",  " 0.315789\n", 0.986559\n",  " 0.331161\n", 0.545455\n",  " 0.880691\n", 0.185429\n",  " 0.129032\n", 0.985791\n",  " 0.330301\n", 0.470588\n",  " 0.817802\n", 0.189219\n",  " ...\n",  " 0.176471\n", 0.434783\n",  " 0.448099\n", 0.182374\n",  " 0.894618\n", 0.980799\n",  " 0.187500\n", 0.434783\n",  " 0.364673\n", 0.186524\n",  " 466\n", 0.990015\n",  " 346\n", 0.518519\n",  " 0.294024\n", 0.183987\n",  " 0.216216\n", 379\n",  " 0.861990\n", 782\n",  " \n",  " \n",  " HLA-A3201\n", HLA-B0702\n",  " 0.884704\n", HLA-B0702\n",  " 0.699690\n", 0.893816\n",  " 0.512869\n", 0.804494\n",  " 0.893682\n", 0.557662\n",  " 0.708861\n", 0.910484\n",  " 0.514653\n", 0.825749\n",  " 0.900643\n", 0.590398\n",  " 0.777778\n", 0.899076\n",  " 0.484062\n", 0.704689\n",  " 0.900451\n", 0.576627\n",  " ...\n",  " 0.766423\n", 0.869383\n",  " 0.480669\n", 0.606014\n",  " 0.832013\n", 0.913527\n",  " 0.580796\n", 0.855011\n",  " 0.493693\n", 0.604720\n",  " 449\n", 0.897928\n",  " 640\n", 0.857719\n",  " 0.540213\n", 0.563960\n",  " 0.756410\n", 813\n",  " 0.910653\n", 3412\n",  " \n",  " \n",  " HLA-B5801\n", HLA-B0801\n",  " 0.894775\n", HLA-B0801\n",  " 0.832512\n", 0.944786\n",  " 0.559392\n", 0.752834\n",  " 0.904312\n", 0.604698\n",  " 0.835821\n", 0.947216\n",  " 0.571688\n", 0.752252\n",  " 0.907261\n", 0.614472\n",  " 0.825641\n", 0.938434\n",  " 0.587919\n", 0.553672\n",  " 0.903463\n", 0.603882\n",  " ...\n",  " 0.805195\n", 0.776053\n",  " 0.531508\n", 0.629519\n",  " 0.905645\n", 0.942822\n",  " 0.817757\n", 0.701671\n",  " 0.582026\n", 0.606762\n",  " 445\n", 0.940555\n",  " 2564\n", 0.760000\n",  " 0.588062\n", 0.618953\n",  " 0.827763\n", 940\n",  " 0.907100\n", 2267\n",  " \n",  " \n",  " HLA-B2703\n", HLA-B0802\n",  " NaN\n", HLA-B0802\n",  " 0.000000\n", 0.969450\n",  " 0.018979\n", 0.200000\n",  " NaN\n", 0.371902\n",  " 0.000000\n",  " 0.060609\n",  " NaN\n",  " 0.000000\n",  " -0.027856\n",  " NaN\n",  " ...\n",  " 0.000000\n",  " 0.067451\n",  " NaN\n",  " 0.000000\n",  " NaN\n",  " 441\n",  " 433\n",  " 0.029998\n", 0.978389\n",  " 0.000000\n",  " NaN\n", 0.368566\n",  " \n", 0.966735\n",  " \n", 0.000000\n",  " HLA-A3002\n",  " 0.711574\n",  " 0.619512\n",  " 0.315227\n",  " 0.728981\n",  " 0.622785\n",  " 0.334000\n",  " 0.742042\n",  " 0.645161\n",  " 0.343583\n",  " 0.738413\n",  " ...\n",  " 0.611260\n",  " 0.320577\n",  " 0.754271\n",  " 0.704104\n",  " 0.354956\n",  " 420\n",  " 1430\n",  " 0.343652\n",  " 0.631313\n",  " 0.740308\n",  " \n",  " \n",  " HLA-A2501\n",  " 0.975669\n",  " 0.363636\n",  " 0.146430\n",  " 0.972749\n",  " 0.380952\n",  " 0.145681\n",  " 0.977129\n",  " 0.600000\n",  " 0.147030\n",  " 0.971776\n",  " ...\n",  " 0.888889\n",  " 0.153968\n",  " 0.992701\n",  " 0.727273\n",  " 0.151997\n",  " 416\n",  " 519\n",  " 0.151224\n",  " 0.500000\n",  " 0.991241\n",  " \n",  " \n",  " HLA-A2602\n",  " 0.902721\n",  " 0.713615\n",  " 0.469627\n",  " 0.926269\n",  " 0.746411\n",  " 0.493376\n",  " 0.930901\n",  " 0.786070\n",  " 0.518496\n",  " 0.920672\n", 0.353712\n",  " ...\n",  " 0.839378\n", 0.190476\n",  " 0.561093\n", 0.393833\n",  " 0.942981\n", 0.989590\n",  " 0.790244\n", 0.571429\n",  " 0.531805\n", 0.410579\n",  " 413\n", 0.987214\n",  " 202\n", 0.105263\n",  " 0.479073\n", 0.385838\n",  " 0.756219\n", 509\n",  " 0.913016\n", 487\n",  " \n",  " \n",  " HLA-B4402\n", HLA-B0803\n",  " 0.869757\n", HLA-B0803\n",  " 0.682292\n", 0.974321\n",  " 0.506405\n", 0.200000\n",  " 0.868196\n", 0.308791\n",  " 0.601156\n", 0.938272\n",  " 0.513061\n", 0.200000\n",  " 0.887197\n", 0.284053\n",  " 0.517572\n", 0.660247\n",  " 0.544209\n", 0.000000\n",  " 0.889503\n", 0.147246\n",  " ...\n",  " 0.607143\n", 0.000000\n",  " 0.598960\n", 0.318249\n",  " 0.802018\n", 0.952346\n",  " 0.570652\n", 0.000000\n",  " 0.377900\n", 0.315978\n",  " 411\n", 0.973333\n",  " 1705\n", 0.000000\n",  " 0.548878\n", 0.314266\n",  " 0.488599\n", 234\n",  " 0.887989\n", 217\n",  " \n",  " \n",  " HLA-B4001\n", HLA-B1501\n",  " 0.895389\n", HLA-B1501\n",  " 0.735043\n", 0.898576\n",  " 0.580586\n", 0.770335\n",  " 0.906650\n", 0.548021\n",  " 0.723032\n", 0.936809\n",  " 0.602434\n", 0.817518\n",  " 0.912764\n", 0.589179\n",  " 0.680982\n", 0.930032\n",  " 0.612248\n", 0.715909\n",  " 0.922503\n", 0.579299\n",  " ...\n",  " 0.845570\n", 0.846512\n",  " 0.619418\n", 0.591735\n",  " 0.862331\n", 0.935596\n",  " 0.674487\n", 0.823245\n",  " 0.520725\n", 0.589097\n",  " 407\n", 0.936063\n",  " 2718\n", 0.819048\n",  " 0.613517\n", 0.590100\n",  " 0.654088\n", 633\n",  " 0.913586\n", 3213\n",  " \n",  " \n",  " HLA-A2301\n", HLA-B1503\n",  " 0.840581\n", HLA-B1503\n",  " 0.710602\n", 0.844812\n",  " 0.556410\n", 0.676923\n",  " 0.873845\n", 0.479128\n",  " 0.773481\n", 0.836547\n",  " 0.596226\n", 0.655738\n",  " 0.870580\n", 0.495029\n",  " 0.743363\n", 0.793159\n",  " 0.582937\n", 0.539683\n",  " 0.871403\n", 0.446426\n",  " ...\n",  " 0.788406\n", 0.592593\n",  " 0.636944\n", 0.468922\n",  " 0.849381\n", 0.870064\n",  " 0.745000\n", 0.588235\n",  " 0.561259\n", 0.522577\n",  " 391\n", 0.839417\n",  " 2021\n", 0.523364\n",  " 0.592758\n", 0.444917\n",  " 0.746356\n", 165\n",  " 0.874270\n", 429\n",  " \n",  " \n",  " Mamu-A02\n", HLA-B1509\n",  " 0.876989\n", HLA-B1509\n",  " 0.682216\n", 0.854809\n",  " 0.504329\n", 0.307692\n",  " 0.870053\n", 0.302344\n",  " 0.668555\n", 0.876667\n",  " 0.507614\n", 0.066667\n",  " 0.853992\n", 0.350511\n",  " 0.666667\n", 0.815829\n",  " 0.485396\n", 0.000000\n",  " 0.826068\n", 0.285066\n",  " ...\n",  " 0.748092\n", 0.187500\n",  " 0.524622\n", 0.354311\n",  " 0.810692\n", 0.922907\n",  " 0.640000\n", 0.176471\n",  " 0.478589\n", 0.448099\n",  " 388\n", 0.894618\n",  " 938\n", 0.187500\n",  " 0.502013\n", 0.364673\n",  " 0.657459\n", 466\n",  " 0.867954\n", 346\n",  " \n",  " \n",  " HLA-A8001\n", HLA-B1517\n",  " 0.966590\n", HLA-B1517\n",  " 0.344828\n", 0.917827\n",  " 0.175280\n", 0.666667\n",  " 0.988479\n", 0.414557\n",  " 0.560000\n", 0.915408\n",  " 0.194232\n", 0.700461\n",  " 0.985407\n", 0.416301\n",  " 0.461538\n", 0.907470\n",  " 0.180293\n", 0.713568\n",  " 0.971198\n", 0.389533\n",  " ...\n",  " 0.434783\n", 0.637931\n",  " 0.186524\n", 0.422497\n",  " 0.990015\n", 0.934516\n",  " 0.518519\n", 0.710280\n",  " 0.183987\n", 0.448575\n",  " 379\n", 0.899620\n",  " 782\n", 0.652542\n",  " 0.166354\n", 0.406582\n",  " 0.333333\n", 582\n",  " 0.966590\n", 846\n",  " \n",  " \n",  " HLA-B4403\n", HLA-B1801\n",  " 0.785885\n", HLA-B1801\n",  " 0.677333\n", 0.774286\n",  " 0.419995\n", 0.439024\n",  " 0.811937\n", 0.211662\n",  " 0.732824\n", 0.782030\n",  " 0.450560\n", 0.235294\n",  " 0.813593\n", 0.228810\n",  " 0.613982\n", 0.783308\n",  " 0.462364\n", 0.068966\n",  " 0.805648\n", 0.239988\n",  " ...\n",  " 0.775956\n", 0.358974\n",  " 0.587824\n", 0.237118\n",  " 0.796454\n", 0.789549\n",  " 0.754902\n", 0.380952\n",  " 0.432021\n", 0.234201\n",  " 378\n", 0.787782\n",  " 913\n", 0.315789\n",  " 0.431010\n", 0.215534\n",  " 0.719388\n", 503\n",  " 0.790096\n", 2052\n",  " \n",  " \n",  " HLA-B4601\n", HLA-B2703\n",  " HLA-B2703\n",  " NaN\n",  " 0.000000\n",  " NaN\n", 0.056018\n",  " NaN\n",  " 0.000000\n",  " NaN\n", 0.062446\n",  " NaN\n",  " 0.000000\n",  " NaN\n",  " NaN\n", -0.036427\n",  " ...\n",  " 0.000000\n",  " NaN\n", 0.053658\n",  " NaN\n",  " 0.000000\n",  " NaN\n",  " 378\n",  " 1424\n", 0.067451\n",  " NaN\n",  " 0.000000\n",  " NaN\n",  " 441\n",  " 433\n",  " \n",  " \n",  " HLA-B2705\n",  " HLA-B2705\n",  " 0.946038\n",  " 0.520000\n",  " 0.409150\n",  " 0.946642\n",  " 0.434783\n",  " 0.438604\n",  " 0.938778\n",  " 0.256410\n",  " 0.426224\n",  " ...\n",  " 0.285714\n",  " 0.430561\n",  " 0.943860\n",  " 0.400000\n",  " 0.377208\n",  " 0.941682\n",  " 0.304348\n",  " 0.416884\n",  " 314\n",  " 3028\n",  " \n",  " \n",  " HLA-B3501\n",  " HLA-B3501\n",  " 0.817746\n",  " 0.696538\n",  " 0.483306\n",  " 0.832408\n",  " 0.715177\n",  " 0.520130\n",  " 0.822722\n",  " 0.704805\n",  " 0.494024\n",  " ...\n",  " 0.712000\n",  " 0.515205\n",  " 0.836281\n",  " 0.711027\n",  " 0.514413\n",  " 0.823734\n",  " 0.705411\n",  " 0.501630\n",  " 542\n",  " 2397\n",  " \n",  " \n",  " HLA-B3801\n",  " 0.901216\n", HLA-B3801\n",  " 0.903951\n",  " 0.000000\n",  " 0.500359\n", 0.459762\n",  " 0.909119\n", 0.886795\n",  " 0.000000\n",  " 0.515732\n", 0.431934\n",  " 0.921952\n", 0.341844\n",  " 0.000000\n",  " 0.524527\n",  " 0.725768\n", -0.194121\n",  " ...\n",  " 0.000000\n",  " 0.513269\n",  " 0.980074\n",  " 0.000000\n",  " 0.652173\n",  " 0.949206\n",  " 0.000000\n",  " 0.547438\n",  " 351\n",  " 136\n",  " 0.523753\n",  " 0.000000\n",  " 0.935900\n",  " \n",  " \n",  " HLA-B2705\n", HLA-B3901\n",  " 0.945675\n", HLA-B3901\n",  " 0.571429\n", 0.956623\n",  " 0.416364\n", 0.720000\n",  " 0.944586\n", 0.298735\n",  " 0.509804\n", 0.961039\n",  " 0.424005\n", 0.765957\n",  " 0.948578\n", 0.305990\n",  " 0.489796\n", 0.948701\n",  " 0.438219\n", 0.650000\n",  " 0.937447\n", 0.300846\n",  " ...\n",  " 0.400000\n", 0.750000\n",  " 0.377208\n", 0.305138\n",  " 0.941682\n", 0.980065\n",  " 0.304348\n", 0.744186\n",  " 0.416884\n", 0.316739\n",  " 314\n", 0.949708\n",  " 3028\n", 0.708333\n",  " 0.438390\n", 0.296639\n",  " 0.520000\n", 641\n",  " 0.947973\n", 886\n",  " \n",  " \n",  " HLA-A2603\n", HLA-B4001\n",  " 0.860835\n", HLA-B4001\n",  " 0.529412\n", 0.908463\n",  " 0.320885\n", 0.750716\n",  " 0.863587\n", 0.596380\n",  " 0.537313\n", 0.914359\n",  " 0.315634\n", 0.745665\n",  " 0.862604\n", 0.616642\n",  " 0.518519\n", 0.918467\n",  " 0.304849\n", 0.379032\n",  " 0.834005\n", 0.617008\n",  " ...\n",  " 0.581818\n", 0.829787\n",  " 0.426438\n", 0.635308\n",  " 0.843194\n", 0.920678\n",  " 0.509091\n", 0.845570\n",  " 0.306741\n", 0.619418\n",  " 312\n", 0.862331\n",  " 205\n", 0.674487\n",  " 0.319324\n", 0.520725\n",  " 0.576271\n", 407\n",  " 0.877150\n", 2718\n",  " \n",  " \n",  " HLA-B4002\n",  " HLA-B4002\n",  " 0.921627\n",  " 0.750000\n",  " 0.525437\n",  " 0.935516\n",  " 0.714286\n",  " 0.512204\n",  " 0.934524\n",  " 0.363636\n",  " 0.469391\n",  " ...\n",  " 0.758621\n",  " 0.456242\n",  " 0.918651\n",  " 0.909091\n",  " 0.518720\n",  " 0.934524\n",  " 0.758621\n",  " 0.455548\n",  " 74\n",  " 866\n",  " \n",  " \n",  " HLA-B4402\n",  " HLA-B4402\n",  " 0.885611\n",  " 0.648199\n",  " 0.524912\n",  " 0.903627\n",  " 0.503226\n",  " 0.565924\n",  " 0.905261\n",  " 0.122449\n",  " 0.572317\n",  " ...\n",  " 0.568807\n",  " 0.574916\n",  " 0.934554\n",  " 0.607143\n",  " 0.598960\n",  " 0.802018\n",  " 0.570652\n",  " 0.377900\n",  " 411\n",  " 1705\n",  " \n",  " \n",  " Mamu-A01\n", HLA-B4403\n",  " 0.847141\n", HLA-B4403\n",  " 0.583333\n", 0.804104\n",  " 0.455049\n", 0.674352\n",  " 0.889177\n", 0.453800\n",  " 0.643836\n", 0.822127\n",  " 0.506096\n", 0.567657\n",  " 0.922777\n", 0.477520\n",  " 0.716418\n", 0.826030\n",  " 0.527595\n", 0.344000\n",  " 0.917658\n", 0.474618\n",  " ...\n",  " 0.706897\n", 0.766304\n",  " 0.539013\n", 0.541066\n",  " 0.839390\n", 0.891047\n",  " 0.609272\n", 0.775956\n",  " 0.469975\n", 0.587824\n",  " 274\n", 0.796454\n",  " 2264\n", 0.754902\n",  " 0.525326\n", 0.432021\n",  " 0.719424\n", 378\n",  " 0.920975\n", 913\n",  " \n",  " \n",  " HLA-B0803\n", HLA-B4501\n",  " 0.952593\n", HLA-B4501\n",  " 1.000000\n",  " 0.750000\n",  " 0.239350\n",  " 1.000000\n",  " 0.750000\n",  " 0.251757\n",  " 1.000000\n",  " 0.571429\n",  " 0.290012\n",  " ...\n",  " 1.000000\n",  " 0.263574\n",  " 0.993333\n",  " 0.800000\n",  " 0.246426\n",  " 1.000000\n",  " 0.888889\n",  " 0.251301\n",  " 65\n",  " 889\n",  " \n",  " \n",  " HLA-B4601\n",  " HLA-B4601\n",  " NaN\n",  " 0.000000\n",  " 0.302768\n", NaN\n",  " 0.886914\n", NaN\n",  " 0.000000\n",  " 0.273943\n", NaN\n",  " 0.957037\n", NaN\n",  " 0.000000\n",  " 0.309651\n",  " 0.407901\n", NaN\n",  " ...\n",  " 0.000000\n",  " 0.315978\n", NaN\n",  " 0.973333\n", NaN\n",  " 0.000000\n",  " 0.314266\n", NaN\n",  " 234\n",  " 217\n",  " 0.289431\n", NaN\n",  " 0.000000\n",  " 0.910123\n", NaN\n",  " \n", 378\n",  " \n",  " H-2-KD\n",  " 0.765223\n",  " 0.613333\n",  " 0.336723\n",  " 0.764808\n",  " 0.569444\n",  " 0.323700\n",  " 0.766882\n",  " 0.545455\n",  " 0.348129\n",  " 0.754107\n",  " ...\n",  " 0.645570\n",  " 0.390333\n",  " 0.753692\n",  " 0.538462\n",  " 0.365247\n",  " 229\n",  " 452\n",  " 0.321850\n",  " 0.594203\n",  " 0.750622\n",  " \n",  " \n",  " HLA-B1503\n",  " 0.788338\n",  " 0.477064\n",  " 0.361371\n",  " 0.820478\n",  " 0.476190\n",  " 0.377722\n",  " 0.839991\n",  " 0.537037\n",  " 0.413124\n",  " 0.802112\n",  " ...\n",  " 0.588235\n",  " 0.522577\n",  " 0.839417\n",  " 0.523364\n",  " 0.444917\n",  " 165\n",  " 429\n",  " 0.426175\n",  " 0.551020\n",  " 0.820937\n", 1424\n",  " \n",  " \n",  " HLA-A0202\n", HLA-B5101\n",  " 0.833980\n", HLA-B5101\n",  " 0.720000\n", 0.931112\n",  " 0.561484\n", 0.458716\n",  " 0.893293\n", 0.368507\n",  " 0.764045\n", 0.947013\n",  " 0.614703\n", 0.380952\n",  " 0.903271\n", 0.379882\n",  " 0.791209\n", 0.949703\n",  " 0.641312\n", 0.222222\n",  " 0.913248\n", 0.380791\n",  " ...\n",  " 0.769231\n", 0.428571\n",  " 0.624280\n", 0.365307\n",  " 0.882206\n", 0.948695\n",  " 0.727273\n", 0.610169\n",  " 0.606938\n", 0.406973\n",  " 126\n", 0.927621\n",  " 3919\n", 0.395604\n",  " 0.644894\n", 0.344534\n",  " 0.782609\n", 854\n",  " 0.903548\n", 1734\n",  " \n",  " \n",  " HLA-A2902\n", HLA-B5301\n",  " 0.890924\n", HLA-B5301\n",  " 0.700000\n", 0.850993\n",  " 0.620455\n", 0.752336\n",  " 0.884819\n", 0.526623\n",  " 0.666667\n", 0.848975\n",  " 0.649314\n", 0.715000\n",  " 0.873016\n", 0.537388\n",  " 0.644068\n", 0.857396\n",  " 0.621376\n", 0.653061\n",  " 0.862027\n", 0.545337\n",  " ...\n",  " 0.633333\n", 0.733813\n",  " 0.641257\n", 0.515585\n",  " 0.871795\n", 0.885722\n",  " 0.655172\n", 0.753623\n",  " 0.612364\n", 0.559543\n",  " 118\n", 0.821328\n",  " 2397\n", 0.734177\n",  " 0.625060\n", 0.495308\n",  " 0.644068\n", 485\n",  " 0.873830\n", 1018\n",  " \n",  " \n",  " HLA-B5401\n",  " 0.800000\n", HLA-B5401\n",  " 0.810811\n",  " 0.727273\n",  " 0.304572\n",  " 0.805405\n",  " 0.727273\n",  " 0.295787\n",  " 0.816216\n",  " 0.666667\n",  " 0.314822\n",  " 0.800000\n", 0.802703\n",  " 0.727273\n",  " 0.311894\n",  " 0.797297\n", 0.328001\n",  " ...\n",  " 0.800000\n",  " 0.300252\n",  " 0.845946\n",  " 0.727273\n",  " 0.349826\n",  " 0.839189\n", 

" 0.333600\n",  " 79\n",  " 1019\n",  " 0.303840\n",  " 0.727273\n",  " 0.797297\n",  " \n",  " \n",  " HLA-B4002\n", HLA-B5701\n",  " 0.916667\n", HLA-B5701\n",  " 0.764706\n", 0.910343\n",  " 0.494300\n", 0.738739\n",  " 0.908730\n", 0.515322\n",  " 0.689655\n", 0.923162\n",  " 0.481845\n", 0.666667\n",  " 0.934524\n", 0.545770\n",  " 0.758621\n", 0.911326\n",  " 0.493522\n", 0.535714\n",  " 0.924603\n", 0.525831\n",  " ...\n",  " 0.909091\n", 0.741840\n",  " 0.518720\n", 0.484975\n",  " 0.934524\n", 0.883077\n",  " 0.758621\n", 0.642623\n",  " 0.455548\n", 0.460133\n",  " 74\n", 0.929923\n",  " 866\n", 0.709091\n",  " 0.480289\n", 0.569615\n",  " 815\n",  " 1857\n",  " \n",  " \n",  " HLA-B5801\n",  " HLA-B5801\n",  " 0.897543\n",  " 0.824691\n",  " 0.556252\n",  " 0.906918\n",  " 0.818414\n",  " 0.584738\n",  " 0.904392\n",  " 0.767568\n",  " 0.584167\n",  " ...\n",  " 0.827411\n",  " 0.545132\n",  " 0.882016\n",  " 0.805195\n",  " 0.531508\n",  " 0.905645\n",  " 0.817757\n",  " 0.582026\n",  " 445\n",  " 2564\n",  " \n",  " \n",  " Mamu-A01\n",  " Mamu-A01\n",  " 0.872810\n",  " 0.626866\n",  " 0.474873\n",  " 0.925878\n",  " 0.748092\n",  " 0.534401\n",  " 0.920470\n",  " 0.709677\n",  " 0.902778\n", 0.517494\n",  " ...\n",  " 0.694915\n",  " 0.569423\n",  " 0.912755\n",  " 0.706897\n",  " 0.539013\n",  " 0.839390\n",  " 0.609272\n",  " 0.469975\n",  " 274\n",  " 2264\n",  " \n",  " \n",  " HLA-B4501\n", Mamu-A02\n",  " 0.996667\n", Mamu-A02\n",  " 0.750000\n", 0.911300\n",  " 0.230045\n", 0.736486\n",  " 1.000000\n", 0.547823\n",  " 0.750000\n", 0.899894\n",  " 0.247621\n", 0.711974\n",  " 0.996667\n", 0.551297\n",  " 0.571429\n", 0.881034\n",  " 0.238316\n", 0.692557\n",  " 0.993333\n", 0.532768\n",  " ...\n",  " 0.800000\n", 0.767123\n",  " 0.246426\n", 0.598964\n",  " 1.000000\n", 0.883087\n",  " 0.888889\n", 0.748092\n",  " 0.251301\n", 0.524622\n",  " 65\n", 0.810692\n",  " 889\n", 0.640000\n",  " 0.261062\n", 0.478589\n",  " 0.750000\n", 388\n",  " 0.996667\n", 938\n",  " \n",  " \n",  "\n",  "

55 "

54  rows × 38 285  columns

\n", ""
  ],  "text/plain": [  " allele  mhcflurry 0_auc mhcflurry 0_f1 mhcflurry 0_taumhcflurry 1_auc  \\\n", "allele \n", "HLA-A0201 0.899123 0.837826 0.554988 0.926853 "overall overall 0.916791 0.770198 0.551841  \n", "HLA-A0301 0.891561 0.834236 0.540025 0.922007 "H-2-DB H-2-DB 0.891129 0.636704 0.607055  \n", "HLA-A0201 0.899123 0.837826 0.554988 0.926853 "H-2-KB H-2-KB 0.887740 0.795053 0.551784  \n", "HLA-A0301 0.891561 0.834236 0.540025 0.922007 "H-2-KD H-2-KD 0.775344 0.613139 0.359457  \n", "HLA-A2601 0.928084 0.580000 0.432299 0.929260 "HLA-A0101 HLA-A0101 0.901156 0.605405 0.501124  \n", "HLA-B0801 0.942694 0.762931 0.600817 0.949517 "HLA-A0201 HLA-A0201 0.901909 0.845684 0.573243  \n", "HLA-B5101 0.933050 0.489796 0.369192 0.939082 "HLA-A0202 HLA-A0202 0.832040 0.717391 0.498543  \n", "HLA-B5701 0.914240 0.750000 0.524933 0.916777 "HLA-A0203 HLA-A0203 0.951758 0.924731 0.550961  \n", "HLA-B0702 0.904985 0.792711 0.564505 0.915801 "HLA-A0206 HLA-A0206 0.862964 0.831633 0.443633  \n", "HLA-A3101 0.828510 0.782609 0.460554 0.854838 "HLA-A0301 HLA-A0301 0.891751 0.841542 0.530830  \n", "HLA-A1101 0.920368 0.872077 0.579906 0.936520 HLA-A1101 0.927653 0.874471 0.588756  \n", "HLA-A0101 0.912746 0.621762 0.521720 0.924911 "HLA-A2301 HLA-A2301 0.834979 0.729345 0.529725  \n", "HLA-A0206 0.876067 0.849449 0.465713 0.909081 "HLA-A2402 HLA-A2402 0.856434 0.669834 0.555656  \n", "HLA-A6802 0.954562 0.870482 0.602856 0.968359 "HLA-A2501 HLA-A2501 0.992701 0.571429 0.151524  \n", "HLA-A3001 0.888740 0.730864 0.502090 0.881443 "HLA-A2601 HLA-A2601 0.931620 0.614334 0.431520  \n", "HLA-A0203 0.950892 0.916566 0.534315 0.976453 "HLA-A2602 HLA-A2602 0.895741 0.674286 0.463429  \n", "HLA-B3901 0.953506 0.705882 0.297435 0.951364 "HLA-A2603 HLA-A2603 0.869189 0.557377 0.326277  \n", "HLA-B1501 0.914988 0.793503 0.569384 0.933960 "HLA-A2902 HLA-A2902 0.895401 0.622951 0.648086  \n", "HLA-B1517 0.910482 0.661088 0.407311 0.921477 "HLA-A3001 HLA-A3001 0.881763 0.734491 0.483303  \n", "HLA-A2402 0.851004 0.653659 0.535714 0.853637 "HLA-A3002 HLA-A3002 0.740724 0.587537 0.335931  \n", "H-2-DB 0.887624 0.611321 0.598370 0.907299 "HLA-A3101 HLA-A3101 0.847970 0.790637 0.489596  \n", "H-2-KB 0.866649 0.794613 0.527096 0.900377 "HLA-A3201 HLA-A3201 0.903308 0.747331 0.504529  \n", "HLA-B3501 0.828050 0.737903 0.500896 0.831002 "HLA-A3301 HLA-A3301 0.915822 0.812144 0.585833  \n", "HLA-A6801 0.926693 0.904494 0.519608 0.945221 HLA-A6801 0.933051 0.918688 0.518524  \n", "HLA-B0802 0.978728 0.285714 0.361894 0.964924 "HLA-A6802 HLA-A6802 0.955764 0.857143 0.590486  \n", "HLA-B1801 0.775263 0.324324 0.201325 0.811504 "HLA-A6901 HLA-A6901 0.959546 0.630137 0.334796  \n", "HLA-B5301 0.836274 0.716279 0.511275 0.849549 "HLA-A8001 HLA-A8001 0.950077 0.307692 0.171367  \n", "HLA-A3301 0.912425 0.822857 0.579394 0.924043 "HLA-B0702 HLA-B0702 0.893816 0.804494 0.557662  \n", "HLA-A6901 0.958853 0.638889 0.338189 0.964830 "HLA-B0801 HLA-B0801 0.944786 0.752834 0.604698 \n",  "HLA-B0802 HLA-B0802 0.969450 0.200000 0.371902 \n",  "HLA-B0803 HLA-B0803 0.974321 0.200000 0.308791 \n",  "HLA-B1501 HLA-B1501 0.898576 0.770335 0.548021 \n",  "HLA-B1503 HLA-B1503 0.844812 0.676923 0.479128  \n", "HLA-B1509 0.852442 0.487805 0.298869 0.871854 HLA-B1509 0.854809 0.307692 0.302344  \n", "HLA-A3201 0.884704 0.699690 0.512869 0.893682 "HLA-B1517 HLA-B1517 0.917827 0.666667 0.414557  \n", "HLA-B5801 0.894775 0.832512 0.559392 0.904312 "HLA-B1801 HLA-B1801 0.774286 0.439024 0.211662  \n", "HLA-B2703 HLA-B2703  NaN 0.000000 0.018979 NaN 0.056018  \n", "HLA-A3002 0.711574 0.619512 0.315227 0.728981 "HLA-B2705 HLA-B2705 0.946038 0.520000 0.409150  \n", "HLA-A2501 0.975669 0.363636 0.146430 0.972749 "HLA-B3501 HLA-B3501 0.817746 0.696538 0.483306  \n", "HLA-A2602 0.902721 0.713615 0.469627 0.926269 "HLA-B3801 HLA-B3801 0.903951 0.000000 0.459762  \n", "HLA-B4402 0.869757 0.682292 0.506405 0.868196 "HLA-B3901 HLA-B3901 0.956623 0.720000 0.298735  \n", "HLA-B4001 0.895389 0.735043 0.580586 0.906650 \n",  "HLA-A2301 0.840581 0.710602 0.556410 0.873845 HLA-B4001 0.908463 0.750716 0.596380  \n", "Mamu-A02 0.876989 0.682216 0.504329 0.870053 "HLA-B4002 HLA-B4002 0.921627 0.750000 0.525437  \n", "HLA-A8001 0.966590 0.344828 0.175280 0.988479 "HLA-B4402 HLA-B4402 0.885611 0.648199 0.524912  \n", "HLA-B4403 0.785885 0.677333 0.419995 0.811937 HLA-B4403 0.804104 0.674352 0.453800 \n",  "HLA-B4501 HLA-B4501 1.000000 0.750000 0.239350  \n", "HLA-B4601 HLA-B4601  NaN 0.000000 NaNNaN  \n", "HLA-B3801 0.901216 0.000000 0.500359 0.909119 \n",  "HLA-B2705 0.945675 0.571429 0.416364 0.944586 \n",  "HLA-A2603 0.860835 0.529412 0.320885 0.863587 \n",  "Mamu-A01 0.847141 0.583333 0.455049 0.889177 \n",  "HLA-B0803 0.952593 0.000000 0.302768 0.886914 \n",  "H-2-KD 0.765223 0.613333 0.336723 0.764808 \n",  "HLA-B1503 0.788338 0.477064 0.361371 0.820478 \n",  "HLA-A0202 0.833980 0.720000 0.561484 0.893293 "HLA-B5101 HLA-B5101 0.931112 0.458716 0.368507  \n", "HLA-A2902 0.890924 0.700000 0.620455 0.884819 "HLA-B5301 HLA-B5301 0.850993 0.752336 0.526623  \n", "HLA-B5401 0.800000 HLA-B5401 0.810811  0.727273 0.295787 0.816216 0.304572  \n", "HLA-B4002 0.916667 0.764706 0.494300 0.908730 "HLA-B5701 HLA-B5701 0.910343 0.738739 0.515322  \n", "HLA-B4501 0.996667 0.750000 0.230045 1.000000 "HLA-B5801 HLA-B5801 0.897543 0.824691 0.556252 \n",  "Mamu-A01 Mamu-A01 0.872810 0.626866 0.474873 \n",  "Mamu-A02 Mamu-A02 0.911300 0.736486 0.547823  \n", "\n",  " mhcflurry 1_f1 10_auc  mhcflurry 1_tau 10_f1  mhcflurry 2_auc mhcflurry 2_f1 10_tau  \\\n", "allele \n", "HLA-A0201 0.870671 0.623314 0.925713 0.881167 "overall 0.924137 0.779420 0.564822  \n", "HLA-A0301 0.892147 0.595890 0.923343 0.879402 "H-2-DB 0.894199 0.544643 0.620387  \n", "HLA-A0201 0.870671 0.623314 0.925713 0.881167 "H-2-KB 0.910714 0.821239 0.569634  \n", "HLA-A0301 0.892147 0.595890 0.923343 0.879402 "H-2-KD 0.787208 0.575758 0.378337  \n", "HLA-A2601 0.593103 0.440722 0.931760 0.574899 "HLA-A0101 0.911578 0.587571 0.521736  \n", "HLA-B0801 0.773504 0.620342 0.948274 0.778523 "HLA-A0201 0.925812 0.871728 0.623190  \n", "HLA-B5101 0.391304 0.369359 0.948141 0.404762 "HLA-A0202 0.905765 0.791209 0.646429  \n", "HLA-B5701 0.740299 0.535227 0.922818 0.670886 "HLA-A0203 0.974648 0.954869 0.594523  \n", "HLA-B0702 0.866525 0.594497 0.909308 0.835526 "HLA-A0206 0.899344 0.875306 0.518406  \n", "HLA-A3101 0.822500 0.510287 0.847235 0.817610 "HLA-A0301 0.922273 0.865510 0.601402  \n", "HLA-A1101 0.883152 0.615351 0.936927 0.884298 0.937180 0.885517 0.612339  \n", "HLA-A0101 0.659794 0.531596 0.909260 0.586207 "HLA-A2301 0.872916 0.731118 0.593738  \n", "HLA-A0206 0.872236 0.528876 0.900025 0.868712 "HLA-A2402 0.867408 0.579946 0.578389  \n", "HLA-A6802 0.900000 0.640201 0.968413 0.889894 "HLA-A2501 0.995134 0.727273 0.152722  \n", "HLA-A3001 0.737913 0.499390 0.889599 0.745592 "HLA-A2601 0.933148 0.566667 0.435573  \n", "HLA-A0203 0.951364 0.573478 0.974324 0.953737 "HLA-A2602 0.929743 0.765714 0.509348  \n", "HLA-B3901 0.734694 0.295161 0.960260 0.723404 "HLA-A2603 0.914398 0.408163 0.377292  \n", "HLA-B1501 0.831050 0.585046 0.937243 0.829736 "HLA-A2902 0.877493 0.644068 0.630893  \n", "HLA-B1517 0.661157 0.417164 0.911692 0.669604 "HLA-A3001 0.887159 0.748052 0.512159  \n", "HLA-A2402 0.649165 0.551522 0.870712 0.585366 "HLA-A3002 0.754918 0.637076 0.355555  \n", "H-2-DB 0.666667 0.631110 0.894433 0.564103 "HLA-A3101 0.847081 0.816583 0.505649  \n", "H-2-KB 0.797853 0.570317 0.910039 0.812165 "HLA-A3201 0.898435 0.772881 0.466982  \n", "HLA-B3501 0.722656 0.524182 0.829343 0.722110 "HLA-A3301 0.926914 0.803922 0.593872  \n", "HLA-A6801 0.919605 0.571760 0.941744 0.905028 0.944722 0.910364 0.562203 \n",  "HLA-A6802 0.968081 0.886191 0.635309 \n",  "HLA-A6901 0.958593 0.736842 0.331893 \n",  "HLA-A8001 0.986559 0.545455 0.185429 \n",  "HLA-B0702 0.910484 0.825749 0.590398 \n",  "HLA-B0801 0.947216 0.752252 0.614472  \n", "HLA-B0802 0.160000 0.341633 0.980878 0.978389  0.000000 0.368566  \n", "HLA-B1801 0.358974 0.241803 0.774436 0.333333 \n",  "HLA-B5301 0.740566 0.528186 0.834934 0.712264 "HLA-B0803 0.938272 0.200000 0.284053  \n", "HLA-A3301 0.863309 0.600599 0.922635 0.850277 "HLA-B1501 0.936809 0.817518 0.589179  \n", "HLA-A6901 0.666667 0.342789 0.956947 0.700000 "HLA-B1503 0.836547 0.655738 0.495029  \n", "HLA-B1509 0.315789 0.331161 0.880691 0.129032 0.876667 0.066667 0.350511  \n", "HLA-A3201 0.708861 0.514653 0.900643 0.777778 "HLA-B1517 0.915408 0.700461 0.416301  \n", "HLA-B5801 0.835821 0.571688 0.907261 0.825641 "HLA-B1801 0.782030 0.235294 0.228810  \n", "HLA-B27030.000000 0.060609  NaN 0.000000 0.062446  \n", "HLA-A3002 0.622785 0.334000 0.742042 0.645161 "HLA-B2705 0.946642 0.434783 0.438604  \n", "HLA-A2501 0.380952 0.145681 0.977129 0.600000 "HLA-B3501 0.832408 0.715177 0.520130  \n", "HLA-A2602 0.746411 0.493376 0.930901 0.786070 "HLA-B3801 0.886795 0.000000 0.431934  \n", "HLA-B4402 0.601156 0.513061 0.887197 0.517572 "HLA-B3901 0.961039 0.765957 0.305990  \n", "HLA-B4001 0.723032 0.602434 0.912764 0.680982 \n",  "HLA-A2301 0.773481 0.596226 0.870580 0.743363 0.914359 0.745665 0.616642  \n", "Mamu-A02 0.668555 0.507614 0.853992 0.666667 "HLA-B4002 0.935516 0.714286 0.512204  \n", "HLA-A8001 0.560000 0.194232 0.985407 0.461538 "HLA-B4402 0.903627 0.503226 0.565924  \n", "HLA-B4403 0.732824 0.450560 0.813593 0.613982 0.822127 0.567657 0.477520 \n",  "HLA-B4501 1.000000 0.750000 0.251757  \n", "HLA-B46010.000000 NaN  NaN 0.000000 NaN  \n", "HLA-B3801 0.000000 0.515732 0.921952 0.000000 \n",  "HLA-B2705 0.509804 0.424005 0.948578 0.489796 \n",  "HLA-A2603 0.537313 0.315634 0.862604 0.518519 \n",  "Mamu-A01 0.643836 0.506096 0.922777 0.716418 \n",  "HLA-B0803 0.000000 0.273943 0.957037 0.000000 \n",  "H-2-KD 0.569444 0.323700 0.766882 0.545455 "HLA-B5101 0.947013 0.380952 0.379882  \n", "HLA-B1503 0.476190 0.377722 0.839991 0.537037 "HLA-B5301 0.848975 0.715000 0.537388  \n", "HLA-A0202 0.764045 0.614703 0.903271 0.791209 "HLA-B5401 0.805405 0.727273 0.314822  \n", "HLA-A2902 "HLA-B5701 0.923162  0.666667 0.649314 0.873016 0.644068 0.545770  \n", "HLA-B5401 0.666667 0.314822 0.800000 0.727273 "HLA-B5801 0.906918 0.818414 0.584738  \n", "HLA-B4002 0.689655 0.481845 0.934524 0.758621 "Mamu-A01 0.925878 0.748092 0.534401  \n", "HLA-B4501 0.750000 0.247621 0.996667 0.571429 "Mamu-A02 0.899894 0.711974 0.551297  \n", "\n",  " mhcflurry 2_tau 11_auc  mhcflurry 3_auc 11_f1 mhcflurry 11_tau  ... \\\n", "allele ... \n", "HLA-A0201 0.622557 0.913962 "overall 0.907951 0.700910 0.538382  ... \n", "HLA-A0301 0.602523 0.916512 "H-2-DB 0.889827 0.349727 0.615268  ... \n", "HLA-A0201 0.622557 0.913962 "H-2-KB 0.903935 0.760456 0.561134  ... \n", "HLA-A0301 0.602523 0.916512 "H-2-KD 0.785797 0.555556 0.365622  ... \n", "HLA-A2601 0.433437 0.923544 "HLA-A0101 0.889515 0.299213 0.498039  ... \n", "HLA-B0801 0.616491 0.940561 "HLA-A0201 0.913368 0.861688 0.599266  ... \n", "HLA-B5101 0.382398 0.945669 "HLA-A0202 0.912694 0.787234 0.656408  ... \n", "HLA-B5701 0.545377 0.914248 "HLA-A0203 0.970475 0.948503 0.577628  ... \n", "HLA-B0702 0.587247 0.898044 "HLA-A0206 0.883182 0.868159 0.496525  ... \n", "HLA-A3101 0.503990 0.840628 "HLA-A0301 0.918873 0.728411 0.582643  ... \n", "HLA-A1101 0.612013 0.925450 0.927661 0.873950 0.586194  ... \n", "HLA-A0101 0.521745 0.887468 "HLA-A2301 0.861315 0.634483 0.570282  ... \n", "HLA-A0206 0.517421 0.883500 "HLA-A2402 0.876370 0.356164 0.586201  ... \n", "HLA-A6802 0.632660 0.959173 "HLA-A2501 0.998054 0.750000 0.153471  ... \n", "HLA-A3001 0.521544 0.893689 "HLA-A2601 0.927566 0.317073 0.428294  ... \n", "HLA-A0203 0.592812 0.970391 "HLA-A2602 0.885672 0.710059 0.443344  ... \n", "HLA-B3901 0.303500 0.951948 "HLA-A2603 0.852580 0.272727 0.306978  ... \n", "HLA-B1501 0.590098 0.929187 "HLA-A2902 0.857957 0.629630 0.594667  ... \n", "HLA-B1517 0.402892 0.901819 "HLA-A3001 0.891398 0.747368 0.514166  ... \n", "HLA-A2402 0.585672 0.868598 "HLA-A3002 0.754802 0.582133 0.353739  ... \n", "H-2-DB 0.621788 0.889393 "HLA-A3101 0.839532 0.784876 0.486671  ... \n", "H-2-KB 0.565230 0.908104 "HLA-A3201 0.894282 0.749117 0.438716  ... \n", "HLA-B3501 0.519938 0.822469 "HLA-A3301 0.919876 0.388889 0.573477  ... \n", "HLA-A6801 0.556709 0.930363 ... \n",  "HLA-B0802 0.358488 0.966056 0.935997 0.893431 0.539995  ... \n", "HLA-B1801 0.231177 0.768647 "HLA-A6802 0.959900 0.708408 0.603869  ... \n", "HLA-B5301 0.518640 0.851550 "HLA-A6901 0.941355 0.487805 0.312966  ... \n", "HLA-A3301 0.593279 0.917699 "HLA-A8001 0.985791 0.470588 0.189219  ... \n", "HLA-A6901 0.325785 0.942481 "HLA-B0702 0.899076 0.704689 0.576627  ... \n", "HLA-B1509 0.330301 0.817802 "HLA-B0801 0.938434 0.553672 0.603882  ... \n", "HLA-A3201 0.484062 0.900451 "HLA-B0802 0.966735 0.000000 0.353712  ... \n", "HLA-B5801 0.587919 0.903463 "HLA-B0803 0.660247 0.000000 0.147246  ... \n", "HLA-B2703 -0.027856 NaN "HLA-B1501 0.930032 0.715909 0.579299  ... \n", "HLA-A3002 0.343583 0.738413 "HLA-B1503 0.793159 0.539683 0.446426  ... \n", "HLA-A2501 0.147030 0.971776 "HLA-B1509 0.815829 0.000000 0.285066  ... \n", "HLA-A2602 0.518496 0.920672 "HLA-B1517 0.907470 0.713568 0.389533  ... \n", "HLA-B4402 0.544209 0.889503 "HLA-B1801 0.783308 0.068966 0.239988  ... \n", "HLA-B4001 0.612248 0.922503 "HLA-B2703 NaN 0.000000 -0.036427  ... \n", "HLA-A2301 0.582937 0.871403 "HLA-B2705 0.938778 0.256410 0.426224  ... \n", "Mamu-A02 0.485396 0.826068 "HLA-B3501 0.822722 0.704805 0.494024  ... \n", "HLA-A8001 0.180293 0.971198 "HLA-B3801 0.341844 0.000000 -0.194121  ... \n", "HLA-B4403 0.462364 0.805648 "HLA-B3901 0.948701 0.650000 0.300846  ... \n", "HLA-B4601 NaN NaN "HLA-B4001 0.918467 0.379032 0.617008  ... \n", "HLA-B3801 0.524527 0.725768 "HLA-B4002 0.934524 0.363636 0.469391  ... \n", "HLA-B2705 0.438219 0.937447 "HLA-B4402 0.905261 0.122449 0.572317  ... \n", "HLA-A2603 0.304849 0.834005 "HLA-B4403 0.826030 0.344000 0.474618  ... \n", "Mamu-A01 0.527595 0.917658 "HLA-B4501 1.000000 0.571429 0.290012  ... \n", "HLA-B0803 0.309651 0.407901 "HLA-B4601 NaN 0.000000 NaN  ... \n", "H-2-KD 0.348129 0.754107 "HLA-B5101 0.949703 0.222222 0.380791  ... \n", "HLA-B1503 0.413124 0.802112 "HLA-B5301 0.857396 0.653061 0.545337  ... \n", "HLA-A0202 0.641312 0.913248 "HLA-B5401 0.802703 0.727273 0.328001  ... \n", "HLA-A2902 0.621376 0.862027 "HLA-B5701 0.911326 0.535714 0.525831  ... \n", "HLA-B5401 0.311894 0.797297 "HLA-B5801 0.904392 0.767568 0.584167  ... \n", "HLA-B4002 0.493522 0.924603 "Mamu-A01 0.920470 0.709677 0.517494  ... \n", "HLA-B4501 0.238316 0.993333 "Mamu-A02 0.881034 0.692557 0.532768  ... \n", "\n",  " netmhc_f1 netmhc_tau netmhcpan_auc  netmhcpan_f1 netmhcpan_tausmmpmbec_cpp_auc smmpmbec_cpp_f1  \\\n", "allele \n", "HLA-A0201 0.880963 0.637338 0.927358 0.885121 "overall 0.800909 0.582258 0.932924 0.793170 0.579586  \n", "HLA-A0301 0.885106 0.611240 0.933966 0.897275 "H-2-DB 0.621212 0.600337 0.874574 0.577236 0.574262 \n",  "H-2-KB 0.813675 0.573199 0.825565 0.665354 0.486836 \n",  "H-2-KD 0.657718 0.403275 0.819189 0.645570 0.390333 \n",  "HLA-A0101 0.619565 0.524866 0.894895 0.594286 0.498767  \n", "HLA-A0201 0.884336 0.635498 0.930479  0.880963 0.637338 0.927358 0.885121 \n",  "HLA-A0202 0.755556 0.627143 0.898697 0.769231 0.624280 \n",  "HLA-A0203 0.948626 0.586911 0.974158 0.944578 0.591463 \n",  "HLA-A0206 0.872902 0.543184 0.910796 0.866258 0.535067  \n", "HLA-A0301 0.900621 0.629236 0.927287  0.885106 0.611240 0.933966 0.897275 \n",  "HLA-A1101 0.883402 0.632199 0.945065 0.887671 0.625794 \n",  "HLA-A2301 0.773842 0.605598 0.895229 0.788406 0.636944 \n",  "HLA-A2402 0.632911 0.575710 0.892876 0.693069 0.600686 \n",  "HLA-A2501 0.666667 0.151836 0.998540 0.888889 0.153968  \n", "HLA-A2601 0.541176 0.436646 0.942279  0.640000 0.4516660.927339 0.603053  \n", "HLA-B0801 0.701671 0.606762 0.940555 0.760000 "HLA-A2602 0.766839 0.525365 0.957811 0.839378 0.561093  \n", "HLA-B5101 0.610169 0.406973 0.927621 0.395604 "HLA-A2603 0.542373 0.366317 0.934300 0.581818 0.426438  \n", "HLA-B5701 0.642623 0.460133 0.929923 0.709091 "HLA-A2902 0.644068 0.619830 0.882377 0.633333 0.641257  \n", "HLA-B0702 0.855011 0.604720 0.897928 0.857719 "HLA-A3001 0.731959 0.456482 0.871974 0.746114 0.459857 \n",  "HLA-A3002 0.663438 0.342161 0.732749 0.611260 0.320577  \n", "HLA-A3101 0.833958 0.525026 0.859261  0.822335 0.5289410.851270 0.837037  \n", "HLA-A1101 0.887671 0.625794 0.944205 0.882514 "HLA-A3201 0.772881 0.448284 0.907161 0.766423 0.480669  \n", "HLA-A0101 0.594286 0.498767 0.832665 0.437811 "HLA-A3301 0.868327 0.587112 0.931156 0.829175 0.612147  \n", "HLA-A0206 0.866258 0.535067 0.904317 0.878282 "HLA-A6801 0.924791 0.571403 0.948907 0.923944 0.599562  \n", "HLA-A6802 0.922636 0.652332 0.964197  0.900293 0.6532160.965793 0.928775  \n", "HLA-A3001 0.746114 0.459857 0.869935 0.692875 \n",  "HLA-A0203 0.944578 0.591463 0.972885 0.946746 \n",  "HLA-B3901 0.744186 0.316739 0.949708 0.708333 \n",  "HLA-B1501 0.823245 0.589097 0.936063 0.819048 \n",  "HLA-B1517 0.710280 0.448575 0.899620 0.652542 \n",  "HLA-A2402 0.693069 0.600686 0.848915 0.633416 \n",  "H-2-DB 0.577236 0.574262 0.884187 0.628571 "HLA-A6901 0.698413 0.335339 0.944257 0.680851 0.327432  \n", "H-2-KB 0.665354 0.486836 0.915994 0.859967 "HLA-A8001 0.434783 0.182374 0.980799 0.434783 0.186524  \n", "HLA-B3501 0.711027 0.514413 0.823734 0.705411 "HLA-B0702 0.869383 0.606014 0.913527 0.855011 0.604720  \n", "HLA-A6801 0.923944 0.599562 0.944553 0.924347 "HLA-B0801 0.776053 0.629519 0.942822 0.701671 0.606762  \n", "HLA-B0802 0.190476 0.393833 0.989590  0.571429 0.4105790.987214 0.105263  \n", "HLA-B1801 0.380952 0.234201 0.787782 0.315789 \n",  "HLA-B5301 0.753623 0.559543 0.821328 0.734177 "HLA-B0803 0.000000 0.318249 0.952346 0.000000 0.315978  \n", "HLA-A3301 0.829175 0.612147 0.907414 0.855098 "HLA-B1501 0.846512 0.591735 0.935596 0.823245 0.589097  \n", "HLA-A6901 0.680851 0.327432 0.954868 0.689655 "HLA-B1503 0.592593 0.468922 0.870064 0.588235 0.522577  \n", "HLA-B1509 0.187500 0.354311 0.922907  0.176471 0.4480990.894618 0.187500  \n", "HLA-A3201 0.766423 0.480669 0.832013 0.580796 "HLA-B1517 0.637931 0.422497 0.934516 0.710280 0.448575  \n", "HLA-B5801 0.805195 0.531508 0.905645 0.817757 "HLA-B1801 0.358974 0.237118 0.789549 0.380952 0.234201  \n", "HLA-B2703 0.000000 0.067451 0.053658  NaN 0.000000 0.067451  \n", "HLA-A3002 0.611260 0.320577 0.754271 0.704104 "HLA-B2705 0.285714 0.430561 0.943860 0.400000 0.377208  \n", "HLA-A2501 0.888889 0.153968 0.992701 0.727273 "HLA-B3501 0.712000 0.515205 0.836281 0.711027 0.514413  \n", "HLA-A2602 0.839378 0.561093 0.942981 0.790244 "HLA-B3801 0.000000 0.513269 0.980074 0.000000 0.652173  \n", "HLA-B4402 0.607143 0.598960 0.802018 0.570652 "HLA-B3901 0.750000 0.305138 0.980065 0.744186 0.316739  \n", "HLA-B4001 0.829787 0.635308 0.920678  0.845570 0.6194180.862331 0.674487 \n",  "HLA-A2301 0.788406 0.636944 0.849381 0.745000  \n", "Mamu-A02 0.748092 0.524622 0.810692 0.640000 "HLA-B4002 0.758621 0.456242 0.918651 0.909091 0.518720  \n", "HLA-A8001 0.434783 0.186524 0.990015 0.518519 "HLA-B4402 0.568807 0.574916 0.934554 0.607143 0.598960  \n", "HLA-B4403 0.766304 0.541066 0.891047  0.775956 0.587824 0.796454 0.754902 \n",  "HLA-B4501 1.000000 0.263574 0.993333 0.800000 0.246426  \n", "HLA-B4601 0.000000 NaN NaN 0.000000 NaN  \n", "HLA-B3801 0.000000 0.652173 0.949206 0.000000 \n",  "HLA-B2705 0.400000 0.377208 0.941682 0.304348 \n",  "HLA-A2603 0.581818 0.426438 0.843194 0.509091 \n",  "Mamu-A01 0.706897 0.539013 0.839390 0.609272 \n",  "HLA-B0803 0.000000 0.315978 0.973333 0.000000 \n",  "H-2-KD 0.645570 0.390333 0.753692 0.538462 \n",  "HLA-B1503 0.588235 0.522577 0.839417 0.523364 \n",  "HLA-A0202 0.769231 0.624280 0.882206 0.727273 "HLA-B5101 0.428571 0.365307 0.948695 0.610169 0.406973  \n", "HLA-A2902 0.633333 0.641257 0.871795 0.655172 "HLA-B5301 0.733813 0.515585 0.885722 0.753623 0.559543  \n", "HLA-B5401 0.800000 0.300252 0.845946  0.727273 0.3498260.839189 0.727273  \n", "HLA-B4002 0.909091 0.518720 0.934524 0.758621 "HLA-B5701 0.741840 0.484975 0.883077 0.642623 0.460133  \n", "HLA-B4501 0.800000 0.246426 1.000000 0.888889 "HLA-B5801 0.827411 0.545132 0.882016 0.805195 0.531508 \n",  "Mamu-A01 0.694915 0.569423 0.912755 0.706897 0.539013 \n",  "Mamu-A02 0.767123 0.598964 0.883087 0.748092 0.524622  \n", "\n",  " smmpmbec_cpp_auc smmpmbec_cpp_f1  smmpmbec_cpp_tau test_sizetrain_size mhcflurry standard_tau  \\\n", "allele \n", "HLA-A0201 0.626224 2126 9565 0.622718 "overall 0.919208 0.784295 0.561996 27680  \n", "HLA-A0301 0.610891 811 6141 0.601211 "H-2-DB 0.884187 0.628571 0.571252 564 \n",  "H-2-KB 0.915994 0.859967 0.589218 558 \n",  "H-2-KD 0.753692 0.538462 0.365247 229 \n",  "HLA-A0101 0.832665 0.437811 0.428064 696  \n", "HLA-A0201 0.927358 0.885121  0.626224 2126 9565 0.622718 \n",  "HLA-A0202 0.882206 0.727273 0.606938 126 \n",  "HLA-A0203 0.972885 0.946746 0.583908 651 \n",  "HLA-A0206 0.904317 0.878282 0.527571 682  \n", "HLA-A0301 0.933966 0.897275  0.610891 811 6141 0.601211 \n",  "HLA-A1101 0.944205 0.882514 0.618388 723 \n",  "HLA-A2301 0.849381 0.745000 0.561259 391 \n",  "HLA-A2402 0.848915 0.633416 0.537589 573 \n",  "HLA-A2501 0.992701 0.727273 0.151997 416  \n", "HLA-A2601 0.927339 0.603053  0.422900 13332894 0.432822  \n", "HLA-B0801 0.618953 940 2267 0.616177 "HLA-A2602 0.942981 0.790244 0.531805 413  \n", "HLA-B5101 0.344534 854 1734 0.379767 "HLA-A2603 0.843194 0.509091 0.306741 312  \n", "HLA-B5701 0.569615 815 1857 0.548574 "HLA-A2902 0.871795 0.655172 0.612364 118  \n", "HLA-B0702 0.563960 813 3412 0.587399 "HLA-A3001 0.869935 0.692875 0.505244 660 \n",  "HLA-A3002 0.754271 0.704104 0.354956 420  \n", "HLA-A3101 0.851270 0.837037  0.502586 7244796 0.505116  \n", "HLA-A1101 0.618388 723 5399 0.611919 "HLA-A3201 0.832013 0.580796 0.493693 449  \n", "HLA-A0101 0.428064 696 3725 0.519116 "HLA-A3301 0.907414 0.855098 0.572158 473  \n", "HLA-A0206 0.527571 682 4827 0.519496 "HLA-A6801 0.944553 0.924347 0.556418 527  \n", "HLA-A6802 0.965793 0.928775  0.629530 6694768 0.634703 \n",  "HLA-A3001 0.505244 660 2040 0.520738 \n",  "HLA-A0203 0.583908 651 5542 0.595852 \n",  "HLA-B3901 0.296639 641 886 0.288446  \n", "HLA-B1501 0.590100 633 3213 0.590860 \n",  "HLA-B1517 0.406582 582 846 0.410409 \n",  "HLA-A2402 0.537589 573 2533 0.578611 \n",  "H-2-DB 0.571252 564 3216 0.618274 "HLA-A6901 0.954868 0.689655 0.322498 470  \n", "H-2-KB 0.589218 558 3407 0.570651 "HLA-A8001 0.990015 0.518519 0.183987 379  \n", "HLA-B3501 0.501630 542 2397 0.517529 "HLA-B0702 0.897928 0.857719 0.563960 813  \n", "HLA-A6801 0.556418 527 3184 0.553065 "HLA-B0801 0.940555 0.760000 0.618953 940  \n", "HLA-B0802 0.987214 0.105263  0.385838 509487 0.364774 \n",  "HLA-B1801 0.215534 503 2052 0.230967  \n", "HLA-B5301 0.495308 485 1018 0.529645 "HLA-B0803 0.973333 0.000000 0.314266 234  \n", "HLA-A3301 0.572158 473 3040 0.593153 "HLA-B1501 0.936063 0.819048 0.590100 633  \n", "HLA-A6901 0.322498 470 2079 0.322656 "HLA-B1503 0.839417 0.523364 0.444917 165  \n", "HLA-B1509 0.894618 0.187500  0.364673 466346 0.294024  \n", "HLA-A3201 0.493693 449 640 0.540213 "HLA-B1517 0.899620 0.652542 0.406582 582  \n", "HLA-B5801 0.582026 445 2564 0.588062 "HLA-B1801 0.787782 0.315789 0.215534 503  \n", "HLA-B2703 NaN 0.000000 NaN  441433 0.029998  \n", "HLA-A3002 0.354956 420 1430 0.343652 "HLA-B2705 0.941682 0.304348 0.416884 314  \n", "HLA-A2501 0.151997 416 519 0.151224 "HLA-B3501 0.823734 0.705411 0.501630 542  \n", "HLA-A2602 0.531805 413 202 0.479073 "HLA-B3801 0.949206 0.000000 0.547438 351  \n", "HLA-B4402 0.377900 411 1705 0.548878 "HLA-B3901 0.949708 0.708333 0.296639 641  \n", "HLA-B4001 0.862331 0.674487  0.520725 4072718 0.613517  \n", "HLA-A2301 0.561259 391 2021 0.592758 \n",  "Mamu-A02 0.478589 388 938 0.502013 "HLA-B4002 0.934524 0.758621 0.455548 74  \n", "HLA-A8001 0.183987 379 782 0.166354 "HLA-B4402 0.802018 0.570652 0.377900 411  \n", "HLA-B4403 0.796454 0.754902  0.432021 378 913 0.431010 \n",  "HLA-B4501 1.000000 0.888889 0.251301 65  \n", "HLA-B4601 NaN 378 1424 0.000000  NaN 378  \n", "HLA-B3801 0.547438 351 136 0.523753 \n",  "HLA-B2705 0.416884 314 3028 0.438390 \n",  "HLA-A2603 0.306741 312 205 0.319324 \n",  "Mamu-A01 0.469975 274 2264 0.525326 \n",  "HLA-B0803 0.314266 234 217 0.289431 \n",  "H-2-KD 0.365247 229 452 0.321850 \n",  "HLA-B1503 0.444917 165 429 0.426175 \n",  "HLA-A0202 0.606938 126 3919 0.644894 "HLA-B5101 0.927621 0.395604 0.344534 854  \n", "HLA-A2902 0.612364 118 2397 0.625060 "HLA-B5301 0.821328 0.734177 0.495308 485  \n", "HLA-B5401 0.839189 0.727273  0.333600 791019 0.303840  \n", "HLA-B4002 0.455548 74 866 0.480289 "HLA-B5701 0.929923 0.709091 0.569615 815  \n", "HLA-B4501 0.251301 65 889 0.261062 "HLA-B5801 0.905645 0.817757 0.582026 445 \n",  "Mamu-A01 0.839390 0.609272 0.469975 274 \n",  "Mamu-A02 0.810692 0.640000 0.478589 388  \n", "\n",  " mhcflurry standard_f1 mhcflurry standard_auc train_size  \n", "allele \n", "HLA-A0201 0.874891 0.925388 "overall NaN  \n", "HLA-A0301 0.879144 0.922855 "H-2-DB 3216  \n", "HLA-A0201 0.874891 0.925388 "H-2-KB 3407  \n", "HLA-A0301 0.879144 0.922855 "H-2-KD 452  \n", "HLA-A2601 0.553719 0.931268 "HLA-A0101 3725  \n", "HLA-B0801 0.779736 0.949331 "HLA-A0201 9565  \n", "HLA-B5101 0.418605 0.946123 "HLA-A0202 3919  \n", "HLA-B5701 0.701863 0.923588 "HLA-A0203 5542  \n", "HLA-B0702 0.835165 0.909692 "HLA-A0206 4827  \n", "HLA-A3101 0.816583 0.847396 "HLA-A0301 6141  \n", "HLA-A1101 0.884298 0.937280 5399  \n", "HLA-A0101 0.560000 0.908668 "HLA-A2301 2021  \n", "HLA-A0206 0.880779 0.898990 "HLA-A2402 2533  \n", "HLA-A6802 0.885845 0.968637 "HLA-A2501 519  \n", "HLA-A3001 0.749367 0.888110 "HLA-A2601 2894  \n", "HLA-A0203 0.957041 0.974815 "HLA-A2602 202  \n", "HLA-B3901 0.666667 0.943377 "HLA-A2603 205  \n", "HLA-B1501 0.830918 0.938188 "HLA-A2902 2397  \n", "HLA-B1517 0.639004 0.909998 "HLA-A3001 2040  \n", "HLA-A2402 0.583784 0.865991 "HLA-A3002 1430  \n", "H-2-DB 0.563877 0.892264 "HLA-A3101 4796  \n", "H-2-KB 0.812165 0.911974 "HLA-A3201 640  \n", "HLA-B3501 0.714286 0.828331 "HLA-A3301 3040  \n", "HLA-A6801 0.905292 0.941373 \n",  "HLA-B0802 0.000000 0.974089 \n",  "HLA-B1801 0.333333 0.775038 3184  \n", "HLA-B5301 0.713253 0.845182 \n",  "HLA-A3301 0.837989 0.923011 "HLA-A6802 4768  \n", "HLA-A6901 0.721311 0.953569 \n",  "HLA-B1509 0.216216 0.861990 2079  \n", "HLA-A3201 0.756410 0.910653 "HLA-A8001 782  \n", "HLA-B5801 0.827763 0.907100 "HLA-B0702 3412  \n", "HLA-B2703 0.000000 NaN "HLA-B0801 2267  \n", "HLA-A3002 0.631313 0.740308 "HLA-B0802 487  \n", "HLA-A2501 0.500000 0.991241 "HLA-B0803 217  \n", "HLA-A2602 0.756219 0.913016 "HLA-B1501 3213  \n", "HLA-B4402 0.488599 0.887989 "HLA-B1503 429  \n", "HLA-B4001 0.654088 0.913586 "HLA-B1509 346  \n", "HLA-A2301 0.746356 0.874270 "HLA-B1517 846  \n", "Mamu-A02 0.657459 0.867954 "HLA-B1801 2052  \n", "HLA-A8001 0.333333 0.966590 "HLA-B2703 433  \n", "HLA-B4403 0.719388 0.790096 "HLA-B2705 3028  \n", "HLA-B4601 0.000000 NaN "HLA-B3501 2397  \n", "HLA-B3801 0.000000 0.935900 136  \n", "HLA-B2705 0.520000 0.947973 "HLA-B3901 886  \n", "HLA-A2603 0.576271 0.877150 "HLA-B4001 2718  \n", "Mamu-A01 0.719424 0.920975 "HLA-B4002 866  \n", "HLA-B0803 0.000000 0.910123 "HLA-B4402 1705  \n", "H-2-KD 0.594203 0.750622 "HLA-B4403 913  \n", "HLA-B1503 0.551020 0.820937 "HLA-B4501 889  \n", "HLA-A0202 0.782609 0.903548 "HLA-B4601 1424  \n", "HLA-A2902 0.644068 0.873830 "HLA-B5101 1734 \n",  "HLA-B5301 1018  \n", "HLA-B5401 0.727273 0.797297 1019  \n", "HLA-B4002 0.709677 0.902778 "HLA-B5701 1857  \n", "HLA-B4501 0.750000 0.996667 "HLA-B5801 2564 \n",  "Mamu-A01 2264 \n",  "Mamu-A02 938  \n", "\n",  "[55 "[54  rows x 38 285  columns]" ]  },  "execution_count": 29, 20,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "threshold = 1000\n",  "big_model = 6\n",  "small_model = 5\n",  "extra_cols "scores_df  = collections.defaultdict(list)\n", "for (allele, row) in df.iterrows():\n",  " for metric in [\"auc\", \"f1\", \"tau\"]:\n",  " model "predictors  = big_model if row.train_size >= threshold else small_model\n",  " extra_cols[\"mhcflurry standard_%s\" % metric].append(row[\"mhcflurry %s_%s\" % (model, metric)])\n",  " \n",  "for (col, values) in extra_cols.items():\n",  " df[col] validation_df_with_mhcflurry_results.columns[4:]\n",  "pairs  = values\n", [\n",  " (\"overall\", validation_df_with_mhcflurry_results)\n",  "] + list(validation_df_with_mhcflurry_results.groupby(\"allele\"))\n",  "\n",  "df" "for (allele, grouped) in pairs:\n",  " scores_df[\"allele\"].append(allele)\n",  " scores_df[\"test_size\"].append(len(grouped.meas))\n",  " for predictor in predictors:\n",  " scores = make_scores(grouped.meas, grouped[predictor])\n",  " for (key, value) in scores.items():\n",  " scores_df[\"%s_%s\" % (predictor, key)].append(value)\n",  " \n",  "scores_df = pandas.DataFrame(scores_df)\n",  "scores_df[\"train_size\"] = [\n",  " len(set(all_train_data[a].original_peptides)) if a != 'overall' else numpy.nan\n",  " for a in scores_df.allele\n",  "]\n",  "scores_df.index = scores_df.allele\n",  "scores_df"  ]  },  {  "cell_type": "code",  "execution_count": 51, 15,  "metadata": {  "collapsed": false  },  "outputs": [  {  "data": {  "text/plain": "name": "stdout",  "output_type": "stream",  "text":  [ "mhcflurry 4_tau 0.447560\n",  "mhcflurry 0_tau 0.449200\n",  "mhcflurry 3_tau 0.449642\n",  "mhcflurry 7_tau 0.462858\n",  "mhcflurry 5_tau 0.468839\n",  "mhcflurry 1_tau 0.471471\n",  "smmpmbec_cpp_tau 0.471492\n",  "mhcflurry 2_tau 0.472481\n",  "mhcflurry standard_tau 0.472755\n",  "mhcflurry 6_tau 0.474900\n",  "netmhc_tau 0.483207\n",  "netmhcpan_tau 0.491046\n",  "mhcflurry 3_f1 0.533349\n",  "mhcflurry 7_f1 0.543681\n",  "mhcflurry 2_f1 0.630669\n",  "mhcflurry standard_f1 0.631175\n",  "mhcflurry 6_f1 0.635060\n",  "mhcflurry 5_f1 0.636095\n",  "mhcflurry 0_f1 0.636355\n",  "smmpmbec_cpp_f1 0.637798\n",  "mhcflurry 1_f1 0.644236\n",  "mhcflurry 4_f1 0.649554\n",  "netmhc_f1 0.659745\n",  "netmhcpan_f1 0.670119\n",  "mhcflurry 3_auc 0.881133\n",  "mhcflurry 0_auc 0.888551\n",  "mhcflurry 4_auc 0.890536\n",  "smmpmbec_cpp_auc 0.895268\n",  "mhcflurry 7_auc 0.898431\n",  "mhcflurry 5_auc 0.900119\n",  "mhcflurry standard_auc 0.900856\n",  "mhcflurry 1_auc 0.901088\n",  "mhcflurry 6_auc 0.903171\n",  "mhcflurry 2_auc 0.903755\n",  "netmhc_auc 0.909872\n",  "netmhcpan_auc 0.913077\n",  "test_size 556.672727\n",  "train_size 2463.400000\n",  "dtype: float64" "overall H-2-DB H-2-KB H-2-KD HLA-A0101 HLA-A0201 HLA-A0202 HLA-A0203 HLA-A0206 HLA-A0301 HLA-A1101 HLA-A2301 HLA-A2402 HLA-A2501 HLA-A2601 HLA-A2602 HLA-A2603 HLA-A2902 HLA-A3001 HLA-A3002 HLA-A3101 HLA-A3201 HLA-A3301 HLA-A6801 HLA-A6802 HLA-A6901 HLA-A8001 HLA-B0702 HLA-B0801 HLA-B0802 HLA-B0803 HLA-B1501 HLA-B1503 HLA-B1509 HLA-B1517 HLA-B1801 HLA-B2703 HLA-B2705 HLA-B3501 HLA-B3801 HLA-B3901 HLA-B4001 HLA-B4002 HLA-B4402 HLA-B4403 HLA-B4501 HLA-B4601 HLA-B5101 HLA-B5301 HLA-B5401 HLA-B5701 HLA-B5801 Mamu-A01 Mamu-A02\n",  "(54, 285)\n"  ]},  "execution_count": 51,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "df.mean().sort(inplace=False)" "print(\" \".join(scores_df.index))\n",  "print(scores_df.shape)"  ]  },  {  "cell_type": "code",  "execution_count": 50, 16,  "metadata": {  "collapsed": false false,  "scrolled": true  },  "outputs": [  {  "data": {  "text/plain": "name": "stdout",  "output_type": "stream",  "text":  [ "allele overall\n",  "test_size 27680\n",  "netmhcpan_auc 0.9329235\n",  "netmhc_auc 0.9299468\n",  "mhcflurry 4_tau 0.496057\n", 66_auc 0.9276946\n",  "mhcflurry 0_tau 0.502704\n",  "smmpmbec_cpp_tau 0.516050\n", ensemble all not impute_auc 0.9274469\n",  "mhcflurry 3_tau 0.522841\n", ensemble all_auc 0.9273025\n",  "mhcflurry 7_tau 0.525517\n", ensemble all impute_auc 0.9270227\n",  "mhcflurry 5_tau 0.528831\n", 78_auc 0.9269599\n",  "mhcflurry 1_tau 0.532539\n", 30_auc 0.9267281\n",  "mhcflurry 2_tau 0.534358\n", 34_auc 0.926603\n",  "mhcflurry standard_tau 0.534703\n", ensemble big dropout_auc 0.9265897\n",  "mhcflurry 6_tau 0.534703\n",  "netmhcpan_tau 0.534936\n",  "netmhc_tau 0.536833\n", 2_auc 0.9265458\n",  "mhcflurry 3_f1 0.603511\n", 6_auc 0.926512\n",  "mhcflurry 7_f1 0.609657\n", 58_auc 0.9265101\n",  "mhcflurry 26_auc 0.9264645\n",  "mhcflurry 70_auc 0.926379\n",  "mhcflurry ensemble big dropout impute_auc 0.9263097\n",  "mhcflurry 54_auc 0.9262953\n",  "mhcflurry 50_auc 0.9261597\n",  "mhcflurry ensemble small_auc 0.9260523\n",  "mhcflurry 38_auc 0.9256249\n",  "mhcflurry ensemble small impute_auc 0.9255788\n",  "mhcflurry 74_auc 0.9254442\n",  "mhcflurry 18_auc 0.9253663\n",  "mhcflurry ensemble big_auc 0.9252539\n",  "mhcflurry 62_auc 0.9252499\n",  "mhcflurry 1_auc 0.9251363\n",  "mhcflurry 25_auc 0.925059\n",  "mhcflurry 46_auc 0.9250404\n",  "mhcflurry 77_auc 0.9250151\n",  "mhcflurry 42_auc 0.9249553\n",  "mhcflurry 41_auc 0.9248634\n",  "mhcflurry 22_auc 0.924837\n",  "mhcflurry ensemble big impute_auc 0.924693\n",  "mhcflurry 17_auc 0.9245582\n",  "mhcflurry 14_auc 0.9243773\n",  "mhcflurry 10_auc 0.9241365\n",  "mhcflurry 13_auc 0.9236454\n",  "mhcflurry 37_auc 0.9235483\n",  "mhcflurry 5_auc 0.9232581\n",  "mhcflurry 29_auc 0.923079\n",  "mhcflurry 61_auc 0.9225573\n",  "mhcflurry 45_auc 0.92203\n",  "mhcflurry 49_auc 0.9218943\n",  "mhcflurry 73_auc 0.9215377\n",  "mhcflurry 9_auc 0.9211544\n",  "mhcflurry 65_auc 0.9211082\n",  "mhcflurry 53_auc 0.9204571\n",  "mhcflurry 33_auc 0.9201546\n",  "mhcflurry 21_auc 0.9200809\n",  "smmpmbec_cpp_auc 0.9192085\n",  "mhcflurry 69_auc 0.9188508\n",  "mhcflurry 57_auc 0.9187933\n",  "mhcflurry 32_auc 0.9182587\n",  "mhcflurry 16_auc 0.9179979\n",  "mhcflurry 8_auc 0.9177871\n",  "mhcflurry 76_auc 0.9176313\n",  "mhcflurry 52_auc 0.9172838\n",  "mhcflurry 0_auc 0.916791\n",  "mhcflurry 24_auc 0.9167361\n",  "mhcflurry 68_auc 0.916697\n",  "mhcflurry 44_auc 0.9166833\n",  "mhcflurry 40_auc 0.9164816\n",  "mhcflurry 12_auc 0.9159834\n",  "mhcflurry 72_auc 0.9157665\n",  "mhcflurry 36_auc 0.9156711\n",  "mhcflurry 56_auc 0.9155434\n",  "mhcflurry 20_auc 0.9154917\n",  "mhcflurry 64_auc 0.9154197\n",  "mhcflurry 48_auc 0.9146821\n",  "mhcflurry 4_auc 0.9144389\n",  "mhcflurry 60_auc 0.9143242\n",  "mhcflurry 28_auc 0.9140373\n",  "mhcflurry 67_auc 0.9113344\n",  "mhcflurry 63_auc 0.9107003\n",  "mhcflurry ensemble small dropout impute_auc 0.9104685\n",  "mhcflurry 23_auc 0.9101152\n",  "mhcflurry 35_auc 0.9100286\n",  "mhcflurry ensemble small dropout_auc 0.9096992\n",  "mhcflurry 39_auc 0.9095753\n",  "mhcflurry 15_auc 0.9095053\n",  "mhcflurry 47_auc 0.9094201\n",  "mhcflurry 51_auc 0.9094098\n",  "mhcflurry 7_auc 0.9093973\n",  "mhcflurry 31_auc 0.9093858\n",  "mhcflurry 71_auc 0.9092001\n",  "mhcflurry 3_auc 0.9091138\n",  "mhcflurry 75_auc 0.9087963\n",  "mhcflurry 19_auc 0.9085923\n",  "mhcflurry 55_auc 0.9083305\n",  "mhcflurry 27_auc 0.9083127\n",  "mhcflurry 79_auc 0.9080429\n",  "mhcflurry 11_auc 0.9079513\n",  "mhcflurry 59_auc 0.9077703\n",  "mhcflurry 43_auc 0.9072028\n",  "netmhc_f1 0.800909\n",  "mhcflurry ensemble small impute_f1 0.7979408\n",  "mhcflurry ensemble small_f1 0.7967471\n",  "mhcflurry 61_f1 0.7939957\n",  "mhcflurry 53_f1 0.7935798\n",  "netmhcpan_f1 0.79317\n",  "mhcflurry 5_f1 0.7930784\n",  "mhcflurry 25_f1 0.7927928\n",  "mhcflurry 37_f1 0.7925502\n",  "mhcflurry 13_f1 0.7920404\n",  "mhcflurry 1_f1 0.7919847\n",  "mhcflurry 29_f1 0.7918618\n",  "mhcflurry 33_f1 0.7918418\n",  "mhcflurry 77_f1 0.7917902\n",  "mhcflurry 21_f1 0.7917156\n",  "mhcflurry 41_f1 0.7915733\n",  "mhcflurry 17_f1 0.7913087\n",  "mhcflurry 69_f1 0.7904965\n",  "mhcflurry 57_f1 0.7899725\n",  "mhcflurry 73_f1 0.7898332\n",  "mhcflurry 49_f1 0.7892845\n",  "mhcflurry 65_f1 0.7891668\n",  "mhcflurry 45_f1 0.7888004\n",  "mhcflurry 9_f1 0.7885644\n",  "mhcflurry ensemble big_f1 0.7880386\n",  "mhcflurry ensemble big impute_f1 0.7876643\n",  "smmpmbec_cpp_f1 0.707976\n", 0.7842948\n",  "mhcflurry 0_f1 0.709276\n", ensemble all impute_f1 0.7834421\n",  "mhcflurry standard_f1 0.710507\n", ensemble all_f1 0.7831562\n",  "mhcflurry 6_f1 0.710507\n", ensemble all not impute_f1 0.7829103\n",  "mhcflurry 46_f1 0.7804512\n",  "mhcflurry ensemble big dropout impute_f1 0.7801976\n",  "mhcflurry 74_f1 0.7798017\n",  "mhcflurry 62_f1 0.7797805\n",  "mhcflurry 18_f1 0.7796728\n",  "mhcflurry 30_f1 0.7796317\n",  "mhcflurry 10_f1 0.7794203\n",  "mhcflurry 26_f1 0.7793574\n",  "mhcflurry ensemble big dropout_f1 0.7791847\n",  "mhcflurry 38_f1 0.7791503\n",  "mhcflurry 58_f1 0.7790845\n",  "mhcflurry 70_f1 0.7790094\n",  "mhcflurry 34_f1 0.778719\n",  "mhcflurry 2_f1 0.711558\n", 0.7787089\n",  "mhcflurry 6_f1 0.7786206\n",  "mhcflurry 54_f1 0.7785537\n",  "mhcflurry 22_f1 0.7784216\n",  "mhcflurry 42_f1 0.7783621\n",  "mhcflurry 66_f1 0.7782664\n",  "mhcflurry 14_f1 0.7778355\n",  "mhcflurry 50_f1 0.7767733\n",  "mhcflurry 78_f1 0.7766462\n",  "mhcflurry 72_f1 0.7718351\n",  "mhcflurry 16_f1 0.7716651\n",  "mhcflurry 0_f1 0.7701976\n",  "mhcflurry 8_f1 0.7691697\n",  "mhcflurry 76_f1 0.7684735\n",  "mhcflurry 24_f1 0.7682127\n",  "mhcflurry 20_f1 0.7681332\n",  "mhcflurry 68_f1 0.7677677\n",  "mhcflurry 56_f1 0.7673442\n",  "mhcflurry 32_f1 0.7669131\n",  "mhcflurry 36_f1 0.7663382\n",  "mhcflurry 44_f1 0.7659984\n",  "mhcflurry 52_f1 0.7656837\n",  "mhcflurry 60_f1 0.7630563\n",  "mhcflurry 40_f1 0.7626047\n",  "mhcflurry 48_f1 0.7621489\n",  "mhcflurry 12_f1 0.761656\n",  "mhcflurry 28_f1 0.7606356\n",  "mhcflurry 64_f1 0.7591274\n",  "mhcflurry 4_f1 0.716505\n", 0.7586207\n",  "mhcflurry 5_f1 0.717820\n",  "netmhcpan_f1 0.720971\n", 7_f1 0.7056149\n",  "mhcflurry 1_f1 0.722733\n",  "netmhc_f1 0.724166\n", 67_f1 0.7039766\n",  "mhcflurry 4_auc 0.883488\n", 63_f1 0.7034001\n",  "mhcflurry 0_auc 0.883998\n",  "smmpmbec_cpp_auc 0.890551\n", 55_f1 0.7032967\n",  "mhcflurry 3_auc 0.895132\n", 51_f1 0.7031399\n",  "mhcflurry 7_auc 0.896575\n", 15_f1 0.7030903\n",  "mhcflurry 5_auc 0.899532\n", ensemble small dropout impute_f1 0.7030565\n",  "mhcflurry 6_auc 0.900616\n", 39_f1 0.7026512\n",  "mhcflurry standard_auc 0.900616\n", 59_f1 0.7023764\n",  "mhcflurry 2_auc 0.900671\n", 19_f1 0.7019573\n",  "mhcflurry 1_auc 0.900868\n",  "netmhcpan_auc 0.902212\n",  "netmhc_auc 0.902225\n",  "test_size 652.027027\n", 23_f1 0.7015467\n",  "mhcflurry 11_f1 0.7009102\n",  "mhcflurry 43_f1 0.7006686\n",  "mhcflurry 47_f1 0.7004973\n",  "mhcflurry 3_f1 0.7004532\n",  "mhcflurry ensemble small dropout_f1 0.7000765\n",  "mhcflurry 31_f1 0.6998342\n",  "mhcflurry 27_f1 0.6995722\n",  "mhcflurry 79_f1 0.6994076\n",  "mhcflurry 71_f1 0.6992275\n",  "mhcflurry 35_f1 0.6984674\n",  "mhcflurry 75_f1 0.6968204\n",  "netmhc_tau 0.5822579\n",  "netmhcpan_tau 0.5795864\n",  "mhcflurry ensemble small_tau 0.5741622\n",  "mhcflurry ensemble small impute_tau 0.5728441\n",  "mhcflurry ensemble all not impute_tau 0.572302\n",  "mhcflurry ensemble all_tau 0.5721626\n",  "mhcflurry ensemble all impute_tau 0.5717648\n",  "mhcflurry 1_tau 0.5707296\n",  "mhcflurry 25_tau 0.5702134\n",  "mhcflurry 17_tau 0.5697772\n",  "mhcflurry 58_tau 0.5689395\n",  "mhcflurry 61_tau 0.5689001\n",  "mhcflurry 66_tau 0.5687588\n",  "mhcflurry 77_tau 0.5687417\n",  "mhcflurry 41_tau 0.5684992\n",  "mhcflurry 29_tau 0.5683163\n",  "mhcflurry 78_tau 0.5682688\n",  "mhcflurry ensemble big dropout_tau 0.5681078\n",  "mhcflurry 30_tau 0.5678771\n",  "mhcflurry ensemble big dropout impute_tau 0.5678107\n",  "mhcflurry 70_tau 0.5677436\n",  "mhcflurry 34_tau 0.5677211\n",  "mhcflurry 6_tau 0.5675603\n",  "mhcflurry 2_tau 0.5674683\n",  "mhcflurry 50_tau 0.5673749\n",  "mhcflurry ensemble big_tau 0.5673644\n",  "mhcflurry 26_tau 0.5673374\n",  "mhcflurry 54_tau 0.5672822\n",  "mhcflurry 13_tau 0.5670392\n",  "mhcflurry 38_tau 0.566927\n",  "mhcflurry 45_tau 0.5669264\n",  "mhcflurry 49_tau 0.5666638\n",  "mhcflurry 9_tau 0.5665427\n",  "mhcflurry 73_tau 0.5664529\n",  "mhcflurry 62_tau 0.56626\n",  "mhcflurry 74_tau 0.5661914\n",  "mhcflurry 18_tau 0.566101\n",  "mhcflurry ensemble big impute_tau 0.5660125\n",  "mhcflurry 5_tau 0.5659198\n",  "mhcflurry 37_tau 0.5658243\n",  "mhcflurry 22_tau 0.5655625\n",  "mhcflurry 46_tau 0.5655446\n",  "mhcflurry 14_tau 0.5654076\n",  "mhcflurry 42_tau 0.5653219\n",  "mhcflurry 33_tau 0.5652696\n",  "mhcflurry 65_tau 0.5652493\n",  "mhcflurry 10_tau 0.5648219\n",  "mhcflurry 53_tau 0.5646125\n",  "mhcflurry 21_tau 0.5633814\n",  "mhcflurry 69_tau 0.5623363\n",  "smmpmbec_cpp_tau 0.5619957\n",  "mhcflurry 57_tau 0.5610829\n",  "mhcflurry 32_tau 0.5541116\n",  "mhcflurry 16_tau 0.5537476\n",  "mhcflurry 8_tau 0.5534618\n",  "mhcflurry 76_tau 0.5528196\n",  "mhcflurry 72_tau 0.5519963\n",  "mhcflurry 24_tau 0.5519645\n",  "mhcflurry 44_tau 0.5519362\n",  "mhcflurry 0_tau 0.5518408\n",  "mhcflurry 52_tau 0.5518376\n",  "mhcflurry 40_tau 0.5517939\n",  "mhcflurry 12_tau 0.5514853\n",  "mhcflurry 56_tau 0.5511021\n",  "mhcflurry 36_tau 0.5509265\n",  "mhcflurry 48_tau 0.5503656\n",  "mhcflurry 68_tau 0.5500605\n",  "mhcflurry 60_tau 0.5493259\n",  "mhcflurry 64_tau 0.5492648\n",  "mhcflurry 20_tau 0.5487944\n",  "mhcflurry 4_tau 0.5479511\n",  "mhcflurry 28_tau 0.5470462\n",  "mhcflurry 63_tau 0.5444154\n",  "mhcflurry ensemble small dropout impute_tau 0.5435574\n",  "mhcflurry 23_tau 0.541832\n",  "mhcflurry 15_tau 0.5416039\n",  "mhcflurry 7_tau 0.5414706\n",  "mhcflurry 47_tau 0.5414117\n",  "mhcflurry 35_tau 0.5410543\n",  "mhcflurry 71_tau 0.5410063\n",  "mhcflurry 67_tau 0.5409146\n",  "mhcflurry 39_tau 0.5406932\n",  "mhcflurry ensemble small dropout_tau 0.5405695\n",  "mhcflurry 3_tau 0.5404765\n",  "mhcflurry 79_tau 0.5402274\n",  "mhcflurry 55_tau 0.5402122\n",  "mhcflurry 31_tau 0.539697\n",  "mhcflurry 51_tau 0.5385472\n",  "mhcflurry 11_tau 0.5383823\n",  "mhcflurry 75_tau 0.5380515\n",  "mhcflurry 43_tau 0.5375163\n",  "mhcflurry 19_tau 0.5373251\n",  "mhcflurry 59_tau 0.5366789\n",  "mhcflurry 27_tau 0.5362197\n",  "train_size 3386.513514\n",  "dtype: float64" NaN\n",  "Name: overall, dtype: object\n"  ]},  "execution_count": 50,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "df[df.train_size > 1000].mean().sort(inplace=False)" "print_full(scores_df.ix[\"overall\"].sort(inplace=False, ascending=False))"  ]  },  {  "cell_type": "code",  "execution_count": 47, 19,  "metadata": {  "collapsed": false  },  "outputs": [  {  "data": {  "text/html": [  "
\n",  "\n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  " \n",  "
mhcflurry 0_aucmhcflurry 0_f1mhcflurry 0_taumhcflurry 1_aucmhcflurry 1_f1mhcflurry 1_taumhcflurry 2_aucmhcflurry 2_f1mhcflurry 2_taumhcflurry 3_auc...netmhcpan_f1netmhcpan_tausmmpmbec_cpp_aucsmmpmbec_cpp_f1smmpmbec_cpp_tautest_sizetrain_sizemhcflurry standard_taumhcflurry standard_f1mhcflurry standard_auc
allele
HLA-B38010.90121600.5003590.90911900.5157320.92195200.5245270.725768...00.6521730.94920600.5474383511360.52375300.9359
\n",
  "

1 rows × 38 columns

\n",
  "
"
  ],  "text/plain": "name": "stdout",  "output_type": "stream",  "text":  [ " mhcflurry 0_auc mhcflurry 0_f1 mhcflurry 0_tau mhcflurry "train_size 3131.285714\n",  "test_size 605.371429\n",  "mhcflurry ensemble all_auc 0.904481\n",  "mhcflurry ensemble all impute_auc 0.904463\n",  "mhcflurry ensemble all not impute_auc 0.904237\n",  "mhcflurry ensemble small impute_auc 0.903239\n",  "mhcflurry ensemble small_auc 0.902855\n",  "mhcflurry 70_auc 0.901710\n",  "mhcflurry 61_auc 0.901698\n",  "mhcflurry 2_auc 0.901526\n",  "mhcflurry 25_auc 0.901514\n",  "mhcflurry 10_auc 0.901496\n",  "mhcflurry 30_auc 0.901488\n",  "mhcflurry 54_auc 0.901413\n",  "mhcflurry 42_auc 0.901378\n",  "mhcflurry 38_auc 0.901373\n",  "mhcflurry ensemble big dropout impute_auc 0.901344\n",  "mhcflurry ensemble big dropout_auc 0.901337\n",  "mhcflurry 78_auc 0.901272\n",  "mhcflurry 18_auc 0.901231\n",  "mhcflurry 66_auc 0.901220\n",  "mhcflurry 26_auc 0.901101\n",  "mhcflurry 34_auc 0.901031\n",  "mhcflurry 46_auc 0.901013\n",  "mhcflurry 74_auc 0.900951\n",  "mhcflurry 58_auc 0.900882\n",  "mhcflurry 6_auc 0.900875\n",  "mhcflurry 5_auc 0.900869\n",  "mhcflurry 62_auc 0.900825\n",  "mhcflurry 29_auc 0.900816\n",  "mhcflurry 22_auc 0.900789\n",  "mhcflurry 50_auc 0.900742\n",  "netmhcpan_auc 0.900643\n",  "mhcflurry 14_auc 0.900625\n",  "netmhc_auc 0.900374\n",  "mhcflurry 53_auc 0.899733\n",  "mhcflurry 77_auc 0.899660\n",  "mhcflurry 17_auc 0.899553\n",  "mhcflurry  1_auc \\\n",  "allele \n",  "HLA-B3801 0.901216 0 0.500359 0.909119 \n",  "\n",  " mhcflurry 0.899466\n",  "mhcflurry 73_auc 0.899449\n",  "mhcflurry 21_auc 0.899404\n",  "mhcflurry 45_auc 0.899360\n",  "mhcflurry 13_auc 0.899256\n",  "mhcflurry 9_auc 0.899235\n",  "mhcflurry 57_auc 0.899228\n",  "mhcflurry 41_auc 0.899022\n",  "mhcflurry 33_auc 0.898872\n",  "mhcflurry 37_auc 0.898646\n",  "mhcflurry 49_auc 0.898458\n",  "mhcflurry 65_auc 0.897986\n",  "mhcflurry 69_auc 0.897844\n",  "mhcflurry ensemble big impute_auc 0.897612\n",  "mhcflurry ensemble big_auc 0.897363\n",  "mhcflurry ensemble small dropout impute_auc 0.897266\n",  "mhcflurry 63_auc 0.897125\n",  "mhcflurry 67_auc 0.897119\n",  "mhcflurry 55_auc 0.897014\n",  "mhcflurry 35_auc 0.896943\n",  "mhcflurry 79_auc 0.896845\n",  "mhcflurry ensemble small dropout_auc 0.896843\n",  "mhcflurry 39_auc 0.896504\n",  "mhcflurry 43_auc 0.896449\n",  "mhcflurry 15_auc 0.896438\n",  "mhcflurry 31_auc 0.896215\n",  "mhcflurry 19_auc 0.896121\n",  "mhcflurry 71_auc 0.895993\n",  "mhcflurry 75_auc 0.895973\n",  "mhcflurry 47_auc 0.895941\n",  "mhcflurry 11_auc 0.895814\n",  "mhcflurry 7_auc 0.895711\n",  "mhcflurry 51_auc 0.895613\n",  "mhcflurry 23_auc 0.895576\n",  "mhcflurry 59_auc 0.895564\n",  "mhcflurry 27_auc 0.895380\n",  "mhcflurry 3_auc 0.894910\n",  "mhcflurry 76_auc 0.888502\n",  "mhcflurry 16_auc 0.888199\n",  "smmpmbec_cpp_auc 0.888191\n",  "mhcflurry 8_auc 0.887882\n",  "mhcflurry 56_auc 0.887530\n",  "mhcflurry 36_auc 0.886830\n",  "mhcflurry 32_auc 0.886811\n",  "mhcflurry 0_auc 0.886591\n",  "mhcflurry 68_auc 0.886177\n",  "mhcflurry 52_auc 0.886162\n",  "mhcflurry 24_auc 0.886143\n",  "mhcflurry 44_auc 0.886107\n",  "mhcflurry 20_auc 0.885845\n",  "mhcflurry 60_auc 0.885607\n",  "mhcflurry 12_auc 0.885568\n",  "mhcflurry 40_auc 0.885557\n",  "mhcflurry 72_auc 0.885176\n",  "mhcflurry 64_auc 0.884733\n",  "mhcflurry 28_auc 0.884478\n",  "mhcflurry 48_auc 0.883997\n",  "mhcflurry 4_auc 0.883439\n",  "mhcflurry ensemble small impute_f1 0.722027\n",  "mhcflurry 61_f1 0.720844\n",  "mhcflurry 5_f1 0.720426\n",  "mhcflurry ensemble small_f1 0.720226\n",  "mhcflurry 53_f1 0.719349\n",  "mhcflurry 29_f1 0.718717\n",  "mhcflurry  1_f1 mhcflurry 1_tau mhcflurry 2_auc mhcflurry 0.718588\n",  "mhcflurry 13_f1 0.718490\n",  "mhcflurry 69_f1 0.718278\n",  "mhcflurry 41_f1 0.717699\n",  "mhcflurry 33_f1 0.717482\n",  "mhcflurry ensemble big_f1 0.716870\n",  "mhcflurry ensemble big impute_f1 0.716762\n",  "mhcflurry 21_f1 0.716524\n",  "mhcflurry 77_f1 0.715732\n",  "mhcflurry 9_f1 0.715548\n",  "mhcflurry 17_f1 0.715131\n",  "netmhc_f1 0.714548\n",  "mhcflurry 45_f1 0.714293\n",  "mhcflurry 49_f1 0.713544\n",  "mhcflurry 73_f1 0.712242\n",  "mhcflurry 37_f1 0.711815\n",  "netmhcpan_f1 0.711710\n",  "mhcflurry 25_f1 0.711678\n",  "mhcflurry 65_f1 0.711592\n",  "mhcflurry 57_f1 0.710520\n",  "mhcflurry 16_f1 0.707594\n",  "mhcflurry 68_f1 0.703877\n",  "mhcflurry ensemble all not impute_f1 0.703530\n",  "mhcflurry ensemble all_f1 0.702774\n",  "mhcflurry 20_f1 0.702678\n",  "mhcflurry ensemble all impute_f1 0.701946\n",  "mhcflurry 46_f1 0.701876\n",  "mhcflurry 48_f1 0.701814\n",  "mhcflurry 0_f1 0.701446\n",  "mhcflurry 24_f1 0.700946\n",  "mhcflurry 56_f1 0.700336\n",  "mhcflurry 60_f1 0.700016\n",  "mhcflurry  2_f1 \\\n",  "allele \n",  "HLA-B3801 0 0.515732 0.921952 0 \n",  "\n",  " mhcflurry 0.699697\n",  "mhcflurry 30_f1 0.699681\n",  "mhcflurry 36_f1 0.699666\n",  "mhcflurry 38_f1 0.699596\n",  "mhcflurry 8_f1 0.698524\n",  "mhcflurry 26_f1 0.698401\n",  "mhcflurry 76_f1 0.698083\n",  "mhcflurry 32_f1 0.698014\n",  "mhcflurry 72_f1 0.697731\n",  "smmpmbec_cpp_f1 0.697506\n",  "mhcflurry ensemble big dropout impute_f1 0.697252\n",  "mhcflurry 58_f1 0.696892\n",  "mhcflurry 54_f1 0.696874\n",  "mhcflurry 18_f1 0.696667\n",  "mhcflurry 14_f1 0.696457\n",  "mhcflurry 12_f1 0.696281\n",  "mhcflurry 34_f1 0.695836\n",  "mhcflurry 22_f1 0.695792\n",  "mhcflurry 10_f1 0.695557\n",  "mhcflurry 74_f1 0.695523\n",  "mhcflurry 70_f1 0.695341\n",  "mhcflurry ensemble big dropout_f1 0.695004\n",  "mhcflurry 42_f1 0.694451\n",  "mhcflurry 44_f1 0.694241\n",  "mhcflurry 52_f1 0.693513\n",  "mhcflurry 64_f1 0.693509\n",  "mhcflurry 62_f1 0.693465\n",  "mhcflurry 50_f1 0.692919\n",  "mhcflurry 78_f1 0.692257\n",  "mhcflurry 28_f1 0.691077\n",  "mhcflurry 66_f1 0.690039\n",  "mhcflurry 6_f1 0.689937\n",  "mhcflurry 40_f1 0.687786\n",  "mhcflurry 4_f1 0.685036\n",  "mhcflurry 39_f1 0.581834\n",  "mhcflurry 63_f1 0.581534\n",  "mhcflurry 7_f1 0.580654\n",  "mhcflurry ensemble small dropout impute_f1 0.580381\n",  "mhcflurry 23_f1 0.580356\n",  "mhcflurry 51_f1 0.579608\n",  "mhcflurry 59_f1 0.579047\n",  "mhcflurry 67_f1 0.579030\n",  "mhcflurry 43_f1 0.578815\n",  "mhcflurry 19_f1 0.578126\n",  "mhcflurry 15_f1 0.578002\n",  "mhcflurry 55_f1 0.577825\n",  "mhcflurry 27_f1 0.576224\n",  "mhcflurry ensemble small dropout_f1 0.575161\n",  "mhcflurry 11_f1 0.575116\n",  "mhcflurry 79_f1 0.575072\n",  "mhcflurry 75_f1 0.574614\n",  "mhcflurry 47_f1 0.574409\n",  "mhcflurry 71_f1 0.571993\n",  "mhcflurry 3_f1 0.571441\n",  "mhcflurry 35_f1 0.571062\n",  "mhcflurry 31_f1 0.568648\n",  "mhcflurry ensemble all_tau 0.539403\n",  "mhcflurry ensemble all impute_tau 0.539144\n",  "mhcflurry ensemble all not impute_tau 0.539034\n",  "mhcflurry ensemble small impute_tau 0.535829\n",  "mhcflurry ensemble small_tau 0.534540\n",  "mhcflurry 74_tau 0.533244\n",  "mhcflurry ensemble big dropout_tau 0.533072\n",  "mhcflurry 54_tau 0.533028\n",  "mhcflurry 42_tau 0.532941\n",  "mhcflurry 18_tau 0.532831\n",  "mhcflurry 58_tau 0.532786\n",  "mhcflurry  2_tau mhcflurry 3_auc ... \\\n",  "allele ... \n",  "HLA-B3801 0.524527 0.725768 ... \n",  "\n",  " netmhcpan_f1 netmhcpan_tau smmpmbec_cpp_auc smmpmbec_cpp_f1 \\\n",  "allele \n",  "HLA-B3801 0 0.652173 0.949206 0 \n",  "\n",  " smmpmbec_cpp_tau test_size train_size mhcflurry standard_tau \\\n",  "allele \n",  "HLA-B3801 0.547438 351 136 0.523753 \n",  "\n",  " mhcflurry standard_f1 mhcflurry standard_auc \n",  "allele \n",  "HLA-B3801 0 0.9359 \n",  "\n",  "[1 rows x 38 columns]" 0.532782\n",  "mhcflurry 26_tau 0.532663\n",  "mhcflurry ensemble big dropout impute_tau 0.532544\n",  "mhcflurry 70_tau 0.532529\n",  "mhcflurry 50_tau 0.532492\n",  "mhcflurry 10_tau 0.532484\n",  "mhcflurry 34_tau 0.532405\n",  "mhcflurry 62_tau 0.532339\n",  "mhcflurry 66_tau 0.532306\n",  "mhcflurry 30_tau 0.532271\n",  "mhcflurry 78_tau 0.532237\n",  "mhcflurry 46_tau 0.532017\n",  "mhcflurry 22_tau 0.531972\n",  "mhcflurry 38_tau 0.531904\n",  "mhcflurry 6_tau 0.531836\n",  "mhcflurry 14_tau 0.531744\n",  "netmhc_tau 0.531214\n",  "mhcflurry 61_tau 0.530432\n",  "mhcflurry 29_tau 0.530146\n",  "netmhcpan_tau 0.529680\n",  "mhcflurry 53_tau 0.528153\n",  "mhcflurry 25_tau 0.527932\n",  "mhcflurry 9_tau 0.527859\n",  "mhcflurry 73_tau 0.527802\n",  "mhcflurry 5_tau 0.527698\n",  "mhcflurry 33_tau 0.527571\n",  "mhcflurry 1_tau 0.527565\n",  "mhcflurry 37_tau 0.527311\n",  "mhcflurry 13_tau 0.526856\n",  "mhcflurry 77_tau 0.526821\n",  "mhcflurry 17_tau 0.526775\n",  "mhcflurry 21_tau 0.526453\n",  "mhcflurry 41_tau 0.526033\n",  "mhcflurry 65_tau 0.525868\n",  "mhcflurry 69_tau 0.525732\n",  "mhcflurry 57_tau 0.524889\n",  "mhcflurry ensemble big_tau 0.524753\n",  "mhcflurry 45_tau 0.524161\n",  "mhcflurry 49_tau 0.523840\n",  "mhcflurry ensemble small dropout impute_tau 0.523797\n",  "mhcflurry ensemble small dropout_tau 0.523631\n",  "mhcflurry ensemble big impute_tau 0.523577\n",  "mhcflurry 55_tau 0.523336\n",  "mhcflurry 63_tau 0.523311\n",  "mhcflurry 35_tau 0.523246\n",  "mhcflurry 67_tau 0.522787\n",  "mhcflurry 15_tau 0.522759\n",  "mhcflurry 43_tau 0.522641\n",  "mhcflurry 47_tau 0.522230\n",  "mhcflurry 59_tau 0.522227\n",  "mhcflurry 71_tau 0.522160\n",  "mhcflurry 19_tau 0.522001\n",  "mhcflurry 79_tau 0.521692\n",  "mhcflurry 23_tau 0.521592\n",  "mhcflurry 7_tau 0.521547\n",  "mhcflurry 51_tau 0.521458\n",  "mhcflurry 11_tau 0.521424\n",  "mhcflurry 31_tau 0.521345\n",  "mhcflurry 39_tau 0.521240\n",  "mhcflurry 27_tau 0.521056\n",  "mhcflurry 75_tau 0.520788\n",  "mhcflurry 3_tau 0.520647\n",  "smmpmbec_cpp_tau 0.510021\n",  "mhcflurry 56_tau 0.505774\n",  "mhcflurry 16_tau 0.505668\n",  "mhcflurry 8_tau 0.505568\n",  "mhcflurry 76_tau 0.503990\n",  "mhcflurry 36_tau 0.502931\n",  "mhcflurry 32_tau 0.502738\n",  "mhcflurry 60_tau 0.502730\n",  "mhcflurry 24_tau 0.502367\n",  "mhcflurry 52_tau 0.502067\n",  "mhcflurry 12_tau 0.501610\n",  "mhcflurry 44_tau 0.501410\n",  "mhcflurry 72_tau 0.501360\n",  "mhcflurry 48_tau 0.501326\n",  "mhcflurry 0_tau 0.500921\n",  "mhcflurry 40_tau 0.500745\n",  "mhcflurry 68_tau 0.500212\n",  "mhcflurry 28_tau 0.498866\n",  "mhcflurry 64_tau 0.498777\n",  "mhcflurry 20_tau 0.498346\n",  "mhcflurry 4_tau 0.498091\n",  "dtype: float64\n"  ]},  "execution_count": 47,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "df[df.train_size < 200]" "print_full(scores_df.ix[(scores_df.index != \"overall\") & (scores_df.train_size >= 1000)].mean(0).sort(inplace=False, ascending=False))"  ]  },  {  "cell_type": "code",  "execution_count": 49, 18,  "metadata": {  "collapsed": false,  "scrolled":  false },  "outputs": [  {  "data": {  "text/plain": "name": "stdout",  "output_type": "stream",  "text":  [ "train_size 565.888889\n",  "test_size 360.666667\n",  "netmhcpan_auc 0.936087\n",  "netmhc_auc 0.926065\n",  "mhcflurry 4_tau 0.496057\n", 30_auc 0.918959\n",  "mhcflurry 0_tau 0.502704\n",  "smmpmbec_cpp_tau 0.516050\n", ensemble all not impute_auc 0.918559\n",  "mhcflurry 3_tau 0.522841\n", ensemble big dropout impute_auc 0.918455\n",  "mhcflurry 7_tau 0.525517\n", ensemble all_auc 0.918428\n",  "mhcflurry 5_tau 0.528831\n", 66_auc 0.918324\n",  "mhcflurry 1_tau 0.532539\n", ensemble big dropout_auc 0.917994\n",  "mhcflurry 2_tau 0.534358\n", ensemble all impute_auc 0.917694\n",  "mhcflurry standard_tau 0.534703\n", 70_auc 0.917616\n",  "mhcflurry 6_tau 0.534703\n",  "netmhcpan_tau 0.534936\n",  "netmhc_tau 0.536833\n", 54_auc 0.917061\n",  "mhcflurry 3_f1 0.603511\n", 38_auc 0.916187\n",  "mhcflurry 7_f1 0.609657\n",  "smmpmbec_cpp_f1 0.707976\n", 2_auc 0.916160\n",  "mhcflurry 0_f1 0.709276\n", 78_auc 0.915861\n",  "mhcflurry standard_f1 0.710507\n", 34_auc 0.915812\n",  "mhcflurry 6_f1 0.710507\n", 10_auc 0.915419\n",  "mhcflurry 2_f1 0.711558\n", 26_auc 0.915396\n",  "mhcflurry 4_f1 0.716505\n", 58_auc 0.915293\n",  "mhcflurry 5_f1 0.717820\n",  "netmhcpan_f1 0.720971\n", 22_auc 0.915185\n",  "mhcflurry 1_f1 0.722733\n",  "netmhc_f1 0.724166\n", 6_auc 0.915118\n",  "mhcflurry 18_auc 0.914417\n",  "mhcflurry ensemble small_auc 0.914335\n",  "mhcflurry 74_auc 0.913987\n",  "mhcflurry 50_auc 0.913961\n",  "mhcflurry 42_auc 0.913924\n",  "mhcflurry 62_auc 0.913588\n",  "mhcflurry 46_auc 0.912436\n",  "mhcflurry ensemble big_auc 0.912376\n",  "mhcflurry 32_auc 0.912109\n",  "mhcflurry 14_auc 0.912070\n",  "mhcflurry ensemble small impute_auc 0.912063\n",  "mhcflurry 25_auc 0.911690\n",  "mhcflurry ensemble big impute_auc 0.911365\n",  "mhcflurry 64_auc 0.910958\n",  "mhcflurry 12_auc 0.910541\n",  "mhcflurry 36_auc 0.910283\n",  "mhcflurry 16_auc 0.910084\n",  "mhcflurry 44_auc 0.909726\n",  "mhcflurry 8_auc 0.909606\n",  "mhcflurry 77_auc 0.908909\n",  "mhcflurry 4_auc 0.883488\n", 0.908750\n",  "mhcflurry 0_auc 0.883998\n", 0.908540\n",  "mhcflurry 41_auc 0.907794\n",  "mhcflurry 56_auc 0.907485\n",  "mhcflurry 48_auc 0.907180\n",  "mhcflurry 60_auc 0.907135\n",  "mhcflurry 68_auc 0.906958\n",  "mhcflurry 52_auc 0.906958\n",  "mhcflurry 24_auc 0.906896\n",  "mhcflurry 40_auc 0.906569\n",  "mhcflurry 28_auc 0.906424\n",  "mhcflurry 76_auc 0.906176\n",  "smmpmbec_cpp_auc 0.890551\n", 0.905258\n",  "mhcflurry 3_auc 0.895132\n", 20_auc 0.904779\n",  "mhcflurry 7_auc 0.896575\n", 72_auc 0.903870\n",  "mhcflurry 5_auc 0.899532\n", 0.902882\n",  "mhcflurry 6_auc 0.900616\n", 45_auc 0.900082\n",  "mhcflurry standard_auc 0.900616\n", 37_auc 0.899811\n",  "mhcflurry 2_auc 0.900671\n", 17_auc 0.898250\n",  "mhcflurry 29_auc 0.897349\n",  "mhcflurry 13_auc 0.896285\n",  "mhcflurry ensemble small dropout impute_auc 0.893958\n",  "mhcflurry 1_auc 0.900868\n",  "netmhcpan_auc 0.902212\n",  "netmhc_auc 0.902225\n",  "test_size 652.027027\n",  "train_size 3386.513514\n", 0.893086\n",  "mhcflurry 49_auc 0.889592\n",  "mhcflurry 73_auc 0.888549\n",  "mhcflurry 21_auc 0.885151\n",  "mhcflurry 65_auc 0.884282\n",  "mhcflurry ensemble small dropout_auc 0.883767\n",  "mhcflurry 9_auc 0.881965\n",  "mhcflurry 15_auc 0.881477\n",  "mhcflurry 39_auc 0.880859\n",  "mhcflurry 7_auc 0.880288\n",  "mhcflurry 61_auc 0.878961\n",  "mhcflurry 63_auc 0.877224\n",  "mhcflurry 47_auc 0.877128\n",  "mhcflurry 3_auc 0.876645\n",  "mhcflurry 31_auc 0.873236\n",  "mhcflurry 75_auc 0.873216\n",  "mhcflurry 27_auc 0.872949\n",  "mhcflurry 79_auc 0.871630\n",  "mhcflurry 23_auc 0.870978\n",  "mhcflurry 67_auc 0.870903\n",  "mhcflurry 35_auc 0.869316\n",  "mhcflurry 57_auc 0.866962\n",  "mhcflurry 69_auc 0.865545\n",  "mhcflurry 71_auc 0.864231\n",  "mhcflurry 53_auc 0.861088\n",  "mhcflurry 55_auc 0.856979\n",  "mhcflurry 33_auc 0.854178\n",  "mhcflurry 11_auc 0.851632\n",  "mhcflurry 51_auc 0.849046\n",  "mhcflurry 19_auc 0.848219\n",  "mhcflurry 59_auc 0.843894\n",  "mhcflurry 43_auc 0.841851\n",  "netmhcpan_f1 0.565589\n",  "netmhc_f1 0.527323\n",  "mhcflurry 36_f1 0.524415\n",  "mhcflurry ensemble big impute_f1 0.522032\n",  "mhcflurry 52_f1 0.519850\n",  "mhcflurry 8_f1 0.518885\n",  "mhcflurry ensemble big_f1 0.516519\n",  "mhcflurry 60_f1 0.515231\n",  "mhcflurry 72_f1 0.514527\n",  "mhcflurry 28_f1 0.514147\n",  "mhcflurry 32_f1 0.513019\n",  "mhcflurry 20_f1 0.512322\n",  "mhcflurry 64_f1 0.511607\n",  "mhcflurry 61_f1 0.511587\n",  "mhcflurry 40_f1 0.510970\n",  "mhcflurry 68_f1 0.510729\n",  "mhcflurry 4_f1 0.510062\n",  "mhcflurry 56_f1 0.509747\n",  "mhcflurry 24_f1 0.509660\n",  "mhcflurry 0_f1 0.508521\n",  "mhcflurry 44_f1 0.508226\n",  "mhcflurry 12_f1 0.507230\n",  "mhcflurry 16_f1 0.503502\n",  "mhcflurry 76_f1 0.502449\n",  "mhcflurry 48_f1 0.501195\n",  "mhcflurry 25_f1 0.500543\n",  "mhcflurry 57_f1 0.496678\n",  "mhcflurry ensemble small impute_f1 0.496230\n",  "mhcflurry 10_f1 0.495999\n",  "mhcflurry 62_f1 0.494614\n",  "smmpmbec_cpp_f1 0.493544\n",  "mhcflurry 6_f1 0.492900\n",  "mhcflurry ensemble small_f1 0.489483\n",  "mhcflurry 77_f1 0.488776\n",  "mhcflurry 37_f1 0.488472\n",  "mhcflurry 65_f1 0.488147\n",  "mhcflurry 21_f1 0.488091\n",  "mhcflurry 29_f1 0.487640\n",  "mhcflurry 13_f1 0.487430\n",  "mhcflurry 49_f1 0.487082\n",  "mhcflurry 1_f1 0.486973\n",  "mhcflurry 5_f1 0.485472\n",  "mhcflurry 73_f1 0.485431\n",  "mhcflurry 66_f1 0.483373\n",  "mhcflurry 18_f1 0.480419\n",  "mhcflurry 53_f1 0.479430\n",  "mhcflurry 69_f1 0.479176\n",  "mhcflurry 58_f1 0.478873\n",  "mhcflurry 54_f1 0.478851\n",  "mhcflurry 34_f1 0.478435\n",  "mhcflurry ensemble all impute_f1 0.478373\n",  "mhcflurry 30_f1 0.477860\n",  "mhcflurry 22_f1 0.477744\n",  "mhcflurry 74_f1 0.476893\n",  "mhcflurry 41_f1 0.476230\n",  "mhcflurry ensemble big dropout_f1 0.475875\n",  "mhcflurry 33_f1 0.475581\n",  "mhcflurry 42_f1 0.473771\n",  "mhcflurry ensemble all_f1 0.471516\n",  "mhcflurry 78_f1 0.470833\n",  "mhcflurry 45_f1 0.470476\n",  "mhcflurry 50_f1 0.470447\n",  "mhcflurry ensemble big dropout impute_f1 0.470316\n",  "mhcflurry 26_f1 0.469715\n",  "mhcflurry 70_f1 0.469639\n",  "mhcflurry 17_f1 0.469113\n",  "mhcflurry 14_f1 0.468982\n",  "mhcflurry 2_f1 0.468908\n",  "mhcflurry 46_f1 0.468425\n",  "mhcflurry 38_f1 0.468420\n",  "mhcflurry ensemble all not impute_f1 0.466306\n",  "mhcflurry 9_f1 0.466063\n",  "mhcflurry 31_f1 0.424886\n",  "mhcflurry 19_f1 0.419287\n",  "mhcflurry 23_f1 0.418466\n",  "mhcflurry 7_f1 0.418060\n",  "mhcflurry 75_f1 0.417655\n",  "mhcflurry 55_f1 0.415659\n",  "mhcflurry 63_f1 0.413056\n",  "mhcflurry 39_f1 0.412995\n",  "mhcflurry 51_f1 0.412559\n",  "mhcflurry ensemble small dropout impute_f1 0.411222\n",  "mhcflurry 11_f1 0.410162\n",  "mhcflurry 15_f1 0.408288\n",  "mhcflurry 27_f1 0.406299\n",  "mhcflurry 59_f1 0.404044\n",  "mhcflurry 47_f1 0.403607\n",  "netmhcpan_tau 0.403266\n",  "mhcflurry 67_f1 0.403010\n",  "mhcflurry 79_f1 0.400183\n",  "mhcflurry 71_f1 0.396040\n",  "mhcflurry ensemble small dropout_f1 0.394268\n",  "mhcflurry 3_f1 0.379194\n",  "mhcflurry 43_f1 0.379114\n",  "smmpmbec_cpp_tau 0.377134\n",  "netmhc_tau 0.375954\n",  "mhcflurry 35_f1 0.372391\n",  "mhcflurry ensemble all not impute_tau 0.369797\n",  "mhcflurry ensemble all_tau 0.369385\n",  "mhcflurry 26_tau 0.368776\n",  "mhcflurry ensemble all impute_tau 0.368391\n",  "mhcflurry ensemble big dropout_tau 0.368155\n",  "mhcflurry ensemble small_tau 0.367748\n",  "mhcflurry ensemble small impute_tau 0.367539\n",  "mhcflurry 66_tau 0.367271\n",  "mhcflurry 58_tau 0.367193\n",  "mhcflurry ensemble big dropout impute_tau 0.367092\n",  "mhcflurry 38_tau 0.366880\n",  "mhcflurry 78_tau 0.366839\n",  "mhcflurry 34_tau 0.366061\n",  "mhcflurry 6_tau 0.365519\n",  "mhcflurry 2_tau 0.365454\n",  "mhcflurry 10_tau 0.365429\n",  "mhcflurry 54_tau 0.364412\n",  "mhcflurry 30_tau 0.364174\n",  "mhcflurry 70_tau 0.362880\n",  "mhcflurry ensemble big_tau 0.361967\n",  "mhcflurry 16_tau 0.361946\n",  "mhcflurry 12_tau 0.361916\n",  "mhcflurry 50_tau 0.361890\n",  "mhcflurry 14_tau 0.361062\n",  "mhcflurry 25_tau 0.360795\n",  "mhcflurry 46_tau 0.360651\n",  "mhcflurry ensemble big impute_tau 0.360501\n",  "mhcflurry 44_tau 0.360119\n",  "mhcflurry 74_tau 0.359965\n",  "mhcflurry 18_tau 0.359889\n",  "mhcflurry 36_tau 0.359602\n",  "mhcflurry 64_tau 0.359470\n",  "mhcflurry 32_tau 0.359237\n",  "mhcflurry 62_tau 0.359184\n",  "mhcflurry 60_tau 0.359115\n",  "mhcflurry 4_tau 0.358225\n",  "mhcflurry 22_tau 0.357977\n",  "mhcflurry 68_tau 0.357952\n",  "mhcflurry 8_tau 0.357895\n",  "mhcflurry 42_tau 0.357797\n",  "mhcflurry 41_tau 0.357553\n",  "mhcflurry 0_tau 0.357457\n",  "mhcflurry 77_tau 0.357111\n",  "mhcflurry 13_tau 0.356615\n",  "mhcflurry 48_tau 0.356389\n",  "mhcflurry 40_tau 0.355280\n",  "mhcflurry 24_tau 0.355054\n",  "mhcflurry 52_tau 0.354026\n",  "mhcflurry 56_tau 0.353757\n",  "mhcflurry 76_tau 0.352782\n",  "mhcflurry 72_tau 0.351810\n",  "mhcflurry 45_tau 0.351479\n",  "mhcflurry 28_tau 0.351078\n",  "mhcflurry 17_tau 0.350528\n",  "mhcflurry 5_tau 0.350238\n",  "mhcflurry 37_tau 0.348835\n",  "mhcflurry 20_tau 0.348679\n",  "mhcflurry 29_tau 0.346874\n",  "mhcflurry 73_tau 0.345549\n",  "mhcflurry 1_tau 0.345142\n",  "mhcflurry ensemble small dropout impute_tau 0.340836\n",  "mhcflurry 65_tau 0.340120\n",  "mhcflurry 49_tau 0.334254\n",  "mhcflurry 23_tau 0.331433\n",  "mhcflurry 9_tau 0.330410\n",  "mhcflurry ensemble small dropout_tau 0.329995\n",  "mhcflurry 15_tau 0.328343\n",  "mhcflurry 63_tau 0.327883\n",  "mhcflurry 21_tau 0.327728\n",  "mhcflurry 7_tau 0.325875\n",  "mhcflurry 61_tau 0.324797\n",  "mhcflurry 3_tau 0.324407\n",  "mhcflurry 79_tau 0.323100\n",  "mhcflurry 27_tau 0.322717\n",  "mhcflurry 35_tau 0.322563\n",  "mhcflurry 75_tau 0.322090\n",  "mhcflurry 39_tau 0.320268\n",  "mhcflurry 47_tau 0.319710\n",  "mhcflurry 53_tau 0.319011\n",  "mhcflurry 67_tau 0.317736\n",  "mhcflurry 69_tau 0.315831\n",  "mhcflurry 71_tau 0.315799\n",  "mhcflurry 31_tau 0.314106\n",  "mhcflurry 33_tau 0.309594\n",  "mhcflurry 55_tau 0.307437\n",  "mhcflurry 57_tau 0.307218\n",  "mhcflurry 51_tau 0.305613\n",  "mhcflurry 11_tau 0.297579\n",  "mhcflurry 19_tau 0.297450\n",  "mhcflurry 59_tau 0.296802\n",  "mhcflurry 43_tau 0.290284\n",  "dtype: float64" float64\n"  ]},  "execution_count": 49,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "df[df.train_size > 1000].mean().sort(inplace=False)" "print_full(scores_df.ix[(scores_df.index != \"overall\") & (scores_df.train_size < 1000)].mean(0).sort(inplace=False, ascending=False))"  ]  },  {  "cell_type": "code",  "execution_count": 35, 21,  "metadata": {  "collapsed": false,  "scrolled":  false },  "outputs": [  {  "data": {  "text/plain": "name": "stdout",  "output_type": "stream",  "text":  [ "allele\n",  "HLA-A0201 False\n",  "HLA-A0301 False\n",  "HLA-A0201 False\n",  "HLA-A0301 False\n",  "HLA-A2601 True\n",  "HLA-B0801 True\n",  "HLA-B5101 True\n",  "HLA-B5701 True\n",  "HLA-B0702 False\n",  "HLA-A3101 False\n",  "HLA-A1101 False\n",  "HLA-A0101 False\n",  "HLA-A0206 False\n",  "HLA-A6802 False\n",  "HLA-A3001 True\n",  "HLA-A0203 False\n",  "HLA-B3901 False\n",  "HLA-B1501 True\n",  "HLA-B1517 True\n",  "HLA-A2402 True\n",  "H-2-DB False\n",  "H-2-KB True\n",  "HLA-B3501 False\n",  "HLA-A6801 False\n",  "HLA-B0802 False\n",  "HLA-B1801 False\n",  "HLA-B5301 True\n",  "HLA-A3301 True\n",  "HLA-A6901 False\n",  "HLA-B1509 False\n",  "HLA-A3201 True\n",  "HLA-B5801 True\n",  "HLA-B2703 False\n",  "HLA-A3002 False\n",  "HLA-A2501 False\n",  "HLA-A2602 False\n",  "HLA-B4402 False\n",  "HLA-B4001 False\n",  "HLA-A2301 False\n",  "Mamu-A02 False\n",  "HLA-A8001 False\n",  "HLA-B4403 False\n",  "HLA-B4601 False\n",  "HLA-B3801 True\n",  "HLA-B2705 False\n",  "HLA-A2603 False\n",  "Mamu-A01 True\n",  "HLA-B0803 False\n",  "H-2-KD False\n",  "HLA-B1503 False\n",  "HLA-A0202 True\n",  "HLA-A2902 True\n",  "HLA-B5401 False\n",  "HLA-B4002 False\n",  "HLA-B4501 False\n", "train_size 2260.018868\n",  "test_size 522.264151\n",  "netmhcpan_auc 0.912458\n",  "mhcflurry ensemble all_auc 0.909130\n",  "mhcflurry ensemble all not impute_auc 0.909011\n",  "netmhc_auc 0.908938\n",  "mhcflurry ensemble all impute_auc 0.908873\n",  "mhcflurry 30_auc 0.907312\n",  "mhcflurry ensemble big dropout impute_auc 0.907048\n",  "mhcflurry 70_auc 0.907012\n",  "mhcflurry 66_auc 0.906921\n",  "mhcflurry ensemble big dropout_auc 0.906889\n",  "mhcflurry ensemble small_auc 0.906681\n",  "mhcflurry 54_auc 0.906629\n",  "mhcflurry 2_auc 0.906404\n",  "mhcflurry 38_auc 0.906311\n",  "mhcflurry ensemble small impute_auc 0.906181\n",  "mhcflurry 10_auc 0.906137\n",  "mhcflurry 78_auc 0.906135\n",  "mhcflurry 34_auc 0.905958\n",  "mhcflurry 26_auc 0.905866\n",  "mhcflurry 58_auc 0.905686\n",  "mhcflurry 18_auc 0.905627\n",  "mhcflurry 6_auc 0.905623\n",  "mhcflurry 22_auc 0.905588\n",  "mhcflurry 42_auc 0.905560\n",  "mhcflurry 74_auc 0.905297\n",  "mhcflurry 50_auc 0.905148\n",  "mhcflurry 62_auc 0.905079\n",  "mhcflurry 25_auc 0.904906\n",  "mhcflurry 46_auc 0.904821\n",  "mhcflurry 14_auc 0.904440\n",  "mhcflurry 77_auc 0.902743\n",  "mhcflurry ensemble big_auc 0.902367\n",  "mhcflurry ensemble big impute_auc 0.902197\n",  "mhcflurry 41_auc 0.901946\n",  "mhcflurry 5_auc 0.901540\n",  "mhcflurry 29_auc 0.899660\n",  "mhcflurry 45_auc 0.899600\n",  "mhcflurry 17_auc 0.899119\n",  "mhcflurry 37_auc 0.899034\n",  "mhcflurry 13_auc 0.898266\n",  "mhcflurry 1_auc 0.897339\n",  "mhcflurry ensemble small dropout impute_auc 0.896163\n",  "mhcflurry 73_auc 0.895816\n",  "mhcflurry 49_auc 0.895503\n",  "mhcflurry 16_auc 0.895494\n",  "mhcflurry 32_auc 0.895243\n",  "mhcflurry 8_auc 0.895123\n",  "mhcflurry 21_auc 0.894653\n",  "mhcflurry 36_auc 0.894647\n",  "mhcflurry 76_auc 0.894393\n",  "mhcflurry 56_auc 0.894181\n",  "mhcflurry 61_auc 0.894119\n",  "mhcflurry 44_auc 0.893980\n",  "mhcflurry 0_auc 0.893908\n",  "mhcflurry 12_auc 0.893892\n",  "smmpmbec_cpp_auc 0.893880\n",  "mhcflurry 9_auc 0.893478\n",  "mhcflurry 64_auc 0.893475\n",  "mhcflurry 65_auc 0.893418\n",  "mhcflurry 68_auc 0.893104\n",  "mhcflurry 52_auc 0.893094\n",  "mhcflurry 24_auc 0.893061\n",  "mhcflurry 60_auc 0.892783\n",  "mhcflurry 40_auc 0.892561\n",  "mhcflurry ensemble small dropout_auc 0.892485\n",  "mhcflurry 20_auc 0.892156\n",  "mhcflurry 4_auc 0.891876\n",  "mhcflurry 28_auc 0.891793\n",  "mhcflurry 48_auc 0.891725\n",  "mhcflurry 15_auc 0.891451\n",  "mhcflurry 72_auc 0.891408\n",  "mhcflurry 39_auc 0.891289\n",  "mhcflurry 7_auc 0.890570\n",  "mhcflurry 63_auc 0.890491\n",  "mhcflurry 47_auc 0.889670\n",  "mhcflurry 3_auc 0.888822\n",  "mhcflurry 31_auc 0.888556\n",  "mhcflurry 57_auc 0.888473\n",  "mhcflurry 79_auc 0.888440\n",  "mhcflurry 75_auc 0.888388\n",  "mhcflurry 67_auc 0.888380\n",  "mhcflurry 27_auc 0.887903\n",  "mhcflurry 35_auc 0.887734\n",  "mhcflurry 23_auc 0.887377\n",  "mhcflurry 69_auc 0.887077\n",  "mhcflurry 53_auc 0.886851\n",  "mhcflurry 71_auc 0.885406\n",  "mhcflurry 33_auc 0.883974\n",  "mhcflurry 55_auc 0.883669\n",  "mhcflurry 11_auc 0.881087\n",  "mhcflurry 19_auc 0.880154\n",  "mhcflurry 51_auc 0.880091\n",  "mhcflurry 59_auc 0.878340\n",  "mhcflurry 43_auc 0.878250\n",  "netmhcpan_f1 0.662084\n",  "netmhc_f1 0.650962\n",  "mhcflurry ensemble big impute_f1 0.650627\n",  "mhcflurry 61_f1 0.649776\n",  "mhcflurry ensemble big_f1 0.648826\n",  "mhcflurry ensemble small impute_f1 0.645341\n",  "mhcflurry ensemble small_f1 0.641861\n",  "mhcflurry 5_f1 0.640630\n",  "mhcflurry 29_f1 0.640238\n",  "mhcflurry 36_f1 0.640147\n",  "mhcflurry 13_f1 0.640017\n",  "mhcflurry 25_f1 0.639972\n",  "mhcflurry 1_f1 0.639926\n",  "mhcflurry 21_f1 0.638943\n",  "mhcflurry 77_f1 0.638652\n",  "mhcflurry 16_f1 0.638280\n",  "mhcflurry 68_f1 0.638279\n",  "mhcflurry 20_f1 0.638029\n",  "mhcflurry 57_f1 0.637895\n",  "mhcflurry 53_f1 0.637867\n",  "mhcflurry 8_f1 0.637515\n",  "mhcflurry 60_f1 0.637259\n",  "mhcflurry 69_f1 0.637074\n",  "mhcflurry 49_f1 0.636633\n",  "mhcflurry 24_f1 0.635981\n",  "mhcflurry 37_f1 0.635962\n",  "mhcflurry 0_f1 0.635924\n",  "mhcflurry 65_f1 0.635705\n",  "mhcflurry 41_f1 0.635691\n",  "mhcflurry 56_f1 0.635608\n",  "mhcflurry 72_f1 0.635511\n",  "mhcflurry 33_f1 0.635327\n",  "mhcflurry 73_f1 0.635212\n",  "mhcflurry 32_f1 0.635185\n",  "mhcflurry 52_f1 0.634533\n",  "mhcflurry 48_f1 0.633679\n",  "mhcflurry 12_f1 0.632075\n",  "mhcflurry 64_f1 0.631731\n",  "mhcflurry 76_f1 0.631641\n",  "mhcflurry 17_f1 0.631577\n",  "mhcflurry 45_f1 0.631487\n",  "mhcflurry 44_f1 0.631066\n",  "mhcflurry 28_f1 0.630987\n",  "mhcflurry 9_f1 0.630817\n",  "smmpmbec_cpp_f1 0.628236\n",  "mhcflurry 10_f1 0.627782\n",  "mhcflurry 40_f1 0.627735\n",  "mhcflurry ensemble all impute_f1 0.626016\n",  "mhcflurry 62_f1 0.625931\n",  "mhcflurry 4_f1 0.625611\n",  "mhcflurry 30_f1 0.624346\n",  "mhcflurry ensemble all_f1 0.624233\n",  "mhcflurry 18_f1 0.623224\n",  "mhcflurry 6_f1 0.623019\n",  "mhcflurry ensemble all not impute_f1 0.622963\n",  "mhcflurry 58_f1 0.622848\n",  "mhcflurry 54_f1 0.622828\n",  "mhcflurry 46_f1 0.622591\n",  "mhcflurry 34_f1 0.622002\n",  "mhcflurry 22_f1 0.621738\n",  "mhcflurry 2_f1 0.621316\n",  "mhcflurry 74_f1 0.621271\n",  "mhcflurry 38_f1 0.621083\n",  "mhcflurry 26_f1 0.620734\n",  "mhcflurry ensemble big dropout_f1 0.620583\n",  "mhcflurry ensemble big dropout impute_f1 0.620180\n",  "mhcflurry 66_f1 0.619851\n",  "mhcflurry 42_f1 0.619503\n",  "mhcflurry 14_f1 0.619201\n",  "mhcflurry 70_f1 0.618687\n",  "mhcflurry 50_f1 0.617363\n",  "mhcflurry 78_f1 0.617056\n",  "mhcflurry 7_f1 0.525433\n",  "mhcflurry 23_f1 0.525374\n",  "mhcflurry 39_f1 0.524493\n",  "mhcflurry 63_f1 0.524315\n",  "mhcflurry 19_f1 0.524181\n",  "mhcflurry ensemble small dropout impute_f1 0.522931\n",  "mhcflurry 51_f1 0.522874\n",  "mhcflurry 55_f1 0.522750\n",  "mhcflurry 75_f1 0.521307\n",  "mhcflurry 15_f1 0.520364\n",  "mhcflurry 31_f1 0.519823\n",  "mhcflurry 59_f1 0.519612\n",  "mhcflurry 67_f1 0.519250\n",  "mhcflurry 11_f1 0.519094\n",  "mhcflurry 27_f1 0.518514\n",  "mhcflurry 47_f1 0.516401\n",  "mhcflurry 79_f1 0.515675\n",  "mhcflurry ensemble small dropout_f1 0.513726\n",  "mhcflurry 71_f1 0.512236\n",  "mhcflurry 43_f1 0.510992\n",  "mhcflurry 3_f1 0.506150\n",  "mhcflurry 35_f1 0.503589\n",  "netmhcpan_tau 0.485921\n",  "mhcflurry ensemble all_tau 0.480551\n",  "mhcflurry ensemble all not impute_tau 0.480452\n",  "mhcflurry ensemble all impute_tau 0.480037\n",  "mhcflurry ensemble small impute_tau 0.477575\n",  "netmhc_tau 0.477470\n",  "mhcflurry ensemble small_tau 0.476804\n",  "mhcflurry ensemble big dropout_tau 0.475985\n",  "mhcflurry 26_tau 0.475933\n",  "mhcflurry 58_tau 0.475465\n",  "mhcflurry ensemble big dropout impute_tau 0.475272\n",  "mhcflurry 66_tau 0.475179\n",  "mhcflurry 78_tau 0.474984\n",  "mhcflurry 2_tau 0.474861\n",  "mhcflurry 34_tau 0.474824\n",  "mhcflurry 38_tau 0.474780\n",  "mhcflurry 54_tau 0.474661\n",  "mhcflurry 10_tau 0.474657\n",  "mhcflurry 6_tau 0.474265\n",  "mhcflurry 30_tau 0.474084\n",  "mhcflurry 70_tau 0.473804\n",  "mhcflurry 50_tau 0.473438\n",  "mhcflurry 74_tau 0.473263\n",  "mhcflurry 18_tau 0.472967\n",  "mhcflurry 46_tau 0.472698\n",  "mhcflurry 14_tau 0.472662\n",  "mhcflurry 62_tau 0.472401\n",  "mhcflurry 42_tau 0.472315\n",  "mhcflurry 22_tau 0.471743\n",  "mhcflurry 25_tau 0.470077\n",  "mhcflurry ensemble big_tau 0.468404\n",  "mhcflurry 77_tau 0.468075\n",  "mhcflurry 13_tau 0.467926\n",  "mhcflurry 41_tau 0.467713\n",  "mhcflurry ensemble big impute_tau 0.467127\n",  "mhcflurry 29_tau 0.466706\n",  "mhcflurry 5_tau 0.466270\n",  "mhcflurry 17_tau 0.465766\n",  "smmpmbec_cpp_tau 0.465725\n",  "mhcflurry 37_tau 0.465531\n",  "mhcflurry 73_tau 0.464715\n",  "mhcflurry 1_tau 0.464419\n",  "mhcflurry 45_tau 0.464387\n",  "mhcflurry 65_tau 0.461571\n",  "mhcflurry ensemble small dropout impute_tau 0.460464\n",  "mhcflurry 9_tau 0.459511\n",  "mhcflurry 61_tau 0.459250\n",  "mhcflurry 49_tau 0.458214\n",  "mhcflurry 21_tau 0.457664\n",  "mhcflurry ensemble small dropout_tau 0.456603\n",  "mhcflurry 16_tau 0.455918\n",  "mhcflurry 23_tau 0.455767\n",  "mhcflurry 53_tau 0.455758\n",  "mhcflurry 63_tau 0.455662\n",  "mhcflurry 15_tau 0.455462\n",  "mhcflurry 8_tau 0.454451\n",  "mhcflurry 7_tau 0.453814\n",  "mhcflurry 35_tau 0.453779\n",  "mhcflurry 36_tau 0.453317\n",  "mhcflurry 12_tau 0.453254\n",  "mhcflurry 56_tau 0.453153\n",  "mhcflurry 69_tau 0.453074\n",  "mhcflurry 32_tau 0.453065\n",  "mhcflurry 60_tau 0.453017\n",  "mhcflurry 79_tau 0.452948\n",  "mhcflurry 3_tau 0.452717\n",  "mhcflurry 44_tau 0.452501\n",  "mhcflurry 27_tau 0.452400\n",  "mhcflurry 47_tau 0.452127\n",  "mhcflurry 33_tau 0.452118\n",  "mhcflurry 75_tau 0.452008\n",  "mhcflurry 67_tau 0.451808\n",  "mhcflurry 39_tau 0.451672\n",  "mhcflurry 76_tau 0.451649\n",  "mhcflurry 24_tau 0.451374\n",  "mhcflurry 0_tau 0.451261\n",  "mhcflurry 48_tau 0.451155\n",  "mhcflurry 68_tau 0.450968\n",  "mhcflurry 52_tau 0.450822\n",  "mhcflurry 71_tau 0.450727\n",  "mhcflurry 64_tau 0.450555\n",  "mhcflurry 40_tau 0.450392\n",  "mhcflurry 4_tau 0.449676\n",  "mhcflurry 31_tau 0.449608\n",  "mhcflurry 72_tau 0.449593\n",  "mhcflurry 57_tau 0.449541\n",  "mhcflurry 55_tau 0.448602\n",  "mhcflurry 28_tau 0.447709\n",  "mhcflurry 51_tau 0.446742\n",  "mhcflurry 20_tau 0.446538\n",  "mhcflurry 19_tau 0.444272\n",  "mhcflurry 59_tau 0.444195\n",  "mhcflurry 11_tau 0.443939\n",  "mhcflurry 43_tau 0.442209\n",  "dtype: bool" float64\n"  ]},  "execution_count": 35,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "(df[\"mhcflurry standard_auc\"] > df[\"netmhc_auc\"])" "print_full(scores_df.ix[scores_df.index != \"overall\"].mean(0).sort(inplace=False, ascending=False))"  ]  },  {  "cell_type": "code",  "execution_count": null,  "metadata": {  "collapsed": true  },  "outputs": [],  "source": []  },  {  "cell_type": "code",  "execution_count": 38, 22,  "metadata": {  "collapsed": false  },  "outputs": [  {  "ename": "SyntaxError",  "evalue": "invalid syntax (, line 2)",  "output_type": "error",  "traceback": "data": {  "text/plain":  [ "\u001b[0;36m File \u001b[0;32m\"\"\u001b[0;36m, line \u001b[0;32m2\u001b[0m\n\u001b[0;31m x=\"\"\u001b[0m\n\u001b[0m ^\u001b[0m\n\u001b[0;31mSyntaxError\u001b[0m\u001b[0;31m:\u001b[0m invalid syntax\n" "allele\n",  "overall 0.995303\n",  "H-2-DB 1.011136\n",  "H-2-KB 1.023012\n",  "H-2-KD 0.958486\n",  "HLA-A0101 1.012477\n",  "HLA-A0201 0.997279\n",  "HLA-A0202 1.009183\n",  "HLA-A0203 1.000951\n",  "HLA-A0206 0.995024\n",  "HLA-A0301 0.986422\n",  "HLA-A1101 0.988892\n",  "HLA-A2301 0.988901\n",  "HLA-A2402 0.995979\n",  "HLA-A2501 1.000491\n",  "HLA-A2601 1.005599\n",  "HLA-A2602 0.993474\n",  "HLA-A2603 0.990339\n",  "HLA-A2902 1.028103\n",  "HLA-A3001 1.021084\n",  "HLA-A3002 0.989223\n",  "HLA-A3101 0.995926\n",  "HLA-A3201 1.016410\n",  "HLA-A3301 1.015176\n",  "HLA-A6801 0.996876\n",  "HLA-A6802 1.000162\n",  "HLA-A6901 1.005053\n",  "HLA-A8001 0.989457\n",  "HLA-B0702 1.001494\n",  "HLA-B0801 1.002733\n",  "HLA-B0802 0.984341\n",  "HLA-B0803 0.961754\n",  "HLA-B1501 1.003644\n",  "HLA-B1503 0.966286\n",  "HLA-B1509 0.968437\n",  "HLA-B1517 1.019622\n",  "HLA-B1801 1.012538\n",  "HLA-B2703 NaN\n",  "HLA-B2705 0.998979\n",  "HLA-B3501 1.004012\n",  "HLA-B3801 0.962732\n",  "HLA-B3901 0.985603\n",  "HLA-B4001 0.979640\n",  "HLA-B4002 0.998922\n",  "HLA-B4402 0.981135\n",  "HLA-B4403 0.952167\n",  "HLA-B4501 1.000000\n",  "HLA-B4601 NaN\n",  "HLA-B5101 1.023293\n",  "HLA-B5301 1.025424\n",  "HLA-B5401 0.986755\n",  "HLA-B5701 1.016456\n",  "HLA-B5801 1.014038\n",  "Mamu-A01 0.994416\n",  "Mamu-A02 0.988303\n",  "dtype: float64"  ] },  "execution_count": 22,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "seaborn.pointplot(data=df[[x for x in df.columns if 'auc' in x or x == \"train_size\"]].stack().reset_index(),\n",  " x=\"\"" "scores_df.ix[:, \"mhcflurry ensemble small impute_auc\"] / scores_df.ix[:, \"netmhc_auc\"]"  ]  },  {  "cell_type": "code",  "execution_count": 30, 23,  "metadata": {  "collapsed": false  }, 

{  "data": {  "text/plain": [  "mhcflurry 0_auc 0.888551\n",  "mhcflurry 1_auc 0.901088\n",  "mhcflurry 2_auc 0.903755\n",  "mhcflurry 3_auc 0.881133\n",  "mhcflurry 4_auc 0.890536\n",  "mhcflurry 5_auc 0.900119\n",  "mhcflurry 6_auc 0.903171\n",  "mhcflurry 7_auc 0.898431\n",  "netmhc_auc 0.909872\n",  "netmhcpan_auc 0.913077\n",  "smmpmbec_cpp_auc 0.895268\n",  "mhcflurry standard_auc 0.900856\n",  "dtype: float64" "\n",  "Dimensions: 94 (items) x 54 (major_axis) x 3 (minor_axis)\n",  "Items axis: mhcflurry 0 to smmpmbec_cpp\n",  "Major_axis axis: overall to Mamu-A02\n",  "Minor_axis axis: auc to tau"  ]  },  "execution_count": 30, 23,  "metadata": {},  "output_type": "execute_result"  }  ],  "source": [  "df.mean()[[x "def sub_df(name):\n",  " result = scores_df[[c  for x c  in df.columns list(scores_df.columns)  if 'auc' (name + \"_\")  in x]]" c]].copy()\n",  " result.columns = [c.split(\"_\")[-1] for c in list(result.columns)]\n",  " return result\n",  "\n",  "d = dict((name, sub_df(name)) for name in predictors)\n",  "panel = pandas.Panel(d)\n",  " \n",  "panel"  ]  },  {  "cell_type": "code",  "execution_count": 21, 24,  "metadata": {  "collapsed": false  },  "outputs": [  {  "data": {  "text/plain": "name": "stdout",  "output_type": "stream",  "text":  [ "netmhc\n",  " auc f1 tau\n",  "allele \n",  "overall 0.929947 0.800909 0.582258\n",  "H-2-DB 0.896152 0.621212 0.600337\n",  "H-2-KB 0.891675 0.813675 0.573199\n",  "H-2-KD 0.815331 0.657718 0.403275\n",  "HLA-A0101 0.915334 0.619565 0.524866\n",  "HLA-A0201 0.932234 0.884336 0.635498\n",  "HLA-A0202 0.890382 0.755556 0.627143\n",  "HLA-A0203 0.975879 0.948626 0.586911\n",  "HLA-A0206 0.913636 0.872902 0.543184\n",  "HLA-A0301 0.935154 0.900621 0.629236\n",  "HLA-A1101 0.949252 0.883402 0.632199\n",  "HLA-A2301 0.881451 0.773842 0.605598\n",  "HLA-A2402 0.864200 0.632911 0.575710\n",  "HLA-A2501 0.991727 0.666667 0.151836\n",  "HLA-A2601 0.930840 0.541176 0.436646\n",  "HLA-A2602 0.931577 0.766839 0.525365\n",  "HLA-A2603 0.890172 0.542373 0.366317\n",  "HLA-A2902 0.868946 0.644068 0.619830\n",  "HLA-A3001 0.866899 0.731959 0.456482\n",  "HLA-A3002 0.749659 0.663438 0.342161\n",  "HLA-A3101 0.862606 0.833958 0.525026\n",  "HLA-A3201 0.893070 0.772881 0.448284\n",  "HLA-A3301 0.914593 0.868327 0.587112\n",  "HLA-A6801 0.948038 0.924791 0.571403\n",  "HLA-A6802 0.971961 0.922636 0.652332\n",  "HLA-A6901 0.960066 0.698413 0.335339\n",  "HLA-A8001 0.983487 0.434783 0.182374\n",  "HLA-B0702 0.916126 0.869383 0.606014\n",  "HLA-B0801 0.946187 0.776053 0.629519\n",  "HLA-B0802 0.989930 0.190476 0.393833\n",  "HLA-B0803 0.968395 0.000000 0.318249\n",  "HLA-B1501 0.934416 0.846512 0.591735\n",  "HLA-B1503 0.864784 0.592593 0.468922\n",  "HLA-B1509 0.901247 0.187500 0.354311\n",  "HLA-B1517 0.902687 0.637931 0.422497\n",  "HLA-B1801 0.794549 0.358974 0.237118\n",  "HLA-B2703 NaN 0.000000 0.053658\n",  "HLA-B2705 0.948457 0.285714 0.430561\n",  "HLA-B3501 0.828690 0.712000 0.515205\n",  "HLA-B3801 0.925684 0.000000 0.513269\n",  "HLA-B3901 0.965195 0.750000 0.305138\n",  "HLA-B4001 0.928725 0.829787 0.635308\n",  "HLA-B4002 0.920635 0.758621 0.456242\n",  "HLA-B4402 0.912335 0.568807 0.574916\n",  "HLA-B4403 0.869501 0.766304 0.541066\n",  "HLA-B4501 1.000000 1.000000 0.263574\n",  "HLA-B4601 NaN 0.000000 NaN\n",  "HLA-B5101 0.919175 0.428571 0.365307\n",  "HLA-B5301 0.841415 0.733813 0.515585\n",  "HLA-B5401 0.816216 0.800000 0.300252\n",  "HLA-B5701 0.899092 0.741840 0.484975\n",  "HLA-B5801 0.891654 0.827411 0.545132\n",  "Mamu-A01 0.916721 0.694915 0.569423\n",  "Mamu-A02 0.929688 0.767123 0.598964\n",  "\n",  "netmhcpan\n",  " auc f1 tau\n",  "allele \n",  "overall 0.932924 0.793170 0.579586\n",  "H-2-DB 0.874574 0.577236 0.574262\n",  "H-2-KB 0.825565 0.665354 0.486836\n",  "H-2-KD 0.819189 0.645570 0.390333\n",  "HLA-A0101 0.894895 0.594286 0.498767\n",  "HLA-A0201 0.930479 0.880963 0.637338\n",  "HLA-A0202 0.898697 0.769231 0.624280\n",  "HLA-A0203 0.974158 0.944578 0.591463\n",  "HLA-A0206 0.910796 0.866258 0.535067\n",  "HLA-A0301 0.927287 0.885106 0.611240\n",  "HLA-A1101 0.945065 0.887671 0.625794\n",  "HLA-A2301 0.895229 0.788406 0.636944\n",  "HLA-A2402 0.892876 0.693069 0.600686\n",  "HLA-A2501 0.998540 0.888889 0.153968\n",  "HLA-A2601 0.942279 0.640000 0.451666\n",  "HLA-A2602 0.957811 0.839378 0.561093\n",  "HLA-A2603 0.934300 0.581818 0.426438\n",  "HLA-A2902 0.882377 0.633333 0.641257\n",  "HLA-A3001 0.871974 0.746114 0.459857\n",  "HLA-A3002 0.732749 0.611260 0.320577\n",  "HLA-A3101 0.859261 0.822335 0.528941\n",  "HLA-A3201 0.907161 0.766423 0.480669\n",  "HLA-A3301 0.931156 0.829175 0.612147\n",  "HLA-A6801 0.948907 0.923944 0.599562\n",  "HLA-A6802 0.964197 0.900293 0.653216\n",  "HLA-A6901 0.944257 0.680851 0.327432\n",  "HLA-A8001 0.980799 0.434783 0.186524\n",  "HLA-B0702 0.913527 0.855011 0.604720\n",  "HLA-B0801 0.942822 0.701671 0.606762\n",  "HLA-B0802 0.989590 0.571429 0.410579\n",  "HLA-B0803 0.952346 0.000000 0.315978\n",  "HLA-B1501 0.935596 0.823245 0.589097\n",  "HLA-B1503 0.870064 0.588235 0.522577\n",  "HLA-B1509 0.922907 0.176471 0.448099\n",  "HLA-B1517 0.934516 0.710280 0.448575\n",  "HLA-B1801 0.789549 0.380952 0.234201\n",  "HLA-B2703 NaN 0.000000 0.067451\n",  "HLA-B2705 0.943860 0.400000 0.377208\n",  "HLA-B3501 0.836281 0.711027 0.514413\n",  "HLA-B3801 0.980074 0.000000 0.652173\n",  "HLA-B3901 0.980065 0.744186 0.316739\n",  "HLA-B4001 0.920678 0.845570 0.619418\n",  "HLA-B4002 0.918651 0.909091 0.518720\n",  "HLA-B4402 0.934554 0.607143 0.598960\n",  "HLA-B4403 0.891047 0.775956 0.587824\n",  "HLA-B4501 0.993333 0.800000 0.246426\n",  "HLA-B4601 NaN 0.000000 NaN\n",  "HLA-B5101 0.948695 0.610169 0.406973\n",  "HLA-B5301 0.885722 0.753623 0.559543\n",  "HLA-B5401 0.845946 0.727273 0.349826\n",  "HLA-B5701 0.883077 0.642623 0.460133\n",  "HLA-B5801 0.882016 0.805195 0.531508\n",  "Mamu-A01 0.912755 0.706897 0.539013\n",  "Mamu-A02 0.883087 0.748092 0.524622\n",  "\n",  "mhcflurry 0_auc 0.888551\n",  "mhcflurry 0_f1 0.636355\n",  "mhcflurry 0_tau 0.449200\n",  "mhcflurry 1_auc 0.901088\n",  "mhcflurry 1_f1 0.644236\n",  "mhcflurry 1_tau 0.471471\n",  "mhcflurry 2_auc 0.903755\n",  "mhcflurry 2_f1 0.630669\n",  "mhcflurry 2_tau 0.472481\n",  "mhcflurry 3_auc 0.881133\n",  "mhcflurry 3_f1 0.533349\n",  "mhcflurry 3_tau 0.449642\n",  "mhcflurry 4_auc 0.890536\n",  "mhcflurry 4_f1 0.649554\n",  "mhcflurry 4_tau 0.447560\n",  "mhcflurry 5_auc 0.900119\n",  "mhcflurry 5_f1 0.636095\n",  "mhcflurry 5_tau 0.468839\n",  "mhcflurry 6_auc 0.903171\n",  "mhcflurry 6_f1 0.635060\n",  "mhcflurry 6_tau 0.474900\n",  "mhcflurry 7_auc 0.898431\n",  "mhcflurry 7_f1 0.543681\n",  "mhcflurry 7_tau 0.462858\n",  "netmhc_auc 0.909872\n",  "netmhc_f1 0.659745\n",  "netmhc_tau 0.483207\n",  "netmhcpan_auc 0.913077\n",  "netmhcpan_f1 0.670119\n",  "netmhcpan_tau 0.491046\n",  "smmpmbec_cpp_auc 0.895268\n",  "smmpmbec_cpp_f1 0.637798\n",  "smmpmbec_cpp_tau 0.471492\n",  "test_size 556.672727\n",  "train_size 2463.400000\n",  "dtype: float64" big\n"  ] }, "execution_count": 21,  "metadata": {}, {  "ename": "AttributeError",  "evalue": "'module' object has no attribute 'panel_mhcflurry'",  "output_type": "execute_result" "error",  "traceback": [  "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",  "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)",  "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 6\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mmodel_name\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mmodel_groups\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7\u001b[0m \u001b[0;32mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"mhcflurry \"\u001b[0m \u001b[0;34m+\u001b[0m \u001b[0mmodel_name\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 8\u001b[0;31m \u001b[0;32mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mscipy\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstats\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmstats\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpanel_mhcflurry\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mmodel_groups\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mmodel_name\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmean\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 9\u001b[0m \u001b[0;32mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",  "\u001b[0;31mAttributeError\u001b[0m: 'module' object has no attribute 'panel_mhcflurry'"  ]  }  ],  "source": [  "df.mean(axis=0)" "for model in [\"netmhc\", \"netmhcpan\"]:\n",  " print(model)\n",  " print(panel[model])\n",  " print(\"\")\n",  "\n",  "for model_name in model_groups.index:\n",  " print(\"mhcflurry \" + model_name)\n",  " print(scipy.stats.mstats.panel_mhcflurry[model_groups[model_name]].mean(0))\n",  " print(\"\")"  ]  },  {  "cell_type": "code",  "execution_count": null,  "metadata": {  "collapsed": false  },  "outputs": [],  "source": [  "threshold = 1000\n",  "big_model = 6\n",  "small_model = 5\n",  "extra_cols = collections.defaultdict(list)\n",  "for (allele, row) in df.iterrows():\n",  " for metric in [\"auc\", \"f1\", \"tau\"]:\n",  " model = big_model if row.train_size >= threshold else small_model\n",  " extra_cols[\"mhcflurry standard_%s\" % metric].append(row[\"mhcflurry %s_%s\" % (model, metric)])\n",  " \n",  "for (col, values) in extra_cols.items():\n",  " df[col] = values\n",  "\n",  "df"  ]  }  ],