Skip to content

Commit

Permalink
Update Workflow_PyPEF.ipynb
Browse files Browse the repository at this point in the history
  • Loading branch information
niklases authored May 8, 2023
1 parent 268aefe commit ce41b19
Showing 1 changed file with 18 additions and 2 deletions.
20 changes: 18 additions & 2 deletions workflow/Workflow_PyPEF.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -362,7 +362,24 @@
"cell_type": "markdown",
"metadata": {},
"source": [
"For hybrid modeling, here we use a very small dataset fraction of the ANEH dataset (37 variants with associated (negative) fitness values). Next, you can run model training and validation on the test sets and save the best models (in this notebook only using a single CPU):"
"For hybrid modeling, we use only a very small fraction of the ANEH dataset here (37 variants with associated (negative) fitness values). Next, you can run model training and validation on the test sets and save the best models (this notebook uses only a single CPU). DCA-based encoding requires the plmc parameter file (207 MB); to download it, uncomment the code in the cell below."
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"#import urllib.request\n",
"#from hashlib import sha256\n",
"#url = 'https://github.com/niklases/PyPEF/raw/main/workflow/test_dataset_aneh/ANEH_72.6.params'\n",
"#urllib.request.urlretrieve(url, 'ANEH_72.6.params') # File size: 207 MB\n",
"#with open('ANEH_72.6.params', 'rb') as f:\n",
"# sha256_hash = sha256(f.read()).hexdigest()\n",
"# if not sha256_hash == 'd84bd2185f5882c3ef01ab99264e30111333b8adb05136b953f407b1b6dfbaf8':\n",
"# raise SystemError(\"Hash of downloaded DCA parameter file not correct, terminating further running.\")\n",
"#print('Successfully downloaded ANEH_72.6.params!')"
]
},
{
Expand Down Expand Up @@ -824,7 +841,6 @@
" sha256_hash = sha256(f.read()).hexdigest()\n",
" if not sha256_hash == 'be4623f35a5ba05d33a29ae6e69dc3c2e994e3c9092cd5880a8d0bbc12f187b1':\n",
" raise SystemError(\"Hash of downloaded CSV file not correct, terminating further running.\")\n",
"# Wild-type encoding,\n",
"url = 'https://github.com/niklases/PyPEF/raw/main/workflow/test_dataset_avgfp/uref100_avgfp_jhmmer_119_plmc_42.6.params'\n",
"urllib.request.urlretrieve(url, 'uref100_avgfp_jhmmer_119_plmc_42.6.params') # File size: 71.2 MB\n",
"with open('uref100_avgfp_jhmmer_119_plmc_42.6.params', 'rb') as f:\n",
Expand Down

0 comments on commit ce41b19

Please sign in to comment.