ProteInfer is an approach for predicting the functional properties of protein sequences using deep neural networks.
📝 Read about the method in our interactive paper (or in the static version, published in eLife).
Go to https://google-research.github.io/proteinfer/ to use an interactive demo in your browser, and read the related paper.
Or if you're interested in the command line interface instead, see below.
# --- On your local machine: provision a GPU VM on Google Cloud ---
# Install the Google Cloud SDK and log in.
sudo apt install -y google-cloud-sdk
gcloud auth login
# Create the "proteinfer-gpu" instance: one nvidia-tesla-v100 accelerator,
# the ubuntu-2004-lts image family, and a boot disk size of 250.
gcloud compute instances create proteinfer-gpu \
  --zone us-west1-b \
  --machine-type n1-standard-8 \
  --accelerator type=nvidia-tesla-v100,count=1 \
  --image-project ubuntu-os-cloud \
  --image-family ubuntu-2004-lts \
  --boot-disk-size 250 \
  --maintenance-policy TERMINATE
# The machine may need ~30 seconds to finish booting before ssh succeeds.
gcloud compute ssh proteinfer-gpu
# --- On the VM: install NVIDIA drivers, CUDA 10.0 and cuDNN 7 ---
# NOTE(review): the download/repository URLs were absent from this listing,
# which left wget, the apt source line and apt-key without their required
# argument (each of those commands fails as written). The defaults below are
# reconstructed from NVIDIA's public repository layout; the ubuntu1804 paths
# are assumed because the cuda-10-0 package is requested. Confirm them before
# use, or override them by exporting the variables first.
CUDA_KEYRING_URL="${CUDA_KEYRING_URL:-https://developer.download.nvidia.com/compute/cuda/repos/ubuntu1804/x86_64/cuda-keyring_1.0-1_all.deb}"
NVIDIA_ML_REPO_URL="${NVIDIA_ML_REPO_URL:-http://developer.download.nvidia.com/compute/machine-learning/repos/ubuntu1804/x86_64}"
NVIDIA_ML_KEY_URL="${NVIDIA_ML_KEY_URL:-${NVIDIA_ML_REPO_URL}/7fa2af80.pub}"

sudo apt update
sudo add-apt-repository ppa:graphics-drivers -y
# Download and install the cuda-keyring package.
wget -O /tmp/cuda-keyring_1.0-1_all.deb "${CUDA_KEYRING_URL}"
sudo dpkg -i /tmp/cuda-keyring_1.0-1_all.deb
# Add an extra apt source and fetch its signing key. tee is used so the
# variable expands in this shell while the file is still written as root.
echo "deb ${NVIDIA_ML_REPO_URL} /" | sudo tee /etc/apt/sources.list.d/cuda_learn.list >/dev/null
sudo apt-key adv --fetch-keys "${NVIDIA_ML_KEY_URL}"
# Refresh the package index so the new sources are visible, then install.
sudo apt update
sudo apt install -y cuda-10-0 libcudnn7
# --- On the VM: install Python 3.7 and create a dedicated virtualenv ---
sudo apt update
# The deadsnakes PPA is added before requesting the python3.7 packages.
sudo add-apt-repository -y ppa:deadsnakes/ppa
sudo apt install -y python3.7 python3.7-venv python3-venv python3-pip
# Create the environment at ~/python_venv/proteinfer and activate it.
mkdir ~/python_venv
python3.7 -m venv ~/python_venv/proteinfer
source ~/python_venv/proteinfer/bin/activate
# Continue from the home directory.
cd ~
# --- On the VM: fetch ProteInfer, install its dependencies, run the bundled example ---
# NOTE(review): the repository URL was missing from this line (a bare
# `git clone` fails); the URL below is reconstructed -- confirm it.
git clone https://github.com/google-research/proteinfer.git
cd ~/proteinfer
pip3 install -r requirements.txt
# NOTE(review): the script name was missing here, so python3 would have treated
# the FASTA file itself as the program to run (with -i as its own
# "interactive" flag). proteinfer.py is assumed to be the entry point taking
# -i <input fasta> and -o <output tsv> -- confirm against the repository.
python3 proteinfer.py -i testdata/test_hemoglobin.fasta -o ~/hemoglobin_predictions.tsv
# View your predictions.
cat ~/hemoglobin_predictions.tsv
# --- Run inference on your own sequences ---
# Exit the ssh session by typing ctrl D, then copy your FASTA file from your
# local machine to the VM. Replace <YOUR_FASTA_FILE_HERE> (angle brackets
# included) with the real file name in both commands below; left as-is, the
# shell would parse the brackets as redirections.
gcloud compute scp <YOUR_FASTA_FILE_HERE> proteinfer-gpu:~/
# Then ssh back in again
gcloud compute ssh proteinfer-gpu
# A new ssh session starts without the activated virtualenv and outside the
# repository directory, so restore both before running.
source ~/python_venv/proteinfer/bin/activate
cd ~/proteinfer
# Then run your inference
# NOTE(review): the script name was missing from this command; proteinfer.py
# is assumed to be the entry point -- confirm against the repository.
python3 proteinfer.py -i ~/<YOUR_FASTA_FILE_HERE> -o ~/predictions.tsv
# When you are finished, delete the "proteinfer-gpu" instance created earlier.
gcloud compute instances delete proteinfer-gpu
# Run every entry in the current directory with python3, stopping with exit
# status 1 at the first one that fails. "$f" is quoted so names containing
# spaces or glob characters are passed to python3 as a single argument.
bash -c 'for f in *; do python3 "$f" || exit 1; done'