diff --git a/data/structdatabases.sh b/data/structdatabases.sh index eae763a0..aec50d98 100644 --- a/data/structdatabases.sh +++ b/data/structdatabases.sh @@ -86,6 +86,15 @@ case "${SELECTION}" in push_back "${TMP_PATH}/afdb" INPUT_TYPE="FOLDSEEK_DB" ;; + "Alphafold/UniProt50") + if notExists "${TMP_PATH}/afdb50.tar.gz"; then + downloadFile "https://foldseek.steineggerlab.workers.dev/afdb50.tar.gz" "${TMP_PATH}/afdb50.tar.gz" + downloadFile "https://foldseek.steineggerlab.workers.dev/afdb50.version" "${TMP_PATH}/version" + fi + tar xvfz "${TMP_PATH}/afdb50.tar.gz" -C "${TMP_PATH}" + push_back "${TMP_PATH}/afdb50" + INPUT_TYPE="FOLDSEEK_DB" + ;; "Alphafold/Proteome") if notExists "${TMP_PATH}/alphafolddb.tar.gz"; then downloadFile "https://foldseek.steineggerlab.workers.dev/alphafolddb.tar.gz" "${TMP_PATH}/alphafolddb.tar.gz" diff --git a/src/foldseek.cpp b/src/foldseek.cpp index e2bd0f17..c2808dce 100644 --- a/src/foldseek.cpp +++ b/src/foldseek.cpp @@ -227,6 +227,14 @@ std::vector externalDownloads = { true, Parameters::DBTYPE_AMINO_ACIDS, structdatabases_sh, structdatabases_sh_len, {} }, + { + "Alphafold/UniProt50", + "AlphaFold UniProt Protein Structure Database clustered at 50% sequence identity.", + "Jumper et al. Highly accurate protein structure prediction with AlphaFold. Nature, (2021)", + "https://alphafold.ebi.ac.uk/", + true, Parameters::DBTYPE_AMINO_ACIDS, structdatabases_sh, structdatabases_sh_len, + {} + }, { "Alphafold/Proteome", "AlphaFold Proteomes Protein Structure Database.",