From 928984bfa3c7c3c98ca58b557d965965038f7e0b Mon Sep 17 00:00:00 2001 From: Martin Steinegger Date: Mon, 12 Aug 2024 15:10:56 +0900 Subject: [PATCH] Add BFMD database to repository --- data/structdatabases.sh | 9 +++++++++ src/FoldseekBase.cpp | 8 ++++++++ 2 files changed, 17 insertions(+) diff --git a/data/structdatabases.sh b/data/structdatabases.sh index 9f0b9486..c3a90e9b 100644 --- a/data/structdatabases.sh +++ b/data/structdatabases.sh @@ -159,6 +159,15 @@ case "${SELECTION}" in push_back "${TMP_PATH}/cath50" INPUT_TYPE="FOLDSEEK_DB" ;; + "BFMD") + if notExists "${TMP_PATH}/bfmd.tar.gz"; then + downloadFile "https://foldseek.steineggerlab.workers.dev/bfmd.tar.gz" "${TMP_PATH}/bfmd.tar.gz" + downloadFile "https://foldseek.steineggerlab.workers.dev/bfmd.version" "${TMP_PATH}/version" + fi + tar xvfz "${TMP_PATH}/bfmd.tar.gz" -C "${TMP_PATH}" + push_back "${TMP_PATH}/bfmd" + INPUT_TYPE="FOLDSEEK_DB" + ;; "ProstT5") MODEL=prostt5-f16-safetensors.tar.gz if [ -n "${PROSTT5_QUANTIZED}" ]; then diff --git a/src/FoldseekBase.cpp b/src/FoldseekBase.cpp index 979ade32..22426c4c 100644 --- a/src/FoldseekBase.cpp +++ b/src/FoldseekBase.cpp @@ -432,6 +432,14 @@ std::vector externalDownloads = { true, Parameters::DBTYPE_AMINO_ACIDS, structdatabases_sh, structdatabases_sh_len, {} }, + { + "BFMD", + "BFMD Big fantastic multimer database (combined multimers from large prediction projects).", + "Kim et al. Rapid and Sensitive Protein Complex Alignment with Foldseek-Multimer. bioRxiv (2024)", + "https://foldseek.steineggerlab.workers.dev/bfmd.version", + true, Parameters::DBTYPE_AMINO_ACIDS, structdatabases_sh, structdatabases_sh_len, + {} + }, { "ProstT5", "Protein language model to predict 3Di directly from sequence.",