
Commit d32a08b: first release

1 parent 718fd9b
37 files changed: +13782, -0 lines

README.md

Lines changed: 2 additions & 0 deletions
# proteopt
Common interface to protein design tools and structure predictors

Details coming soon.

api.py

Lines changed: 194 additions & 0 deletions
import argparse
import collections
import traceback
import os
import sys
import logging
import socket
import time

from flask import Flask
from flask_restful import reqparse, abort, Api, Resource, inputs

import proteopt.alphafold
import proteopt.mock_tool
from proteopt.common import serialize, deserialize

app = Flask(__name__)
api = Api(app)


def add_argument(parser, arg_name, info, append=False):
    type = info['type']
    if type is object:
        type = str  # We will serialize objects

    d = {
        'type': type,
    }
    if 'default' in info:
        d["default"] = info["default"]
    else:
        d["required"] = True
    if append:
        d["action"] = "append"
    parser.add_argument(arg_name, **d)


TOOL_CLASSES = [
    proteopt.mock_tool.MockTool,
    proteopt.alphafold.AlphaFold,
]
TOOLS = dict((cls.tool_name, cls) for cls in TOOL_CLASSES)


class Tool(Resource):
    configuration = None  # this should be set when the app is launched

    tool_parsers = {}
    for (tool_name, tool_class) in TOOLS.items():
        tool_parsers[tool_name] = reqparse.RequestParser()
        for parameter, info in tool_class.model_args.items():
            add_argument(tool_parsers[tool_name], parameter, info)
        for parameter, info in tool_class.run_args.items():
            add_argument(
                tool_parsers[tool_name],
                parameter,
                info,
                append=not info['type'] is object)

    MODEL_CACHE = collections.OrderedDict()

    def get_model(self, tool_name, args):
        tool_class = TOOLS[tool_name]
        args_dict = dict(self.configuration[tool_name])
        cache_key = []
        for name, info in tool_class.model_args.items():
            value = getattr(args, name)
            cache_key.append((name, value))
            args_dict[name] = value

        cache_key = tuple(cache_key)

        try:
            return self.MODEL_CACHE[cache_key]
        except KeyError:
            pass

        logging.info("Loading new model: %s %s", tool_name, str(args_dict))

        model = tool_class(**args_dict)
        if len(self.MODEL_CACHE) >= self.configuration["model_cache_size"]:
            self.MODEL_CACHE.popitem(last=False)
        self.MODEL_CACHE[cache_key] = model
        return model

    def get(self, tool_name):
        return str(self.MODEL_CACHE.keys())

    def post(self, tool_name):
        tool_class = TOOLS[tool_name]

        parser = self.tool_parsers[tool_name]
        args = parser.parse_args()
        try:
            total_start = time.time()
            model = self.get_model(tool_name, args)
            init_seconds = time.time() - total_start

            run_arg_names = list(tool_class.run_args)

            for arg in run_arg_names:
                if tool_class.run_args[arg]['type'] is object:
                    setattr(args, arg, deserialize(getattr(args, arg)))

            example_run_arg = run_arg_names[0]
            list_of_input_dicts = []
            for i in range(len(getattr(args, example_run_arg))):
                d = dict((arg, getattr(args, arg)[i]) for arg in run_arg_names)
                list_of_input_dicts.append(d)

            start = time.time()
            results = model.run_multiple(list_of_input_dicts)
            assert not any(x is None for x in results)
            payload = {
                "success": True,
                "results": serialize(results),
                "init_seconds": init_seconds,
                "total_seconds": time.time() - start,
            }
            return payload, 200
        except Exception as e:
            exc_info = sys.exc_info()
            message = ''.join(traceback.format_exception(*exc_info))
            payload = {
                "success": False,
                "exception": (e.__class__.__name__, message),
            }
            return payload, 500


api.add_resource(Tool, '/tool/<tool_name>')

# Run the test server
arg_parser = argparse.ArgumentParser()

arg_parser.add_argument(
    "--debug",
    default=False,
    action="store_true")

arg_parser.add_argument(
    "--cuda-visible-devices")

arg_parser.add_argument("--host", default="127.0.0.1")
arg_parser.add_argument("--write-endpoint-to-file")
arg_parser.add_argument("--port", type=int)
arg_parser.add_argument("--model-cache-size", type=float, default=1.0)


arg_names_to_tool_configs = {}
for tool_name, tool_class in TOOLS.items():
    for parameter, info in tool_class.config_args.items():
        arg_name = "%s_%s" % (tool_name, parameter)
        arg_names_to_tool_configs[arg_name] = (tool_name, parameter)
        add_argument(arg_parser, "--" + arg_name.replace("_", "-"), info)

if __name__ == '__main__':
    args = arg_parser.parse_args(sys.argv[1:])

    tool_configs = collections.defaultdict(dict)  # tool name -> dict
    for (arg, (tool, parameter)) in arg_names_to_tool_configs.items():
        tool_configs[tool][parameter] = getattr(args, arg)

    print("Tool configuration parameters:")
    for name, d in tool_configs.items():
        print(name)
        for (k, v) in d.items():
            print("\t%15s = %15s" % (k, v))
        print()

    Tool.configuration = dict(tool_configs)
    Tool.configuration["model_cache_size"] = args.model_cache_size

    if args.cuda_visible_devices:
        os.environ["CUDA_VISIBLE_DEVICES"] = args.cuda_visible_devices

    port = args.port
    if not port:
        # Identify an available port
        # Based on https://stackoverflow.com/questions/5085656/how-to-select-random-port-number-in-flask
        sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
        sock.bind((args.host, 0))
        port = sock.getsockname()[1]
        sock.close()

    endpoint = "http://%s:%d" % (args.host, port)
    print("Endpoint will be", endpoint)
    if args.write_endpoint_to_file:
        with open(args.write_endpoint_to_file, "w") as fd:
            fd.write(endpoint)
            fd.write("\n")
        print("Wrote", args.write_endpoint_to_file)

    app.run(host=args.host, port=port, debug=args.debug, use_reloader=False)
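
For reference, api.py serves each registered tool at /tool/<tool_name>: GET reports the model cache, POST runs the tool. Below is a minimal client sketch using the requests library; it is not part of this commit, and the tool name and field names are placeholders, since the real ones come from each tool class's tool_name, model_args, and run_args.

# Hypothetical client sketch (not part of this commit). Assumes the api.py
# test server is running and wrote its endpoint to endpoint.txt via
# --write-endpoint-to-file, and that the requests library is installed.
import requests

with open("endpoint.txt") as fd:
    endpoint = fd.read().strip()

# GET returns a string describing the model-cache keys currently held.
print(requests.get(endpoint + "/tool/TOOL_NAME_PLACEHOLDER").text)

# POST runs the tool. Field names must match the tool class's model_args and
# run_args; these are placeholders. Run args of type object would need to be
# passed through proteopt.common.serialize first.
response = requests.post(
    endpoint + "/tool/TOOL_NAME_PLACEHOLDER",
    data={"a_model_arg": "value", "a_run_arg": ["input1", "input2"]})
print(response.status_code, response.json().get("success"))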

application.py

Lines changed: 38 additions & 0 deletions
from flask import Flask

# print a nice greeting.
def say_hello(username = "World"):
    return '<p>Hello %s!</p>\n' % username

# some bits of text for the page.
header_text = '''
    <html>\n<head> <title>EB Flask Test</title> </head>\n<body>'''
instructions = '''
    <p><em>Hint</em>: This is a RESTful web service! Append a username
    to the URL (for example: <code>/Thelonious</code>) to say hello to
    someone specific.</p>\n'''
home_link = '<p><a href="/">Back</a></p>\n'
footer_text = '</body>\n</html>'

# EB looks for an 'application' callable by default.
application = Flask(__name__)

# add a rule for the index page.
application.add_url_rule(
    '/',
    'index',
    lambda: header_text + say_hello() + instructions + footer_text)

# add a rule when the page is accessed with a name appended to the site
# URL.
application.add_url_rule(
    '/<username>',
    'hello',
    lambda username: header_text + say_hello(username) + home_link + footer_text)

# run the app.
if __name__ == "__main__":
    # Setting debug to True enables debug output. This line should be
    # removed before deploying a production app.
    application.debug = True
    application.run()
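
application.py is the stock Elastic Beanstalk Flask sample. A quick way to exercise its two routes without deploying it is Flask's built-in test client; this sketch is not part of this commit.

# Sketch (not part of this commit): hit application.py's routes with Flask's
# test client instead of a running server.
from application import application

client = application.test_client()

# Index page: header_text + say_hello() + instructions + footer_text.
print(client.get("/").data.decode())

# Named greeting route.
print(client.get("/Thelonious").data.decode())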

config.py

Lines changed: 4 additions & 0 deletions
"""
Flask configuration.
"""

docker/base/Dockerfile

Lines changed: 134 additions & 0 deletions
FROM --platform=linux/x86_64 nvidia/cuda:11.3.1-cudnn8-devel-ubuntu20.04 as shrunk

ENV PATH="/root/miniconda3/bin:${PATH}"
ARG PATH="/root/miniconda3/bin:${PATH}"
WORKDIR /root

RUN apt-get update \
    && apt-get install -y wget git vim \
    && rm -rf /var/lib/apt/lists/* \
    && wget -nv \
        https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh \
    && mkdir /root/.conda \
    && bash Miniconda3-latest-Linux-x86_64.sh -b \
    && rm -f Miniconda3-latest-Linux-x86_64.sh \
    && conda --version

# Make links
RUN ln -s /data/static/alphafold-params . \
    && ln -s /data/static/RFDesign . \
    && ln -s /data/static/AlphaFold . \
    && ln -s /data/static/openfold . \
    && ln -s /data/static/OmegaFold . \
    && ln -s /data/static/ProteinMPNN . \
    && ln -s /data/static/design-env/ miniconda3/envs/design-env \
    && mkdir -p /software/mlfold/alphafold-data \
    && ln -s /data/static/alphafold-params /software/mlfold/alphafold-data/params \
    && mkdir -p /data/static/omegafold_ckpt \
    && mkdir -p ~/.cache \
    && ln -s /data/static/omegafold_ckpt ~/.cache/omegafold_ckpt

# ****************************
FROM shrunk as complete
RUN mkdir -p /data/static

RUN cd /data/static \
    && mkdir -p alphafold-params \
    && wget -nv --progress=dot:giga --show-progress https://storage.googleapis.com/alphafold/alphafold_params_2022-12-06.tar -O params.tar \
    && tar --extract --verbose --file=params.tar --directory=alphafold-params --preserve-permissions \
    && rm -f params.tar

# Note that we are using a different version of pytorch than recommended
# in the RFDesign readme (they recommend pytorch=1.10.1)
RUN conda update -n base -c defaults conda \
    && conda config --set ssl_verify no \
    && conda init bash \
    && conda clean -afy

RUN rm miniconda3/envs/design-env \
    && conda create -n design-env \
        python=3.8 \
        pytorch=1.11 \
        dgl-cuda11.3 \
        cudatoolkit=11.3 \
        cuda-toolkit \
        numpy scipy requests packaging pip \
        -c "nvidia/label/cuda-11.3.1" -c pytorch -c dglteam \
    && mv miniconda3/envs/design-env /data/static \
    && ln -s /data/static/design-env/ miniconda3/envs/design-env

RUN conda install -n design-env \
        pyg \
        openmm==7.5.1 \
        -c pyg -c conda-forge

RUN cd /data/static \
    && git clone https://github.com/deepmind/AlphaFold.git \
    && wget -q -P /data/static/AlphaFold/alphafold/common/ \
        https://git.scicore.unibas.ch/schwede/openstructure/-/raw/7102c63615b64735c4941278d92b554ec94415f8/modules/mol/alg/src/stereo_chemical_props.txt

# pytorch-lightning is for openfold
RUN /root/miniconda3/envs/design-env/bin/pip install \
        https://github.com/openmm/pdbfixer/archive/refs/tags/v1.7.tar.gz \
        icecream==2.1.3 \
        lie_learn==0.0.1.post1 \
        opt_einsum==3.3.0 \
        e3nn==0.3.4 \
    && /root/miniconda3/envs/design-env/bin/pip install \
        "jax[cuda]==0.3.25" \
        -f https://storage.googleapis.com/jax-releases/jax_cuda_releases.html \
    && /root/miniconda3/envs/design-env/bin/pip install \
        dm-tree==0.1.6 \
        dm-haiku==0.0.9 \
        absl-py==1.0.0 \
        ml-collections==0.1.0 \
        tensorflow-gpu==2.11.0 \
        biopython==1.81 \
        pytorch-lightning==1.9.3 \
    && conda clean -afy \
    && /root/miniconda3/envs/design-env/bin/pip install -e /data/static/AlphaFold \
    && /root/miniconda3/envs/design-env/bin/pip cache purge

RUN cd /data/static \
    && git clone --branch main https://github.com/timodonnell/RFDesign.git \
    && cd RFDesign \
    && git remote add upstream https://github.com/RosettaCommons/RFDesign.git \
    && wget -nv -P rfdesign/hallucination/weights/rf_Nov05 http://files.ipd.uw.edu/pub/rfdesign/weights/BFF_last.pt \
    && wget -nv -P rfdesign/inpainting/weights/ http://files.ipd.uw.edu/pub/rfdesign/weights/BFF_mix_epoch25.pt \
    && /root/miniconda3/envs/design-env/bin/pip install -e .

RUN cd /data/static \
    && git clone https://github.com/timodonnell/ProteinMPNN.git \
    && cd ProteinMPNN \
    && git remote add upstream https://github.com/dauparas/ProteinMPNN.git \
    && /root/miniconda3/envs/design-env/bin/pip install -e .

# OpenFold
RUN cd /data/static \
    && git clone https://github.com/timodonnell/openfold.git \
    && cd openfold \
    && git remote add upstream https://github.com/aqlaboratory/openfold.git \
    && /root/miniconda3/envs/design-env/bin/pip install -e . \
    && /root/miniconda3/envs/design-env/bin/pip cache purge \
    && mkdir -p /data/static/openfold-params/ \
    && bash scripts/download_openfold_params_huggingface.sh /data/static/openfold-params/

RUN mkdir -p /data/static/example-data \
    && wget -nv -P /data/static/example-data https://files.rcsb.org/download/7SL5.pdb
COPY container-files/test_protein.fa /data/static/example-data/

# We run OmegaFold to force it to download the weights
RUN cd /data/static \
    && git clone https://github.com/timodonnell/OmegaFold \
    && cd OmegaFold \
    && git remote add upstream https://github.com/HeliXonProtein/OmegaFold \
    && /root/miniconda3/envs/design-env/bin/python setup.py install \
    && mkdir -p /tmp/omegafold_out \
    && /root/miniconda3/envs/design-env/bin/omegafold /data/static/example-data/test_protein.fa /tmp/omegafold_out \
    && ls -lh /tmp/omegafold_out \
    && rm -rf /tmp/omegafold_out

# Not sure why this is needed, but it seems to be:
RUN /root/miniconda3/envs/design-env/bin/pip install -e /data/static/AlphaFold

# Switch to the design-env on start:
RUN echo "conda activate design-env" >> ~/.bashrc

docker/base/build.sh

Lines changed: 6 additions & 0 deletions
set -e
set -x

time docker build -t timodonnell/proteopt-base-gpu:latest .
time docker build --target shrunk -t timodonnell/proteopt-base-gpu-shrunk:latest .

docker/base/container-files/test_protein.fa

Lines changed: 2 additions & 0 deletions

>ubiquitin
MQIFVKTLTGKTITLEVEPSDTIENVKAKIQDKEGIPPDQQRLIFAGKQLEDGRTLSDYNIQRESTLHLVLRLRGG

docker/base/push_to_dockerhub.sh

Lines changed: 2 additions & 0 deletions
docker push timodonnell/proteopt-base-gpu:latest
docker push timodonnell/proteopt-base-gpu-shrunk:latest
