Merge pull request #51 from togethercomputer/orangetin/add-tests

orangetin · web-flow · commit afeff89a280a · 2023-10-24T10:03:41.000-07:00
Initial tests for files and fine-tuning
diff --git a/.github/workflows/check_code_quality.yml b/.github/workflows/check_code_quality.yml
@@ -39,6 +39,7 @@ jobs:
         source venv/bin/activate
         pip install --upgrade pip
         pip install .[quality]
+        pip install .[tests]
     - name: Check formatting with mypy
       run: |
         source venv/bin/activate
diff --git a/pyproject.toml b/pyproject.toml
@@ -35,6 +35,7 @@ quality = [
     "types-tqdm>=4.65.0.0", 
     "types-tabulate==0.9.0.3"
 ]
+tests = ["pytest==7.4.2"]
 tokenize = ["transformers>=4.33.2"]
 
 [project.urls]
diff --git a/src/together/finetune.py b/src/together/finetune.py
@@ -45,7 +45,7 @@ def create(
         ] = None,  # resulting finetuned model name will include the suffix
         estimate_price: bool = False,
         wandb_api_key: Optional[str] = None,
-        confirm_inputs: bool = True,
+        confirm_inputs: bool = False,
     ) -> Dict[Any, Any]:
         adjusted_inputs = False
 
@@ -283,7 +283,7 @@ def download(
             if output is None:
                 content_type = str(response.headers.get("content-type"))
 
-                output = self.retrieve(fine_tune_id)["model_output_path"].split("/")[-1]
+                output = self.retrieve(fine_tune_id)["model_output_name"].split("/")[-1]
 
                 if step != -1:
                     output += f"-checkpoint-{step}"
@@ -314,7 +314,7 @@ def download(
             logger.critical(f"Response error raised: {e}")
             raise together.ResponseError(e)
 
-        return output  # this should be null
+        return output  # this should be output file name
 
     # def delete_finetune_model(self, model: str) -> Dict[Any, Any]:
     #     model_url = "https://api.together.xyz/api/models"
diff --git a/tests/README.md b/tests/README.md
@@ -0,0 +1,35 @@
+# How to run tests
+>  🚧 Warning: test_finetune.py can take a while. Please have at least one prior successful finetuning run in your account for successful results. 
+
+>  🚧 Please have enough space on disk to download your latest successful fine-tuned model's weights into the `tests` directory of this repo. All downloaded files will be deleted after successful test runs but may not be deleted if tests fail.
+
+>  🚧 Warning: This test will start 2 fine-tune jobs on small datasets from your account. You WILL be charged for the amount of one job on a 7B model. The second job will be cancelled soon after creation so you will likely not be charged for it.
+
+1. Clone the repo locally
+```bash
+git clone https://github.com/togethercomputer/together.git
+```
+2. Change directory
+```bash
+cd together
+```
+3. [Optional] Checkout the commit you'd like to test
+```bash
+git checkout COMMIT_HASH
+```
+4. Install together package and dependencies
+```bash
+pip install . && pip install '.[tests]'
+```
+5. Change directory into `tests`
+```bash
+cd tests
+```
+6. Export API key
+```bash
+export TOGETHER_API_KEY=<API_KEY>
+```
+7. Run pytest
+```bash
+pytest
+```
diff --git a/tests/test_files.py b/tests/test_files.py
@@ -0,0 +1,88 @@
+import os
+from typing import Any, List
+
+import pytest
+import requests
+
+import together
+from together.utils import extract_time
+
+
+def test_upload() -> None:
+    """Download a small public dataset, upload it, and check the response.
+
+    The local copy is removed in a ``finally`` block so that a failed
+    upload or assertion does not leave the file behind.
+    """
+    url = "https://huggingface.co/datasets/laion/OIG/resolve/main/unified_joke_explanations.jsonl"
+    save_path = "unified_joke_explanations.jsonl"
+    download_response = requests.get(url)
+
+    assert download_response.status_code == 200
+
+    try:
+        with open(save_path, "wb") as file:
+            file.write(download_response.content)
+
+        # upload file
+        response = together.Files.upload(save_path)
+
+        assert isinstance(response, dict)
+        assert response["filename"] == os.path.basename(save_path)
+        assert response["object"] == "file"
+    finally:
+        # clean up even when the upload or an assertion fails
+        if os.path.exists(save_path):
+            os.remove(save_path)
+
+
+def test_list() -> None:
+    """Listing files returns a dict whose ``data`` entry is a list."""
+    listing = together.Files.list()
+    assert isinstance(listing, dict)
+    assert isinstance(listing["data"], list)
+
+
+def test_retrieve() -> None:
+    """Retrieve metadata for the file that sorts last under ``extract_time``."""
+    # pick the file id at the end of the listing ordered by extract_time
+    uploaded: List[Any] = together.Files.list()["data"]
+    last_entry = sorted(uploaded, key=extract_time)[-1]
+    file_id = str(last_entry["id"])
+
+    metadata = together.Files.retrieve(file_id)
+    assert isinstance(metadata, dict)
+    assert isinstance(metadata["filename"], str)
+    assert isinstance(metadata["bytes"], int)
+    assert isinstance(metadata["Processed"], bool)
+    assert metadata["Processed"] is True
+
+
+def test_retrieve_content() -> None:
+    """Fetch the content of the file that sorts last under ``extract_time``.
+
+    The content is written to ``retrieved_file.jsonl``; the test checks the
+    file exists and is non-empty, and removes it afterwards even when one
+    of the checks fails.
+    """
+    # extract file id
+    files: List[Any]
+    files = together.Files.list()["data"]
+    files.sort(key=extract_time)
+    file_id = str(files[-1]["id"])
+
+    file_path = "retrieved_file.jsonl"
+
+    try:
+        response = together.Files.retrieve_content(file_id, file_path)
+        print(response)
+        assert os.path.exists(file_path)
+        assert os.path.getsize(file_path) > 0
+    finally:
+        # do not leave the retrieved file behind on failure
+        if os.path.exists(file_path):
+            os.remove(file_path)
+
+
+def test_delete() -> None:
+    """Delete the file that sorts last under ``extract_time`` and check the reply."""
+    # pick the file id at the end of the listing ordered by extract_time
+    uploaded: List[Any] = together.Files.list()["data"]
+    file_id = str(sorted(uploaded, key=extract_time)[-1]["id"])
+
+    # delete file
+    outcome = together.Files.delete(file_id)
+
+    # the reply must echo the id and carry the string flag "true"
+    assert isinstance(outcome, dict)
+    assert outcome["id"] == file_id
+    assert outcome["deleted"] == "true"
+
+
+# Allow running this file directly: check that an API key is set, then
+# hand this file to pytest.
+if __name__ == "__main__":
+    assert (
+        together.api_key
+    ), "No API key found, please run `export TOGETHER_API_KEY=<API_KEY>`"
+    pytest.main([__file__])
diff --git a/tests/test_finetune.py b/tests/test_finetune.py
@@ -0,0 +1,206 @@
+import os
+import time
+from typing import Any, Dict, List
+
+import pytest
+import requests
+
+import together
+from together.utils import parse_timestamp
+
+
+# Settings the tests below pass to together.Finetune.create via create_ft.
+MODEL = "togethercomputer/llama-2-7b"
+N_EPOCHS = 1
+N_CHECKPOINTS = 1
+BATCH_SIZE = 32
+LEARNING_RATE = 0.00001
+SUFFIX = "pytest"
+
+# Upper bound, in seconds, on how long test_cancel polls the job status.
+CANCEL_TIMEOUT = 60
+
+# Status strings test_status accepts from together.Finetune.get_job_status.
+FT_STATUSES = [
+    "pending",
+    "queued",
+    "running",
+    "cancel_requested",
+    "cancelled",
+    "error",
+    "completed",
+]
+
+
+def list_models() -> List[Any]:
+    """Return the ``name`` of every listed model with a truthy ``finetuning_supported``."""
+    return [
+        entry.get("name")
+        for entry in together.Models.list()
+        if entry.get("finetuning_supported")
+    ]
+
+
+# Download, save, and upload dataset
+def upload_file(
+    url: str = "https://huggingface.co/datasets/laion/OIG/resolve/main/unified_joke_explanations.jsonl",
+    save_path: str = "unified_joke_explanations.jsonl",
+) -> str:
+    """Download ``url`` to ``save_path``, upload it, and return the new file id.
+
+    Args:
+        url: Location of the dataset to download.
+        save_path: Local path used as a temporary copy for the upload.
+
+    Returns:
+        The ``id`` field of the upload response, as a string.
+
+    The local copy is removed whether or not the upload succeeds.
+    """
+    download_response = requests.get(url)
+
+    assert download_response.status_code == 200
+
+    try:
+        with open(save_path, "wb") as file:
+            file.write(download_response.content)
+
+        response = together.Files.upload(save_path)
+    finally:
+        # remove the local copy even if the upload raises
+        if os.path.exists(save_path):
+            os.remove(save_path)
+
+    assert isinstance(response, dict)
+    file_id = str(response["id"])
+    return file_id
+
+
+def create_ft(
+    model: str,
+    n_epochs: int,
+    n_checkpoints: int,
+    batch_size: int,
+    learning_rate: float,
+    suffix: str,
+    file_id: str,
+) -> Dict[Any, Any]:
+    """Forward the given settings to ``together.Finetune.create`` and return its response.
+
+    ``file_id`` is passed on as the ``training_file`` argument.
+    """
+    return together.Finetune.create(
+        training_file=file_id,
+        model=model,
+        n_epochs=n_epochs,
+        n_checkpoints=n_checkpoints,
+        batch_size=batch_size,
+        learning_rate=learning_rate,
+        suffix=suffix,
+    )
+
+
+def test_create() -> None:
+    """Start a fine-tune job on a freshly uploaded file and check the echoed settings."""
+    file_id = upload_file()
+    job = create_ft(
+        model=MODEL,
+        n_epochs=N_EPOCHS,
+        n_checkpoints=N_CHECKPOINTS,
+        batch_size=BATCH_SIZE,
+        learning_rate=LEARNING_RATE,
+        suffix=SUFFIX,
+        file_id=file_id,
+    )
+
+    assert isinstance(job, dict)
+    assert job["training_file"] == file_id
+    assert job["model"] == MODEL
+    assert SUFFIX in str(job["model_output_name"])
+
+
+def test_list() -> None:
+    """Listing fine-tune jobs returns a dict whose ``data`` entry is a list."""
+    listing = together.Finetune.list()
+    assert isinstance(listing, dict)
+    assert isinstance(listing["data"], list)
+
+
+def test_retrieve() -> None:
+    """Retrieve the job that sorts last by ``created_at`` and check its id prefixes."""
+    jobs = together.Finetune.list()["data"]
+    last_job = sorted(jobs, key=lambda job: parse_timestamp(job["created_at"]))[-1]
+    details = together.Finetune.retrieve(last_job["id"])
+
+    assert isinstance(details, dict)
+    assert str(details["training_file"]).startswith("file-")
+    assert str(details["id"]).startswith("ft-")
+
+
+def test_list_events() -> None:
+    """List events for the job that sorts last by ``created_at``."""
+    jobs = together.Finetune.list()["data"]
+    last_job = sorted(jobs, key=lambda job: parse_timestamp(job["created_at"]))[-1]
+    events = together.Finetune.list_events(last_job["id"])
+
+    assert isinstance(events, dict)
+    assert isinstance(events["data"], list)
+
+
+def test_status() -> None:
+    """The status of the job that sorts last by ``created_at`` is one of ``FT_STATUSES``."""
+    jobs = together.Finetune.list()["data"]
+    last_job = sorted(jobs, key=lambda job: parse_timestamp(job["created_at"]))[-1]
+    status = together.Finetune.get_job_status(last_job["id"])
+
+    assert isinstance(status, str)
+    assert status in FT_STATUSES
+
+
+def test_download() -> None:
+    """Download a completed fine-tune and check the output file is non-empty.
+
+    Jobs are ordered by ``created_at`` and scanned from the end of that
+    order; the first one whose status is ``"completed"`` is downloaded.
+    The downloaded file is removed afterwards, even if a check fails.
+    """
+    ft_list = together.Finetune.list()["data"]
+    ft_list.sort(key=lambda x: parse_timestamp(x["created_at"]))
+    ft_list.reverse()
+
+    ft_id = None
+    for item in ft_list:
+        # named candidate_id so the builtin `id` is not shadowed
+        candidate_id = item["id"]
+        if together.Finetune.get_job_status(candidate_id) == "completed":
+            ft_id = candidate_id
+            break
+
+    # fail with an explanation rather than a bare `assert False`
+    assert ft_id is not None, "No completed fine-tune job available to download"
+
+    output_file = together.Finetune.download(ft_id)
+
+    try:
+        assert os.path.exists(output_file)
+        assert os.path.getsize(output_file) > 0
+    finally:
+        # do not leave the downloaded file behind when a check fails
+        if os.path.exists(output_file):
+            os.remove(output_file)
+
+
+def test_cancel() -> None:
+    """Create a fine-tune job, cancel it, and wait for the cancellation to register.
+
+    The job status is polled once per second for up to ``CANCEL_TIMEOUT``
+    seconds. The uploaded training file is deleted afterwards, whether or
+    not the cancellation was observed.
+    """
+    cancelled = False
+    file_id = upload_file()
+    # create_ft returns a single response dict; unpacking it into two names
+    # would raise, or overwrite file_id with one of the dict's keys
+    response = create_ft(
+        MODEL, N_EPOCHS, N_CHECKPOINTS, BATCH_SIZE, LEARNING_RATE, SUFFIX, file_id
+    )
+    ft_id = response["id"]
+    together.Finetune.cancel(ft_id)
+
+    try:
+        # loop to check if job was cancelled
+        start = time.time()
+        while time.time() - start < CANCEL_TIMEOUT:
+            status = together.Finetune.get_job_status(ft_id)
+            # the job may already have moved on from "cancel_requested"
+            if status in ("cancel_requested", "cancelled"):
+                cancelled = True
+                break
+            time.sleep(1)
+
+        assert cancelled
+    finally:
+        # delete file after cancelling, even if the check above failed
+        together.Files.delete(file_id)
+
+
+def test_checkpoints() -> None:
+    """Fetch the checkpoints of a completed fine-tune and check a list comes back.
+
+    Jobs are ordered by ``created_at`` and scanned from the end of that
+    order; the first one whose status is ``"completed"`` is used.
+    """
+    ft_list = together.Finetune.list()["data"]
+    ft_list.sort(key=lambda x: parse_timestamp(x["created_at"]))
+    ft_list.reverse()
+
+    ft_id = None
+    for item in ft_list:
+        # named candidate_id so the builtin `id` is not shadowed
+        candidate_id = item["id"]
+        if together.Finetune.get_job_status(candidate_id) == "completed":
+            ft_id = candidate_id
+            break
+
+    # fail with an explanation rather than a bare `assert False`
+    assert ft_id is not None, "No completed fine-tune job available to inspect"
+
+    response = together.Finetune.get_checkpoints(ft_id)
+
+    assert isinstance(response, list)
+
+
+# Allow running this file directly: check that an API key is set, then
+# hand this file to pytest.
+if __name__ == "__main__":
+    assert (
+        together.api_key
+    ), "No API key found, please run `export TOGETHER_API_KEY=<API_KEY>`"
+    pytest.main([__file__])

Original file line number	Diff line number	Diff line change
`@@ -35,6 +35,7 @@ quality = [`
`35`	`35`	`"types-tqdm>=4.65.0.0",`
`36`	`36`	`"types-tabulate==0.9.0.3"`
`37`	`37`	`]`
	`38`	`+tests = ["pytest==7.4.2"]`
`38`	`39`	`tokenize = ["transformers>=4.33.2"]`
`39`	`40`
`40`	`41`	`[project.urls]`