diff --git a/.github/workflows/config/changelog-config.json b/.github/workflows/config/changelog-config.json index a845104f..0b78b096 100644 --- a/.github/workflows/config/changelog-config.json +++ b/.github/workflows/config/changelog-config.json @@ -1,42 +1,42 @@ { "categories": [ { - "title": "## Executors\n\n
<details><summary>Changelog</summary>", + "title": "## Executors\n\n", "labels": ["executor", "local", "slurm", "dgxcloud", "lepton", "skypilot", "docker"], "exclude_labels": ["ignore"] }, { - "title": "</details>
\n\n## Ray Integration\n\n
<details><summary>Changelog</summary>", + "title": "\n## Ray Integration\n\n", "labels": ["ray", "kuberay", "ray-slurm"], "exclude_labels": ["ignore"] }, { - "title": "</details>
\n\n## CLI & Configuration\n\n
<details><summary>Changelog</summary>", + "title": "\n## CLI & Configuration\n\n", "labels": ["cli", "config", "parsing"], "exclude_labels": ["ignore"] }, { - "title": "</details>
\n\n## Experiment & Job Management\n\n
<details><summary>Changelog</summary>", + "title": "\n## Experiment & Job Management\n\n", "labels": ["experiment", "job", "task"], "exclude_labels": ["ignore"] }, { - "title": "</details>
\n\n## Packaging & Deployment\n\n
<details><summary>Changelog</summary>", + "title": "\n## Packaging & Deployment\n\n", "labels": ["packaging", "deployment"], "exclude_labels": ["ignore"] }, { - "title": "</details>
\n\n## Documentation\n\n
<details><summary>Changelog</summary>", + "title": "\n## Documentation\n\n", "labels": ["docs", "documentation"], "exclude_labels": ["ignore"] }, { - "title": "</details>
\n\n## CI/CD\n\n
<details><summary>Changelog</summary>", + "title": "\n## CI/CD\n\n", "labels": ["ci", "github-actions", "workflow"], "exclude_labels": ["ignore"] }, { - "title": "</details>
\n\n## Bug Fixes\n\n
<details><summary>Changelog</summary>", + "title": "\n## Bug Fixes\n\n", "labels": ["bug", "bugfix", "fix"], "exclude_labels": ["ignore"] } @@ -46,7 +46,7 @@ "skip-changelog" ], "sort": "ASC", - "template": "\n${{CHANGELOG}}</details>
\n\n## Others\n\n
<details><summary>Changelog</summary>\n\n${{UNCATEGORIZED}}\n</details>
\n", + "template": "\n${{CHANGELOG}}\n## Others\n\n${{UNCATEGORIZED}}\n", "pr_template": "- ${{TITLE}} [#${{NUMBER}}](${{URL}})", "empty_template": "- No changes in this release", "label_extractor": [ diff --git a/CHANGELOG.md b/CHANGELOG.md index 0d389dd0..5c18eca5 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,6 +1,63 @@ # Changelog +## NVIDIA Nemo Run 0.6.0 + +### Detailed Changelogs: + +## Executors + +- Added Pre-Launch Commands Support to LeptonExecutor [#312](https://github.com/NVIDIA-NeMo/Run/pull/312) +- Remove breaking torchrun config for single-node runs [#292](https://github.com/NVIDIA-NeMo/Run/pull/292) +- Upgrade skypilot to v0.10.0, introduce network_tier [#297](https://github.com/NVIDIA-NeMo/Run/pull/297) +- Fixes for multi-node execution with torchrun + LocalExecutor [#251](https://github.com/NVIDIA-NeMo/Run/pull/251) +- Add option to specify --container-env for srun [#293](https://github.com/NVIDIA-NeMo/Run/pull/293) +- Fix skypilot archive mount bug [#288](https://github.com/NVIDIA-NeMo/Run/pull/288) +- finetune on dgxcloud with nemo-run and deploy on bedrock example [#286](https://github.com/NVIDIA-NeMo/Run/pull/286) + +## Ray Integration + +- Add nsys patch in ray sub template [#318](https://github.com/NVIDIA-NeMo/Run/pull/318) +- Add logs dir to container mount for ray slurm [#287](https://github.com/NVIDIA-NeMo/Run/pull/287) +- Allow customizing folder for SlurmRayRequest [#281](https://github.com/NVIDIA-NeMo/Run/pull/281) + +## CLI & Configuration + +## Experiment & Job Management + +- Use thread pool for status, run methods inside experiment + other fixes [#295](https://github.com/NVIDIA-NeMo/Run/pull/295) + +## Packaging & Deployment + +- Correctly append tar files for packaging [#317](https://github.com/NVIDIA-NeMo/Run/pull/317) + +## Documentation + +- Create CHANGELOG.md [#314](https://github.com/NVIDIA-NeMo/Run/pull/314) +- docs: Fixing doc build issue [#290](https://github.com/NVIDIA-NeMo/Run/pull/290) +- fix docs tutorial links 
and add intro to guides/index.md [#285](https://github.com/NVIDIA-NeMo/Run/pull/285) +- README [#277](https://github.com/NVIDIA-NeMo/Run/pull/277) + +## CI/CD + +- changelog workflow [#315](https://github.com/NVIDIA-NeMo/Run/pull/315) +- Update release.yml [#306](https://github.com/NVIDIA-NeMo/Run/pull/306) +- ci(fix): Use GITHUB_TOKEN for community bot [#302](https://github.com/NVIDIA-NeMo/Run/pull/302) +- ci: Add community-bot [#300](https://github.com/NVIDIA-NeMo/Run/pull/300) + +## Bug Fixes + +- [Bugfix] Adding a check for name length [#273](https://github.com/NVIDIA-NeMo/Run/pull/273) +- misc fixes [#280](https://github.com/NVIDIA-NeMo/Run/pull/280) +- adding fix for lowercase and name length k8s requirements [#274](https://github.com/NVIDIA-NeMo/Run/pull/274) + +## Others + +- Specify nodes for gpu metrics collection and split data to each rank [#320](https://github.com/NVIDIA-NeMo/Run/pull/320) +- Apply '_enable_goodbye_message' check to both goodbye messages. [#319](https://github.com/NVIDIA-NeMo/Run/pull/319) +- Update refs [#278](https://github.com/NVIDIA-NeMo/Run/pull/278) +- chore: Bump to version 0.6.0rc0.dev0 [#272](https://github.com/NVIDIA-NeMo/Run/pull/272) + ## NVIDIA Nemo Run 0.5.0