diff --git a/.github/workflows/run-readme-pr-macos.yml b/.github/workflows/run-readme-pr-macos.yml index e3f8df402..522fd9963 100644 --- a/.github/workflows/run-readme-pr-macos.yml +++ b/.github/workflows/run-readme-pr-macos.yml @@ -6,7 +6,7 @@ on: - main workflow_dispatch: jobs: - test-mps: + test-readme-macos: runs-on: macos-14-xlarge steps: - name: Checkout code diff --git a/.github/workflows/run-readme-pr.yml b/.github/workflows/run-readme-pr.yml index c59bdb3b8..cebfa1650 100644 --- a/.github/workflows/run-readme-pr.yml +++ b/.github/workflows/run-readme-pr.yml @@ -8,7 +8,7 @@ on: workflow_dispatch: jobs: - test-readme: + test-readme-any: uses: pytorch/test-infra/.github/workflows/linux_job.yml@main with: runner: linux.g5.4xlarge.nvidia.gpu diff --git a/README.md b/README.md index 11d825600..69e5d96fb 100644 --- a/README.md +++ b/README.md @@ -168,10 +168,12 @@ To build the runner binary on your Mac or Linux: scripts/build_native.sh aoti ``` +[skip default]: begin Execute ```bash cmake-out/aoti_run exportedModels/llama3.so -z ~/.torchchat/model-cache/meta-llama/Meta-Llama-3-8B-Instruct/tokenizer.model -l 3 -i "Once upon a time" ``` +[skip default]: end ## Mobile Execution