Skip to content

Commit c1fa677

Browse files
committed
Merge branch 'feat/blockwise_fp8_quant_triton_gemm_ker' of github.com:Degnel/ao into feat/blockwise_fp8_quant_triton_gemm_ker
2 parents f51a142 + affaf0a commit c1fa677

File tree

184 files changed

+6255
-10624
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

184 files changed

+6255
-10624
lines changed

.github/workflows/build-wheels_m1.yml

-74
This file was deleted.

.github/workflows/build_wheels_aarch64_linux.yml

-87
This file was deleted.

.github/workflows/build_wheels_linux.yml

+2-2
Original file line numberDiff line numberDiff line change
@@ -30,8 +30,8 @@ jobs:
3030
with-cuda: enable
3131
with-rocm: enable
3232
with-xpu: enable
33-
# please note: excluding 3.13t for aarch64 builds for now
34-
python-versions: '["3.9", "3.10", "3.11", "3.12", "3.13"]'
33+
# Note: if free-threaded python is required add py3.13t here
34+
python-versions: '["3.9"]'
3535

3636
build:
3737
needs: generate-matrix

.github/workflows/build_wheels_windows.yml

-97
This file was deleted.

.github/workflows/float8nocompile_test.yaml

-2
Original file line numberDiff line numberDiff line change
@@ -7,14 +7,12 @@ on:
77
- 'gh/**'
88
paths:
99
- 'torchao/prototype/float8nocompile/**'
10-
- '!torchao/prototype/float8nocompile/**'
1110
pull_request:
1211
branches:
1312
- main
1413
- 'gh/**'
1514
paths:
1615
- 'torchao/prototype/float8nocompile/**'
17-
- '!torchao/prototype/float8nocompile/**'
1816

1917
concurrency:
2018
group: floatnocompile_test-${{ github.workflow }}-${{ github.ref == 'refs/heads/main' && github.run_number || github.ref }}

.github/workflows/torchao_experimental_test.yml

+64-2
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ on:
1111
- 'gh/**'
1212

1313
jobs:
14-
test:
14+
test-cpu-ops:
1515
strategy:
1616
matrix:
1717
runner: [macos-14]
@@ -33,9 +33,13 @@ jobs:
3333
- name: Install requirements
3434
run: |
3535
conda activate venv
36-
pip install --extra-index-url "https://download.pytorch.org/whl/nightly/cpu" torch=="2.6.0.dev20250104"
36+
# Install executorch first because it installs its own version
37+
# of torch and torchao, which we do not want to use
38+
pip install executorch
39+
pip install torch --index-url "https://download.pytorch.org/whl/nightly/cpu" --force-reinstall
3740
pip install numpy
3841
pip install pytest
42+
pip install parameterized
3943
USE_CPP=1 pip install .
4044
- name: Run python tests
4145
run: |
@@ -56,3 +60,61 @@ jobs:
5660
sh build_and_run_tests.sh
5761
rm -rf /tmp/cmake-out
5862
popd
63+
- name: ET ops build
64+
run: |
65+
conda activate venv
66+
pushd torchao/experimental
67+
sh build_torchao_ops.sh executorch
68+
popd
69+
70+
test-mps-ops:
71+
strategy:
72+
matrix:
73+
runner: [macos-m1-stable]
74+
runs-on: ${{matrix.runner}}
75+
steps:
76+
- name: Print machine info
77+
run: |
78+
uname -a
79+
if [ $(uname -s) == Darwin ]; then
80+
sysctl machdep.cpu.brand_string
81+
sysctl machdep.cpu.core_count
82+
fi
83+
- name: Checkout repo
84+
uses: actions/checkout@v3
85+
with:
86+
submodules: true
87+
- name: Create conda env
88+
run: |
89+
conda create -yn test-mps-ops-env python=3.11
90+
- name: Activate conda env
91+
run: |
92+
source activate base
93+
conda activate test-mps-ops-env
94+
- name: Install torch
95+
run: |
96+
pip install torch --index-url "https://download.pytorch.org/whl/nightly/cpu"
97+
- name: Print torch version
98+
run: |
99+
python -c "import torch; print(torch.__version__)"
100+
- name: Install requirements
101+
run: |
102+
pip install cmake
103+
pip install parameterized
104+
pip install pyyaml
105+
pip install numpy
106+
- name: Print pip freeze
107+
run: |
108+
pip freeze
109+
- name: Print current directory
110+
run: |
111+
python -c "import os; print(os.getcwd())"
112+
- name: Build ao with experimental mps ops
113+
run: |
114+
USE_CPP=1 TORCHAO_BUILD_EXPERIMENTAL_MPS=1 pip install .
115+
- name: Run mps tests
116+
run: |
117+
pushd torchao/experimental/ops/mps/test
118+
python test_lowbit.py
119+
python test_quantizer.py
120+
popd

.gitignore

+1
Original file line numberDiff line numberDiff line change
@@ -375,3 +375,4 @@ checkpoints/
375375

376376
# Experimental
377377
torchao/experimental/cmake-out
378+
torchao/experimental/deps

0 commit comments

Comments
 (0)