Skip to content

Commit fce44e5

Browse files
committed
compile create_block_mask
1 parent c59198f commit fce44e5

File tree

2 files changed

+2
-1
lines changed

2 files changed

+2
-1
lines changed

eval.py

-1
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,6 @@
15  15    torch._dynamo.config.automatic_dynamic_shapes = True
16  16    torch._inductor.config.triton.unique_kernel_names = True
17  17    torch._inductor.config.epilogue_fusion = False
18      - torch._inductor.config.triton.cudagraphs = True
19  18    torch._dynamo.config.cache_size_limit = 100000
20  19
21  20    from tokenizer import get_tokenizer

generate.py

+2
Original file line number | Diff line number | Diff line change
@@ -31,6 +31,8 @@ def device_sync(device):
31  31
32  32    default_device = 'cuda' if torch.cuda.is_available() else 'cpu'
33  33
    34  + create_block_mask = torch.compile(create_block_mask)
    35  +
34  36    # support running without installing as a package
35  37    wd = Path(__file__).parent.parent.resolve()
36  38    sys.path.append(str(wd))

0 commit comments

Comments
 (0)