Skip to content

Commit 611fbe8

Browse files
committed
Merge branch 'zenflow_zero1_2' of github.com:Antlera/DeepSpeed into zenflow_zero1_2
2 parents 7c4e96f + 5976c49 commit 611fbe8

File tree

2 files changed

+3
-2
lines changed

2 files changed

+3
-2
lines changed

deepspeed/compile/profilers/graph_profile.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,7 @@ def run(self, *args) -> Any:
9696
args: inputs to the graph. Tensors in the inputs must be real tensors, not fake tensors. args can contain ds parameters.
9797
returns: The output of the graph. Tensors in the output are real tensors.
9898
"""
99+
return_val = None
99100
try:
100101
assert _all_real_if_tensor(args), "Inputs must be real tensors"
101102
self.nz3.enable_profiling(True)
@@ -242,6 +243,7 @@ def __init__(self, gm: GraphModule, debug_log=False):
242243
self.debug_log = debug_log
243244

244245
def run(self, *args) -> Any:
246+
return_val = None
245247
try:
246248
assert _all_real_if_tensor(args), "Inputs must be real tensors"
247249
self.nz3.enable_profiling(True)

op_builder/builder.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -83,8 +83,7 @@ def get_default_compute_capabilities():
8383
cuda_minor_mismatch_ok = {
8484
10: ["10.0", "10.1", "10.2"],
8585
11: ["11.0", "11.1", "11.2", "11.3", "11.4", "11.5", "11.6", "11.7", "11.8"],
86-
12: ["12.0", "12.1", "12.2", "12.3", "12.4", "12.5", "12.6",
87-
"12.8"], # There does not appear to be a CUDA Toolkit 12.7
86+
12: ["12.0", "12.1", "12.2", "12.3", "12.4", "12.5", "12.6", "12.8", "12.9"], # There is no CUDATk 12.7
8887
}
8988

9089

0 commit comments

Comments
 (0)