diff --git a/backends/qualcomm/debugger/utils.py b/backends/qualcomm/debugger/utils.py index b1d3ea84900..d6b91c83996 100644 --- a/backends/qualcomm/debugger/utils.py +++ b/backends/qualcomm/debugger/utils.py @@ -183,11 +183,11 @@ def draw(self): cleanup=not self.dot_string, ) source_file = os.path.join(temp_directory, f"{self.filename}.svg") - destination_file = os.path.join(".", f"{self.filename}.svg") + destination_file = os.path.join(self.directory, f"{self.filename}.svg") shutil.move(source_file, destination_file) if self.dot_string: dot_file = os.path.join(temp_directory, f"{self.filename}") - dot_dest_file = os.path.join(".", f"{self.filename}.dot") + dot_dest_file = os.path.join(self.directory, f"{self.filename}.dot") shutil.move(dot_file, dot_dest_file) diff --git a/examples/qualcomm/oss_scripts/llama/__init__.py b/examples/qualcomm/oss_scripts/llama/__init__.py index 99b0739f1f0..5908fcf32a6 100644 --- a/examples/qualcomm/oss_scripts/llama/__init__.py +++ b/examples/qualcomm/oss_scripts/llama/__init__.py @@ -501,6 +501,7 @@ class Smollm3_3B(LLMModelConfig): ptq = QuantDtype.use_16a4w_block group_size = 32 masked_softmax = True + seq_mse_candidates = 0 r1 = False r2 = False r3 = False