diff --git a/examples/mediatek/model_export_scripts/llama.py b/examples/mediatek/model_export_scripts/llama.py index 9c371f46ca6..980a502c5ae 100644 --- a/examples/mediatek/model_export_scripts/llama.py +++ b/examples/mediatek/model_export_scripts/llama.py @@ -369,7 +369,6 @@ def export_to_et_ir( alloc_graph_input=False, alloc_graph_output=False, ), - extract_constant_segment=True, extract_delegate_segments=True, ) ) diff --git a/examples/portable/scripts/export.py b/examples/portable/scripts/export.py index 7849fa06ccd..6055ecef0f3 100644 --- a/examples/portable/scripts/export.py +++ b/examples/portable/scripts/export.py @@ -62,7 +62,7 @@ def main() -> None: *MODEL_NAME_TO_MODEL[args.model_name] ) - backend_config = ExecutorchBackendConfig(extract_constant_segment=True) + backend_config = ExecutorchBackendConfig() if args.segment_alignment is not None: backend_config.segment_alignment = int(args.segment_alignment, 16) if ( diff --git a/exir/_serialize/_program.py b/exir/_serialize/_program.py index d22de71d1c2..24ee6bd21a3 100644 --- a/exir/_serialize/_program.py +++ b/exir/_serialize/_program.py @@ -347,7 +347,7 @@ def serialize_pte_binary( *, mutable_data: Optional[List[Buffer]] = None, extract_delegate_segments: bool = False, - extract_constant_segment: bool = False, + extract_constant_segment: bool = True, segment_alignment: int = 128, constant_tensor_alignment: Optional[int] = None, delegate_alignment: Optional[int] = None, diff --git a/exir/_serialize/test/test_program.py b/exir/_serialize/test/test_program.py index 09927ad9648..c4f4df0d0b2 100644 --- a/exir/_serialize/test/test_program.py +++ b/exir/_serialize/test/test_program.py @@ -169,7 +169,6 @@ def constant_segment_with_tensor_alignment( pte_data = bytes( serialize_pte_binary( program, - extract_constant_segment=True, segment_alignment=SEGMENT_ALIGNMENT, constant_tensor_alignment=constant_tensor_alignment, ) @@ -427,16 +426,12 @@ def test_round_trip_large_buffer_sizes(self) -> None: def test_round_trip_no_segments_and_no_header(self) -> None: """Tests that a Program serialized with extract_delegate_segments=True - or extract_constant_segment=True, when there are no segments, does not - contain an extended header, constant segment, or delegate segments. Confirm - that a Program remains the same after serializing and deserializing. + when there are no segments does not contain an extended header, + constant segment, or delegate segments. Confirm that a Program remains + the same after serializing and deserializing. """ program = get_test_program() - pte_data = bytes( - serialize_pte_binary( - program, extract_delegate_segments=True, extract_constant_segment=True - ) - ) + pte_data = bytes(serialize_pte_binary(program, extract_delegate_segments=True)) self.assertGreater(len(pte_data), 16) # File magic should be present at the expected offset. @@ -637,7 +632,6 @@ def test_constant_segment_tensor_alignment_non_power_of_2_fails(self) -> None: with self.assertRaises(ValueError): serialize_pte_binary( program, - extract_constant_segment=True, segment_alignment=SEGMENT_ALIGNMENT, constant_tensor_alignment=constant_tensor_alignment, ) @@ -662,7 +656,6 @@ def test_constant_segment_and_delegate_segment(self) -> None: serialize_pte_binary( program, extract_delegate_segments=True, - extract_constant_segment=True, segment_alignment=SEGMENT_ALIGNMENT, constant_tensor_alignment=CONSTANT_TENSOR_ALIGNMENT, ) diff --git a/extension/llm/export/builder.py b/extension/llm/export/builder.py index eccb3317e7f..4f5bab7bc02 100644 --- a/extension/llm/export/builder.py +++ b/extension/llm/export/builder.py @@ -261,7 +261,6 @@ def to_executorch(self) -> "LLMEdgeManager": assert self.edge_manager, "Need to run export_to_edge() first" self.export_program = self.edge_manager.to_executorch( ExecutorchBackendConfig( - extract_constant_segment=True, extract_delegate_segments=True, passes=[ QuantFusionPass(),