pytorch · metascroy · Dec 23, 2024 · Dec 24, 2024 · Dec 24, 2024 · Dec 24, 2024
diff --git a/.github/workflows/apple-perf.yml b/.github/workflows/apple-perf.yml
@@ -329,6 +329,9 @@ jobs:
       script: |
         set -eux
 
+        echo "Setting XCode version"
+        sudo xcode-select -switch /Applications/Xcode_16.app
+
         echo "::group::Setting up CI environment"
         .ci/scripts/setup-conda.sh
 

diff --git a/extension/benchmark/apple/Benchmark/README.md b/extension/benchmark/apple/Benchmark/README.md
@@ -72,6 +72,15 @@ kernels_portable.xcframework
 kernels_quantized.xcframework
 ```
 
+#### MLState
+The prebuilt frameworks do not work with CoreML models that use MLState, which is used by LLMs exported for iOS 18. When executing such a `.pte` file, you will see an error like:
+
+```
+The input feature for X must be an MLState, but it was not.
+```
+
+If you encounter this issue, build the frameworks locally (option 2) using **Xcode 16.0** or later.
+
 ## Adding Models and Resources
 
 Place your exported model files (`.pte`) and any other resources (e.g., `tokenizer.bin`) into the `extension/benchmark/apple/Benchmark/Resources` directory:

diff --git a/extension/llm/export/partitioner_lib.py b/extension/llm/export/partitioner_lib.py
@@ -158,11 +158,7 @@ def _validate_ios_version() -> None:
         op_linear_quantizer_config=op_linear_quantizer_config,
     )
 
-    # ExecuTorch does not build CoreML delegate runtime to handle state
-    # when using OSS scripts, so we define take_over_mutable_buffer = False,
-    # even when target is iOS18
-    # take_over_mutable_buffer = minimum_deployment_target >= ct.target.iOS18
-    take_over_mutable_buffer = False
+    take_over_mutable_buffer = minimum_deployment_target >= ct.target.iOS18
     return CoreMLPartitioner(  # pyre-fixme[16]
         compile_specs=compile_specs,
         take_over_mutable_buffer=take_over_mutable_buffer,