diff --git a/.release-please-manifest.json b/.release-please-manifest.json
index cce9d1c..5660725 100644
--- a/.release-please-manifest.json
+++ b/.release-please-manifest.json
@@ -1,3 +1,3 @@
 {
-  ".": "1.7.0"
+  ".": "1.7.1"
 }
\ No newline at end of file
diff --git a/.stats.yml b/.stats.yml
index 603f57a..25ece8f 100644
--- a/.stats.yml
+++ b/.stats.yml
@@ -1,4 +1,4 @@
 configured_endpoints: 21
-openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/cas-parser%2Fcas-parser-d9763d006969b49a1473851069fdfa429eb13133b64103a62963bb70ddb22305.yml
-openapi_spec_hash: 6aee689b7a759b12c85c088c15e29bc0
+openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/cas-parser%2Fcas-parser-d868ff00b7b07f6b6802b00f22fad531a91a76bb219a634f3f90fe488bd499ba.yml
+openapi_spec_hash: 20e9f2fc31feee78878cdf56e46dab60
 config_hash: 5509bb7a961ae2e79114b24c381606d4
diff --git a/CHANGELOG.md b/CHANGELOG.md
index af49a3a..8bdd74b 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,19 @@
 # Changelog
 
+## 1.7.1 (2026-04-18)
+
+Full Changelog: [v1.7.0...v1.7.1](https://github.com/CASParser/cas-parser-python/compare/v1.7.0...v1.7.1)
+
+### Bug Fixes
+
+* **client:** preserve hardcoded query params when merging with user params ([3e5eea1](https://github.com/CASParser/cas-parser-python/commit/3e5eea1e92928bd98243022c607f6f15afa24d52))
+* ensure file data are only sent as 1 parameter ([4985a34](https://github.com/CASParser/cas-parser-python/commit/4985a349eee6f59007dfdf770c26deba75acc7dd))
+
+
+### Performance Improvements
+
+* **client:** optimize file structure copying in multipart requests ([1c854af](https://github.com/CASParser/cas-parser-python/commit/1c854af1baa2f1e702881692b65e9a85efffedd5))
+
 ## 1.7.0 (2026-03-27)
 
 Full Changelog: [v1.6.3...v1.7.0](https://github.com/CASParser/cas-parser-python/compare/v1.6.3...v1.7.0)
diff --git a/pyproject.toml b/pyproject.toml
index 724085d..ffa8d10 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "cas-parser-python"
-version = "1.7.0"
+version = "1.7.1"
 description = "The official Python library for the cas-parser API"
 dynamic = ["readme"]
 license = "Apache-2.0"
diff --git a/src/cas_parser/_base_client.py b/src/cas_parser/_base_client.py
index 5b130cf..33ae5fa 100644
--- a/src/cas_parser/_base_client.py
+++ b/src/cas_parser/_base_client.py
@@ -558,6 +558,10 @@ def _build_request(
                 files = cast(HttpxRequestFiles, ForceMultipartDict())
 
         prepared_url = self._prepare_url(options.url)
+        # preserve hard-coded query params from the url; entries in `params` win on key conflicts
+        if params and prepared_url.query:
+            params = {**dict(prepared_url.params.items()), **params}
+            prepared_url = prepared_url.copy_with(raw_path=prepared_url.raw_path.split(b"?", 1)[0])
         if "_" in prepared_url.host:
             # work around https://github.com/encode/httpx/discussions/2880
             kwargs["extensions"] = {"sni_hostname": prepared_url.host.replace("_", "-")}
diff --git a/src/cas_parser/_files.py b/src/cas_parser/_files.py
index cc14c14..0fdce17 100644
--- a/src/cas_parser/_files.py
+++ b/src/cas_parser/_files.py
@@ -3,8 +3,8 @@
 import io
 import os
 import pathlib
-from typing import overload
-from typing_extensions import TypeGuard
+from typing import Sequence, cast, overload
+from typing_extensions import TypeVar, TypeGuard
 
 import anyio
 
@@ -17,7 +17,9 @@
     HttpxFileContent,
     HttpxRequestFiles,
 )
-from ._utils import is_tuple_t, is_mapping_t, is_sequence_t
+from ._utils import is_list, is_mapping, is_tuple_t, is_mapping_t, is_sequence_t
+
+_T = TypeVar("_T")
 
 
 def is_base64_file_input(obj: object) -> TypeGuard[Base64FileInput]:
@@ -121,3 +123,51 @@ async def async_read_file_content(file: FileContent) -> HttpxFileContent:
         return await anyio.Path(file).read_bytes()
 
     return file
+
+
+def deepcopy_with_paths(item: _T, paths: Sequence[Sequence[str]]) -> _T:
+    """Copy only the dicts and lists that lie along the given paths.
+
+    Used to guard against mutation by extract_files without copying the entire structure.
+    Each path is a sequence of mapping keys, where "<array>" stands for every element of a
+    list; everything off the paths is returned by reference (as is `item` if `paths` is empty).
+
+    For example, given paths=[["foo", "files", "file"]] and the structure:
+        {
+            "foo": {
+                "bar": {"baz": {}},
+                "files": {"file": <content>}
+            }
+        }
+    The root dict, "foo", and "files" are copied (they lie on the path).
+    "bar" and "baz" are returned by reference (off the path).
+    """
+    return _deepcopy_with_paths(item, paths, 0)
+
+
+def _deepcopy_with_paths(item: _T, paths: Sequence[Sequence[str]], index: int) -> _T:
+    if not paths:  # empty `paths`: nothing is copied
+        return item
+    if is_mapping(item):
+        key_to_paths: dict[str, list[Sequence[str]]] = {}  # paths grouped by their segment at depth `index`
+        for path in paths:
+            if index < len(path):  # a path that ends before this depth selects nothing here
+                key_to_paths.setdefault(path[index], []).append(path)
+
+        # if no path continues through this mapping, it won't be mutated and copying it is redundant
+        if not key_to_paths:
+            return item
+
+        result = dict(item)  # shallow copy; only the values on a path are replaced below
+        for key, subpaths in key_to_paths.items():
+            if key in result:  # a path may name a key that this mapping does not have
+                result[key] = _deepcopy_with_paths(result[key], subpaths, index + 1)
+        return cast(_T, result)
+    if is_list(item):
+        array_paths = [path for path in paths if index < len(path) and path[index] == "<array>"]
+
+        # if no path expects a list here, nothing will be mutated inside it - return by reference
+        if not array_paths:
+            return cast(_T, item)
+        return cast(_T, [_deepcopy_with_paths(entry, array_paths, index + 1) for entry in item])
+    return item  # neither a mapping nor a list: returned by reference
diff --git a/src/cas_parser/_utils/__init__.py b/src/cas_parser/_utils/__init__.py
index 10cb66d..1c090e5 100644
--- a/src/cas_parser/_utils/__init__.py
+++ b/src/cas_parser/_utils/__init__.py
@@ -24,7 +24,6 @@
     coerce_integer as coerce_integer,
     file_from_path as file_from_path,
     strip_not_given as strip_not_given,
-    deepcopy_minimal as deepcopy_minimal,
     get_async_library as get_async_library,
     maybe_coerce_float as maybe_coerce_float,
     get_required_header as get_required_header,
diff --git a/src/cas_parser/_utils/_utils.py b/src/cas_parser/_utils/_utils.py
index eec7f4a..771859f 100644
--- a/src/cas_parser/_utils/_utils.py
+++ b/src/cas_parser/_utils/_utils.py
@@ -86,8 +86,9 @@ def _extract_items(
     index += 1
     if is_dict(obj):
         try:
-            # We are at the last entry in the path so we must remove the field
-            if (len(path)) == index:
+            # Remove the field when no further dict keys remain in the path,
+            # i.e. the rest is empty or consists only of "<array>" markers.
+            if all(p == "<array>" for p in path[index:]):
                 item = obj.pop(key)
             else:
                 item = obj[key]
@@ -176,21 +177,6 @@ def is_iterable(obj: object) -> TypeGuard[Iterable[object]]:
     return isinstance(obj, Iterable)
 
 
-def deepcopy_minimal(item: _T) -> _T:
-    """Minimal reimplementation of copy.deepcopy() that will only copy certain object types:
-
-    - mappings, e.g. `dict`
-    - list
-
-    This is done for performance reasons.
-    """
-    if is_mapping(item):
-        return cast(_T, {k: deepcopy_minimal(v) for k, v in item.items()})
-    if is_list(item):
-        return cast(_T, [deepcopy_minimal(entry) for entry in item])
-    return item
-
-
 # copied from https://github.com/Rapptz/RoboDanny
 def human_join(seq: Sequence[str], *, delim: str = ", ", final: str = "or") -> str:
     size = len(seq)
diff --git a/src/cas_parser/_version.py b/src/cas_parser/_version.py
index e314464..816fce9 100644
--- a/src/cas_parser/_version.py
+++ b/src/cas_parser/_version.py
@@ -1,4 +1,4 @@
 # File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
 
 __title__ = "cas_parser"
-__version__ = "1.7.0"  # x-release-please-version
+__version__ = "1.7.1"  # x-release-please-version
diff --git a/src/cas_parser/resources/cams_kfintech.py b/src/cas_parser/resources/cams_kfintech.py
index fb32699..c11c3a9 100644
--- a/src/cas_parser/resources/cams_kfintech.py
+++ b/src/cas_parser/resources/cams_kfintech.py
@@ -7,8 +7,9 @@
 import httpx
 
 from ..types import cams_kfintech_parse_params
+from .._files import deepcopy_with_paths
 from .._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
-from .._utils import extract_files, maybe_transform, deepcopy_minimal, async_maybe_transform
+from .._utils import extract_files, maybe_transform, async_maybe_transform
 from .._compat import cached_property
 from .._resource import SyncAPIResource, AsyncAPIResource
 from .._response import (
@@ -78,12 +79,13 @@ def parse(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
@@ -157,12 +159,13 @@ async def parse(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
diff --git a/src/cas_parser/resources/cdsl/cdsl.py b/src/cas_parser/resources/cdsl/cdsl.py
index d0c69b9..75e66b3 100644
--- a/src/cas_parser/resources/cdsl/cdsl.py
+++ b/src/cas_parser/resources/cdsl/cdsl.py
@@ -15,8 +15,9 @@
     AsyncFetchResourceWithStreamingResponse,
 )
 from ...types import cdsl_parse_pdf_params
+from ..._files import deepcopy_with_paths
 from ..._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
-from ..._utils import extract_files, maybe_transform, deepcopy_minimal, async_maybe_transform
+from ..._utils import extract_files, maybe_transform, async_maybe_transform
 from ..._compat import cached_property
 from ..._resource import SyncAPIResource, AsyncAPIResource
 from ..._response import (
@@ -94,12 +95,13 @@ def parse_pdf(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
@@ -181,12 +183,13 @@ async def parse_pdf(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
diff --git a/src/cas_parser/resources/contract_note.py b/src/cas_parser/resources/contract_note.py
index 7133be7..45e6464 100644
--- a/src/cas_parser/resources/contract_note.py
+++ b/src/cas_parser/resources/contract_note.py
@@ -8,8 +8,9 @@
 import httpx
 
 from ..types import contract_note_parse_params
+from .._files import deepcopy_with_paths
 from .._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
-from .._utils import extract_files, maybe_transform, deepcopy_minimal, async_maybe_transform
+from .._utils import extract_files, maybe_transform, async_maybe_transform
 from .._compat import cached_property
 from .._resource import SyncAPIResource, AsyncAPIResource
 from .._response import (
@@ -110,13 +111,14 @@ def parse(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "broker_type": broker_type,
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
@@ -221,13 +223,14 @@ async def parse(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "broker_type": broker_type,
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
diff --git a/src/cas_parser/resources/nsdl.py b/src/cas_parser/resources/nsdl.py
index 4312757..9e3f8d1 100644
--- a/src/cas_parser/resources/nsdl.py
+++ b/src/cas_parser/resources/nsdl.py
@@ -7,8 +7,9 @@
 import httpx
 
 from ..types import nsdl_parse_params
+from .._files import deepcopy_with_paths
 from .._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
-from .._utils import extract_files, maybe_transform, deepcopy_minimal, async_maybe_transform
+from .._utils import extract_files, maybe_transform, async_maybe_transform
 from .._compat import cached_property
 from .._resource import SyncAPIResource, AsyncAPIResource
 from .._response import (
@@ -78,12 +79,13 @@ def parse(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
@@ -157,12 +159,13 @@ async def parse(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
diff --git a/src/cas_parser/resources/smart.py b/src/cas_parser/resources/smart.py
index 0d85213..1cb95d5 100644
--- a/src/cas_parser/resources/smart.py
+++ b/src/cas_parser/resources/smart.py
@@ -7,8 +7,9 @@
 import httpx
 
 from ..types import smart_parse_cas_pdf_params
+from .._files import deepcopy_with_paths
 from .._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
-from .._utils import extract_files, maybe_transform, deepcopy_minimal, async_maybe_transform
+from .._utils import extract_files, maybe_transform, async_maybe_transform
 from .._compat import cached_property
 from .._resource import SyncAPIResource, AsyncAPIResource
 from .._response import (
@@ -79,12 +80,13 @@ def parse_cas_pdf(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
@@ -159,12 +161,13 @@ async def parse_cas_pdf(
 
           timeout: Override the client-level default timeout for this request, in seconds
         """
-        body = deepcopy_minimal(
+        body = deepcopy_with_paths(
             {
                 "password": password,
                 "pdf_file": pdf_file,
                 "pdf_url": pdf_url,
-            }
+            },
+            [["pdf_file"]],
         )
         files = extract_files(cast(Mapping[str, object], body), paths=[["pdf_file"]])
         if files:
diff --git a/tests/test_client.py b/tests/test_client.py
index 9e2377f..dd96b67 100644
--- a/tests/test_client.py
+++ b/tests/test_client.py
@@ -429,6 +429,30 @@ def test_default_query_option(self) -> None:
 
         client.close()
 
+    def test_hardcoded_query_params_in_url(self, client: CasParser) -> None:
+        request = client._build_request(FinalRequestOptions(method="get", url="/foo?beta=true"))
+        url = httpx.URL(request.url)
+        assert dict(url.params) == {"beta": "true"}
+
+        request = client._build_request(
+            FinalRequestOptions(
+                method="get",
+                url="/foo?beta=true",
+                params={"limit": "10", "page": "abc"},
+            )
+        )
+        url = httpx.URL(request.url)
+        assert dict(url.params) == {"beta": "true", "limit": "10", "page": "abc"}
+
+        request = client._build_request(
+            FinalRequestOptions(
+                method="get",
+                url="/files/a%2Fb?beta=true",
+                params={"limit": "10"},
+            )
+        )
+        assert request.url.raw_path == b"/files/a%2Fb?beta=true&limit=10"
+
     def test_request_extra_json(self, client: CasParser) -> None:
         request = client._build_request(
             FinalRequestOptions(
@@ -1320,6 +1344,30 @@ async def test_default_query_option(self) -> None:
 
         await client.close()
 
+    async def test_hardcoded_query_params_in_url(self, async_client: AsyncCasParser) -> None:
+        request = async_client._build_request(FinalRequestOptions(method="get", url="/foo?beta=true"))
+        url = httpx.URL(request.url)
+        assert dict(url.params) == {"beta": "true"}
+
+        request = async_client._build_request(
+            FinalRequestOptions(
+                method="get",
+                url="/foo?beta=true",
+                params={"limit": "10", "page": "abc"},
+            )
+        )
+        url = httpx.URL(request.url)
+        assert dict(url.params) == {"beta": "true", "limit": "10", "page": "abc"}
+
+        request = async_client._build_request(
+            FinalRequestOptions(
+                method="get",
+                url="/files/a%2Fb?beta=true",
+                params={"limit": "10"},
+            )
+        )
+        assert request.url.raw_path == b"/files/a%2Fb?beta=true&limit=10"
+
     def test_request_extra_json(self, client: CasParser) -> None:
         request = client._build_request(
             FinalRequestOptions(
diff --git a/tests/test_deepcopy.py b/tests/test_deepcopy.py
deleted file mode 100644
index c1e03c0..0000000
--- a/tests/test_deepcopy.py
+++ /dev/null
@@ -1,58 +0,0 @@
-from cas_parser._utils import deepcopy_minimal
-
-
-def assert_different_identities(obj1: object, obj2: object) -> None:
-    assert obj1 == obj2
-    assert id(obj1) != id(obj2)
-
-
-def test_simple_dict() -> None:
-    obj1 = {"foo": "bar"}
-    obj2 = deepcopy_minimal(obj1)
-    assert_different_identities(obj1, obj2)
-
-
-def test_nested_dict() -> None:
-    obj1 = {"foo": {"bar": True}}
-    obj2 = deepcopy_minimal(obj1)
-    assert_different_identities(obj1, obj2)
-    assert_different_identities(obj1["foo"], obj2["foo"])
-
-
-def test_complex_nested_dict() -> None:
-    obj1 = {"foo": {"bar": [{"hello": "world"}]}}
-    obj2 = deepcopy_minimal(obj1)
-    assert_different_identities(obj1, obj2)
-    assert_different_identities(obj1["foo"], obj2["foo"])
-    assert_different_identities(obj1["foo"]["bar"], obj2["foo"]["bar"])
-    assert_different_identities(obj1["foo"]["bar"][0], obj2["foo"]["bar"][0])
-
-
-def test_simple_list() -> None:
-    obj1 = ["a", "b", "c"]
-    obj2 = deepcopy_minimal(obj1)
-    assert_different_identities(obj1, obj2)
-
-
-def test_nested_list() -> None:
-    obj1 = ["a", [1, 2, 3]]
-    obj2 = deepcopy_minimal(obj1)
-    assert_different_identities(obj1, obj2)
-    assert_different_identities(obj1[1], obj2[1])
-
-
-class MyObject: ...
-
-
-def test_ignores_other_types() -> None:
-    # custom classes
-    my_obj = MyObject()
-    obj1 = {"foo": my_obj}
-    obj2 = deepcopy_minimal(obj1)
-    assert_different_identities(obj1, obj2)
-    assert obj1["foo"] is my_obj
-
-    # tuples
-    obj3 = ("a", "b")
-    obj4 = deepcopy_minimal(obj3)
-    assert obj3 is obj4
diff --git a/tests/test_extract_files.py b/tests/test_extract_files.py
index 37985fb..bb4d8bb 100644
--- a/tests/test_extract_files.py
+++ b/tests/test_extract_files.py
@@ -35,6 +35,15 @@ def test_multiple_files() -> None:
     assert query == {"documents": [{}, {}]}
 
 
+def test_top_level_file_array() -> None:
+    query = {"files": [b"file one", b"file two"], "title": "hello"}
+    assert extract_files(query, paths=[["files", "<array>"]]) == [
+        ("files[]", b"file one"),
+        ("files[]", b"file two"),
+    ]
+    assert query == {"title": "hello"}
+
+
 @pytest.mark.parametrize(
     "query,paths,expected",
     [
diff --git a/tests/test_files.py b/tests/test_files.py
index 1f448b8..117534b 100644
--- a/tests/test_files.py
+++ b/tests/test_files.py
@@ -4,7 +4,8 @@
 import pytest
 from dirty_equals import IsDict, IsList, IsBytes, IsTuple
 
-from cas_parser._files import to_httpx_files, async_to_httpx_files
+from cas_parser._files import to_httpx_files, deepcopy_with_paths, async_to_httpx_files
+from cas_parser._utils import extract_files
 
 readme_path = Path(__file__).parent.parent.joinpath("README.md")
 
@@ -49,3 +50,99 @@ def test_string_not_allowed() -> None:
                 "file": "foo",  # type: ignore
             }
         )
+
+
+def assert_different_identities(obj1: object, obj2: object) -> None:
+    assert obj1 == obj2
+    assert obj1 is not obj2
+
+
+class TestDeepcopyWithPaths:
+    def test_copies_top_level_dict(self) -> None:
+        original = {"file": b"data", "other": "value"}
+        result = deepcopy_with_paths(original, [["file"]])
+        assert_different_identities(result, original)
+
+    def test_file_value_is_same_reference(self) -> None:
+        file_bytes = b"contents"
+        original = {"file": file_bytes}
+        result = deepcopy_with_paths(original, [["file"]])
+        assert_different_identities(result, original)
+        assert result["file"] is file_bytes
+
+    def test_list_popped_wholesale(self) -> None:
+        files = [b"f1", b"f2"]
+        original = {"files": files, "title": "t"}
+        result = deepcopy_with_paths(original, [["files", "<array>"]])
+        assert_different_identities(result, original)
+        result_files = result["files"]
+        assert isinstance(result_files, list)
+        assert_different_identities(result_files, files)
+
+    def test_nested_array_path_copies_list_and_elements(self) -> None:
+        elem1 = {"file": b"f1", "extra": 1}
+        elem2 = {"file": b"f2", "extra": 2}
+        original = {"items": [elem1, elem2]}
+        result = deepcopy_with_paths(original, [["items", "<array>", "file"]])
+        assert_different_identities(result, original)
+        result_items = result["items"]
+        assert isinstance(result_items, list)
+        assert_different_identities(result_items, original["items"])
+        assert_different_identities(result_items[0], elem1)
+        assert_different_identities(result_items[1], elem2)
+
+    def test_empty_paths_returns_same_object(self) -> None:
+        original = {"foo": "bar"}
+        result = deepcopy_with_paths(original, [])
+        assert result is original
+
+    def test_multiple_paths(self) -> None:
+        f1 = b"file1"
+        f2 = b"file2"
+        original = {"a": f1, "b": f2, "c": "unchanged"}
+        result = deepcopy_with_paths(original, [["a"], ["b"]])
+        assert_different_identities(result, original)
+        assert result["a"] is f1
+        assert result["b"] is f2
+        assert result["c"] is original["c"]
+
+    def test_extract_files_does_not_mutate_original_top_level(self) -> None:
+        file_bytes = b"contents"
+        original = {"file": file_bytes, "other": "value"}
+
+        copied = deepcopy_with_paths(original, [["file"]])
+        extracted = extract_files(copied, paths=[["file"]])
+
+        assert extracted == [("file", file_bytes)]
+        assert original == {"file": file_bytes, "other": "value"}
+        assert copied == {"other": "value"}
+
+    def test_extract_files_does_not_mutate_original_nested_array_path(self) -> None:
+        file1 = b"f1"
+        file2 = b"f2"
+        original = {
+            "items": [
+                {"file": file1, "extra": 1},
+                {"file": file2, "extra": 2},
+            ],
+            "title": "example",
+        }
+
+        copied = deepcopy_with_paths(original, [["items", "<array>", "file"]])
+        extracted = extract_files(copied, paths=[["items", "<array>", "file"]])
+
+        assert extracted == [("items[][file]", file1), ("items[][file]", file2)]
+        assert original == {
+            "items": [
+                {"file": file1, "extra": 1},
+                {"file": file2, "extra": 2},
+            ],
+            "title": "example",
+        }
+        assert copied == {
+            "items": [
+                {"extra": 1},
+                {"extra": 2},
+            ],
+            "title": "example",
+        }